libhb/stream.c

   1 /* $Id$
   2
   3    This file is part of the HandBrake source code.
   4    Homepage: <http://handbrake.m0k.org/>.
   5    It may be used under the terms of the GNU General Public License. */
   6
   7 #include "hb.h"
   8 #include "lang.h"
   9 #include "a52dec/a52.h"
  10
  11 #include <string.h>
  12
  13 #define min(a, b) a < b ? a : b
  14
  15 typedef enum {
  16     hb_stream_type_unknown = 0,
  17     hb_stream_type_transport,
  18     hb_stream_type_program
  19 } hb_stream_type_t;
  20
  21 #define kMaxNumberVideoPIDS 1
  22 #define kMaxNumberAudioPIDS 15
  23 #define kMaxNumberDecodeStreams (kMaxNumberVideoPIDS+kMaxNumberAudioPIDS)
  24 #define kMaxNumberPMTStreams 32
  25
  26
  27 struct hb_stream_s
  28 {
  29     int     frames;             /* video frames so far */
  30     int     errors;             /* total errors so far */
  31     int     last_error_frame;   /* frame # at last error message */
  32     int     last_error_count;   /* # errors at last error message */
  33
  34     int64_t ts_lastpcr;         /* the last pcr we found in the TS stream */
  35     int64_t ts_nextpcr;         /* the next pcr to put in a PS packet */
  36
  37     uint8_t *ts_buf[kMaxNumberDecodeStreams];
  38     int     ts_pos[kMaxNumberDecodeStreams];
  39     int8_t  ts_foundfirst[kMaxNumberDecodeStreams];
  40     int8_t  ts_skipbad[kMaxNumberDecodeStreams];
  41     int8_t  ts_streamcont[kMaxNumberDecodeStreams];
  42     int8_t  ts_start[kMaxNumberDecodeStreams];
  43
  44     uint8_t *fwrite_buf;        /* PS buffer (set by hb_ts_stream_decode) */
  45     uint8_t *fwrite_buf_orig;   /* PS buffer start (set by hb_ts_stream_decode) */
  46
  47     /*
  48      * Stuff before this point is dynamic state updated as we read the
  49      * stream. Stuff after this point is stream description state that
  50      * we learn during the initial scan but cache so it can be
  51      * reused during the conversion read.
  52      */
  53     int16_t ts_video_pids[kMaxNumberVideoPIDS];
  54     int16_t ts_audio_pids[kMaxNumberAudioPIDS];
  55
  56     uint8_t ts_number_video_pids;
  57     uint8_t ts_number_audio_pids;
  58
  59     uint8_t ts_streamid[kMaxNumberDecodeStreams];
  60     uint8_t ts_audio_stream_type[kMaxNumberDecodeStreams];
  61
  62     char    *path;
  63     FILE    *file_handle;
  64     hb_stream_type_t stream_type;
  65     int     opentype;
  66
  67     struct {
  68         int lang_code;
  69         int flags;
  70         int rate;
  71         int bitrate;
  72     } a52_info[kMaxNumberAudioPIDS];
  73
  74     struct
  75     {
  76         unsigned short program_number;
  77         unsigned short program_map_PID;
  78     } pat_info[kMaxNumberPMTStreams];
  79     int     ts_number_pat_entries;
  80
  81     struct
  82     {
  83         int reading;
  84         unsigned char *tablebuf;
  85         unsigned int tablepos;
  86         unsigned char current_continuity_counter;
  87
  88         int section_length;
  89         int program_number;
  90         unsigned int PCR_PID;
  91         int program_info_length;
  92         unsigned char *progam_info_descriptor_data;
  93         struct
  94         {
  95             unsigned char stream_type;
  96             unsigned short elementary_PID;
  97             unsigned short ES_info_length;
  98             unsigned char *es_info_descriptor_data;
  99         } pmt_stream_info[kMaxNumberPMTStreams];
 100     } pmt_info;
 101 };
 102
 103 /***********************************************************************
 104  * Local prototypes
 105  **********************************************************************/
 106 static void hb_stream_duration(hb_stream_t *stream, hb_title_t *inTitle);
 107 static void hb_ts_stream_init(hb_stream_t *stream);
 108 static void hb_ts_stream_find_pids(hb_stream_t *stream);
 109 static int hb_ts_stream_decode(hb_stream_t *stream, uint8_t *obuf);
 110 static void hb_ts_stream_reset(hb_stream_t *stream);
 111 static hb_audio_t *hb_ts_stream_set_audio_id_and_codec(hb_stream_t *stream,
 112                                                        int aud_pid_index);
 113 static void hb_ps_stream_find_audio_ids(hb_stream_t *stream, hb_title_t *title);
 114 static off_t align_to_next_packet(FILE* f);
 115
 116 /*
 117  * streams have a bunch of state that's learned during the scan. We don't
 118  * want to throw away the state when scan does a close then relearn
 119  * everything when reader does an open. So we save the stream state on
 120  * the close following a scan and reuse it when 'reader' does an open.
 121  */
 122 static hb_list_t *stream_state_list;
 123
 124 static hb_stream_t *hb_stream_lookup( const char *path )
 125 {
 126     if ( stream_state_list == NULL )
 127         return NULL;
 128
 129     hb_stream_t *ss;
 130     int i = 0;
 131
 132     while ( ( ss = hb_list_item( stream_state_list, i++ ) ) != NULL )
 133     {
 134         if ( strcmp( path, ss->path ) == 0 )
 135         {
 136             break;
 137         }
 138     }
 139     return ss;
 140 }
 141
 142 static void hb_stream_state_delete( hb_stream_t *ss )
 143 {
 144     hb_list_rem( stream_state_list, ss );
 145     free( ss->path );
 146     free( ss );
 147 }
 148
 149 static inline int check_ps_sync(const uint8_t *buf)
 150 {
 151     // a legal MPEG program stream must start with a Pack header in the
 152     // first four bytes.
 153     return (buf[0] == 0x00) && (buf[1] == 0x00) &&
 154            (buf[2] == 0x01) && (buf[3] == 0xba);
 155 }
 156
 157 static inline int check_ts_sync(const uint8_t *buf)
 158 {
 159     // must have initial sync byte, no scrambling & a legal adaptation ctrl
 160     return (buf[0] == 0x47) && ((buf[3] >> 6) == 0) && ((buf[3] >> 4) > 0);
 161 }
 162
 163 static inline int have_ts_sync(const uint8_t *buf)
 164 {
 165     return check_ts_sync(&buf[0*188]) && check_ts_sync(&buf[1*188]) &&
 166            check_ts_sync(&buf[2*188]) && check_ts_sync(&buf[3*188]) &&
 167            check_ts_sync(&buf[4*188]) && check_ts_sync(&buf[5*188]) &&
 168            check_ts_sync(&buf[6*188]) && check_ts_sync(&buf[7*188]);
 169 }
 170
 171 static int hb_stream_check_for_ts(const uint8_t *buf)
 172 {
 173     // transport streams should have a sync byte every 188 bytes.
 174     // search the first KB of buf looking for at least 8 consecutive
 175     // correctly located sync patterns.
 176     int offset = 0;
 177
 178     for ( offset = 0; offset < 1024; ++offset )
 179     {
 180         if ( have_ts_sync( &buf[offset]) )
 181             return 1;
 182     }
 183     return 0;
 184 }
 185
 186 static int hb_stream_check_for_ps(const uint8_t *buf)
 187 {
 188     // program streams should have a Pack header every 2048 bytes.
 189     // check that we have 4 of these.
 190     return check_ps_sync(&buf[0*2048]) && check_ps_sync(&buf[1*2048]) &&
 191            check_ps_sync(&buf[2*2048]) && check_ps_sync(&buf[3*2048]);
 192 }
 193
 194 static int hb_stream_get_type(hb_stream_t *stream)
 195 {
 196     uint8_t buf[2048*4];
 197
 198     if ( fread(buf, 1, sizeof(buf), stream->file_handle) == sizeof(buf) )
 199     {
 200         if ( hb_stream_check_for_ts(buf) != 0 )
 201         {
 202             hb_log("file is MPEG Transport Stream");
 203             stream->stream_type = hb_stream_type_transport;
 204             hb_ts_stream_init(stream);
 205             return 1;
 206         }
 207         if ( hb_stream_check_for_ps(buf) != 0 )
 208         {
 209             hb_log("file is MPEG Program Stream");
 210             stream->stream_type = hb_stream_type_program;
 211             return 1;
 212         }
 213     }
 214     return 0;
 215 }
 216
 217 static void hb_stream_delete_dynamic( hb_stream_t *d )
 218 {
 219     if( d->file_handle )
 220     {
 221         fclose( d->file_handle );
 222                 d->file_handle = NULL;
 223     }
 224
 225         int i=0;
 226
 227         for (i = 0; i < kMaxNumberDecodeStreams; i++)
 228         {
 229                 if (d->ts_buf[i])
 230                 {
 231                         free(d->ts_buf[i]);
 232                         d->ts_buf[i] = NULL;
 233                 }
 234         }
 235 }
 236
 237 static void hb_stream_delete( hb_stream_t *d )
 238 {
 239     hb_stream_delete_dynamic( d );
 240     free( d->path );
 241     free( d );
 242 }
 243
 244 /***********************************************************************
 245  * hb_stream_open
 246  ***********************************************************************
 247  *
 248  **********************************************************************/
 249 hb_stream_t * hb_stream_open( char *path, int opentype )
 250 {
 251
 252     FILE *f = fopen( path, "r" );
 253     if ( f == NULL )
 254     {
 255         hb_log( "hb_stream_open: open %s failed", path );
 256         return NULL;
 257     }
 258
 259     hb_stream_t *d = calloc( sizeof( hb_stream_t ), 1 );
 260     if ( d == NULL )
 261     {
 262         fclose( f );
 263         hb_log( "hb_stream_open: can't allocate space for %s stream state", path );
 264         return NULL;
 265     }
 266
 267     /*
 268      * if we're opening the stream to read & convert, we need
 269      * the state we saved when we scanned the stream. if we're
 270      * opening the stream to scan it we want to rebuild the state
 271      * (even if we have saved state, the stream may have changed).
 272      */
 273     hb_stream_t *ss = hb_stream_lookup( path );
 274     if ( opentype == 1 )
 275     {
 276         /* opening to read - we must have saved state */
 277         if ( ss == NULL )
 278         {
 279             hb_log( "hb_stream_open: error: re-opening %s but no scan state", path );
 280             fclose( f );
 281             free( d );
 282             return NULL;
 283         }
 284         /*
 285          * copy the saved state since we might be encoding the same stream
 286          * multiple times.
 287          */
 288         memcpy( d, ss, sizeof(*d) );
 289         d->file_handle = f;
 290         d->opentype = opentype;
 291         d->path = strdup( path );
 292
 293         if ( d->stream_type == hb_stream_type_transport )
 294         {
 295             int i = 0;
 296             for ( ; i < d->ts_number_video_pids + d->ts_number_audio_pids; i++)
 297             {
 298                 d->ts_buf[i] = malloc( HB_DVD_READ_BUFFER_SIZE );
 299             }
 300             hb_stream_seek( d, 0. );
 301         }
 302         return d;
 303     }
 304
 305     /*
 306      * opening for scan - delete any saved state then (re)scan the stream.
 307      * If it's something we can deal with (MPEG2 PS or TS) return a stream
 308      * reference structure & null otherwise.
 309      */
 310
 311     if ( ss != NULL )
 312     {
 313         hb_stream_state_delete( ss );
 314     }
 315     d->file_handle = f;
 316     d->opentype = opentype;
 317     d->path = strdup( path );
 318     if (d->path != NULL &&  hb_stream_get_type( d ) != 0 )
 319     {
 320         return d;
 321     }
 322     fclose( d->file_handle );
 323     if (d->path)
 324     {
 325         free( d->path );
 326     }
 327     hb_log( "hb_stream_open: open %s failed", path );
 328     free( d );
 329     return NULL;
 330 }
 331
 332 /***********************************************************************
 333  * hb_stream_close
 334  ***********************************************************************
 335  * Closes and frees everything
 336  **********************************************************************/
 337 void hb_stream_close( hb_stream_t ** _d )
 338 {
 339     hb_stream_t *stream = * _d;
 340     if ( stream->frames )
 341     {
 342         hb_log( "stream: %d good frames, %d errors (%.0f%%)", stream->frames,
 343                 stream->errors, (double)stream->errors * 100. /
 344                 (double)stream->frames );
 345     }
 346     /*
 347      * if the stream was opened for a scan, cache the result, otherwise delete
 348      * the state.
 349      */
 350     if ( stream->opentype == 0 )
 351     {
 352         hb_stream_delete_dynamic( stream );
 353         if ( stream_state_list == NULL )
 354         {
 355             stream_state_list = hb_list_init();
 356         }
 357         hb_list_add( stream_state_list, stream );
 358     }
 359     else
 360     {
 361         hb_stream_delete( stream );
 362     }
 363     *_d = NULL;
 364 }
 365
 366 /* when the file was first opened we made entries for all the audio elementary
 367  * streams we found in it. Streams that were later found during the preview scan
 368  * now have an audio codec, type, rate, etc., associated with them. At the end
 369  * of the scan we delete all the audio entries that weren't found by the scan
 370  * or don't have a format we support. This routine deletes audio entry 'indx'
 371  * by copying all later entries down one slot. */
 372 static void hb_stream_delete_audio_entry(hb_stream_t *stream, int indx)
 373 {
 374     int i;
 375
 376     for (i = indx+1; i < stream->ts_number_audio_pids; ++i)
 377     {
 378         stream->ts_audio_pids[indx] = stream->ts_audio_pids[i];
 379         stream->ts_audio_stream_type[1 + indx] = stream->ts_audio_stream_type[1+i];
 380         stream->ts_streamid[1 + indx] = stream->ts_streamid[1 + i];
 381         ++indx;
 382     }
 383     --stream->ts_number_audio_pids;
 384 }
 385
 386 static int index_of_pid(int pid, hb_stream_t *stream)
 387 {
 388     int i;
 389
 390     if ( pid == stream->ts_video_pids[0] )
 391         return 0;
 392
 393     for ( i = 0; i < stream->ts_number_audio_pids; ++i )
 394         if ( pid == stream->ts_audio_pids[i] )
 395             return i + 1;
 396
 397     return -1;
 398 }
 399
 400 /***********************************************************************
 401  * hb_ps_stream_title_scan
 402  ***********************************************************************
 403  *
 404  **********************************************************************/
 405 hb_title_t * hb_stream_title_scan(hb_stream_t *stream)
 406 {
 407     // 'Barebones Title'
 408     hb_title_t *aTitle = hb_title_init( stream->path, 0 );
 409     aTitle->index = 1;
 410
 411         // Copy part of the stream path to the title name
 412         char *sep = strrchr(stream->path, '/');
 413         if (sep)
 414                 strcpy(aTitle->name, sep+1);
 415         char *dot_term = strrchr(aTitle->name, '.');
 416         if (dot_term)
 417                 *dot_term = '\0';
 418
 419     // Height, width,  rate and aspect ratio information is filled in when the previews are built
 420
 421     hb_stream_duration(stream, aTitle);
 422
 423     // One Chapter
 424     hb_chapter_t * chapter;
 425     chapter = calloc( sizeof( hb_chapter_t ), 1 );
 426     chapter->index = 1;
 427     chapter->duration = aTitle->duration;
 428     chapter->hours = aTitle->hours;
 429     chapter->minutes = aTitle->minutes;
 430     chapter->seconds = aTitle->seconds;
 431     hb_list_add( aTitle->list_chapter, chapter );
 432
 433     // Figure out how many audio streams we really have:
 434     // - For transport streams, for each PID listed in the PMT (whether
 435     //   or not it was an audio stream type) read the bitstream until we
 436     //   find an packet from that PID containing a PES header and see if
 437     //   the elementary stream is an audio type.
 438     // - For program streams read the first 4MB and take every unique
 439     //   audio stream we find.
 440         if (stream->stream_type == hb_stream_type_transport)
 441         {
 442         int i;
 443
 444         for (i=0; i < stream->ts_number_audio_pids; i++)
 445         {
 446             hb_audio_t *audio = hb_ts_stream_set_audio_id_and_codec(stream, i);
 447             if (audio->config.in.codec)
 448                 hb_list_add( aTitle->list_audio, audio );
 449             else
 450             {
 451                 free(audio);
 452                 hb_stream_delete_audio_entry(stream, i);
 453                 --i;
 454             }
 455         }
 456
 457         // add the PCR PID if we don't already have it
 458         if ( index_of_pid( stream->pmt_info.PCR_PID, stream ) < 0 )
 459         {
 460             stream->ts_audio_pids[stream->ts_number_audio_pids++] =
 461                 stream->pmt_info.PCR_PID;
 462         }
 463         }
 464     else
 465     {
 466         hb_ps_stream_find_audio_ids(stream, aTitle);
 467     }
 468
 469   return aTitle;
 470 }
 471
 472 /*
 473  * scan the next MB of 'stream' to find the next start packet for
 474  * the Packetized Elementary Stream associated with TS PID 'pid'.
 475  */
 476 static const uint8_t *hb_ts_stream_getPEStype(hb_stream_t *stream, uint32_t pid)
 477 {
 478     static uint8_t buf[188];
 479     int npack = 100000; // max packets to read
 480
 481     while (--npack >= 0)
 482     {
 483         if (fread(buf, 1, 188, stream->file_handle) != 188)
 484         {
 485             hb_log("hb_ts_stream_getPEStype: EOF while searching for PID 0x%x", pid);
 486             return 0;
 487         }
 488         if (buf[0] != 0x47)
 489         {
 490             hb_log("hb_ts_stream_getPEStype: lost sync while searching for PID 0x%x", pid);
 491             align_to_next_packet(stream->file_handle);
 492             continue;
 493         }
 494
 495         /*
 496          * The PES header is only in TS packets with 'start' set so we check
 497          * that first then check for the right PID.
 498          */
 499         if ((buf[1] & 0x40) == 0 || (buf[1] & 0x1f) != (pid >> 8) ||
 500             buf[2] != (pid & 0xff))
 501         {
 502             // not a start packet or not the pid we want
 503             continue;
 504         }
 505
 506         /* skip over the TS hdr to return a pointer to the PES hdr */
 507         int udata = 4;
 508         switch (buf[3] & 0x30)
 509         {
 510             case 0x00: // illegal
 511             case 0x20: // fill packet
 512                 continue;
 513
 514             case 0x30: // adaptation
 515                 if (buf[4] > 182)
 516                 {
 517                     hb_log("hb_ts_stream_getPEStype: invalid adaptation field length %d for PID 0x%x", buf[4], pid);
 518                     continue;
 519                 }
 520                 udata += buf[4] + 1;
 521                 break;
 522         }
 523         return &buf[udata];
 524     }
 525
 526     /* didn't find it */
 527     return 0;
 528 }
 529
 530 static uint64_t hb_ps_stream_getVideoPTS(hb_stream_t *stream)
 531 {
 532     hb_buffer_t *buf  = hb_buffer_init(HB_DVD_READ_BUFFER_SIZE);
 533     hb_list_t *list = hb_list_init();
 534     // how many blocks we read while searching for a video PES header
 535     int blksleft = 1024;
 536     uint64_t pts = 0;
 537
 538     while (--blksleft >= 0 && hb_stream_read(stream, buf) == 1)
 539     {
 540         hb_buffer_t *es;
 541
 542         // 'buf' contains an MPEG2 PACK - get a list of all it's elementary streams
 543         hb_demux_ps(buf, list);
 544
 545         while ( ( es = hb_list_item( list, 0 ) ) )
 546         {
 547             hb_list_rem( list, es );
 548             if ( es->id == 0xe0 )
 549             {
 550                 // this PES contains video - if there's a PTS we're done
 551                 // hb_demux_ps left the PTS in buf_es->start.
 552                 if ( es->start != ~0 )
 553                 {
 554                     pts = es->start;
 555                     blksleft = 0;
 556                     break;
 557                 }
 558             }
 559             hb_buffer_close( &es );
 560         }
 561     }
 562     hb_list_empty( &list );
 563     hb_buffer_close(&buf);
 564     return pts;
 565 }
 566
 567 /***********************************************************************
 568  * hb_stream_duration
 569  ***********************************************************************
 570  *
 571  * Finding stream duration is difficult.  One issue is that the video file
 572  * may have chunks from several different program fragments (main feature,
 573  * commercials, station id, trailers, etc.) all with their own base pts
 574  * value.  We can't find the piece boundaries without reading the entire
 575  * file but if we compute a rate based on time stamps from two different
 576  * pieces the result will be meaningless.  The second issue is that the
 577  * data rate of compressed video normally varies by 5-10x over the length
 578  * of the video. This says that we want to compute the rate over relatively
 579  * long segments to get a representative average but long segments increase
 580  * the likelihood that we'll cross a piece boundary.
 581  *
 582  * What we do is take time stamp samples at several places in the file
 583  * (currently 16) then compute the average rate (i.e., ticks of video per
 584  * byte of the file) for all pairs of samples (N^2 rates computed for N
 585  * samples). Some of those rates will be absurd because the samples came
 586  * from different segments. Some will be way low or high because the
 587  * samples came from a low or high motion part of the segment. But given
 588  * that we're comparing *all* pairs the majority of the computed rates
 589  * should be near the overall average.  So we median filter the computed
 590  * rates to pick the most representative value.
 591  *
 592  **********************************************************************/
 593 struct pts_pos {
 594     uint64_t pos;   /* file position of this PTS sample */
 595     uint64_t pts;   /* PTS from video stream */
 596 };
 597
 598 #define NDURSAMPLES 16
 599
 600 // get one (position, timestamp) sampple from a transport or program
 601 // stream.
 602 static struct pts_pos hb_sample_pts(hb_stream_t *stream, uint64_t fpos)
 603 {
 604     struct pts_pos pp = { 0, 0 };
 605
 606     if ( stream->stream_type == hb_stream_type_program )
 607     {
 608         // round address down to nearest dvd sector start
 609         fpos &=~ ( HB_DVD_READ_BUFFER_SIZE - 1 );
 610         fseeko( stream->file_handle, fpos, SEEK_SET );
 611         pp.pts = hb_ps_stream_getVideoPTS( stream );
 612     }
 613     else
 614     {
 615         const uint8_t *buf;
 616         fseeko( stream->file_handle, fpos, SEEK_SET );
 617         align_to_next_packet( stream->file_handle );
 618         buf = hb_ts_stream_getPEStype( stream, stream->ts_video_pids[0] );
 619         if ( buf == NULL )
 620         {
 621             hb_log("hb_sample_pts: couldn't find video packet near %llu", fpos);
 622             return pp;
 623         }
 624         if ( ( buf[7] >> 7 ) != 1 )
 625         {
 626             hb_log("hb_sample_pts: no PTS in video packet near %llu", fpos);
 627             return pp;
 628         }
 629         pp.pts = ( ( (uint64_t)buf[9] >> 1 ) & 7 << 30 ) |
 630                  ( (uint64_t)buf[10] << 22 ) |
 631                  ( ( (uint64_t)buf[11] >> 1 ) << 15 ) |
 632                  ( (uint64_t)buf[12] << 7 ) |
 633                  ( (uint64_t)buf[13] >> 1 );
 634     }
 635     pp.pos = ftello(stream->file_handle);
 636     hb_log("hb_sample_pts: pts %lld at %llu", pp.pts, pp.pos );
 637     return pp;
 638 }
 639
 640 static int dur_compare( const void *a, const void *b )
 641 {
 642     const double *aval = a, *bval = b;
 643     return ( *aval < *bval ? -1 : ( *aval == *bval ? 0 : 1 ) );
 644 }
 645
 646 // given an array of (position, time) samples, compute a max-likelihood
 647 // estimate of the average rate by computing the rate between all pairs
 648 // of samples then taking the median of those rates.
 649 static double compute_stream_rate( struct pts_pos *pp, int n )
 650 {
 651     int i, j;
 652     double rates[NDURSAMPLES * NDURSAMPLES / 2];
 653     double *rp = rates;
 654
 655     // the following nested loops compute the rates between all pairs.
 656     *rp = 0;
 657     for ( i = 0; i < n-1; ++i )
 658     {
 659         // Bias the median filter by not including pairs that are "far"
 660         // from one another. This is to handle cases where the file is
 661         // made of roughly equal size pieces where a symmetric choice of
 662         // pairs results in having the same number of intra-piece &
 663         // inter-piece rate estimates. This would mean that the median
 664         // could easily fall in the inter-piece part of the data which
 665         // would give a bogus estimate. The 'ns' index creates an
 666         // asymmetry that favors locality.
 667         int ns = i + ( n >> 1 );
 668         if ( ns > n )
 669             ns = n;
 670         for ( j = i+1; j < ns; ++j )
 671         {
 672             if ( pp[j].pts != pp[i].pts && pp[j].pos > pp[i].pos )
 673             {
 674                 *rp = ((double)( pp[j].pts - pp[i].pts )) /
 675                       ((double)( pp[j].pos - pp[i].pos ));
 676                                 ++rp;
 677             }
 678         }
 679     }
 680     // now compute and return the median of all the (n*n/2) rates we computed
 681     // above.
 682     int nrates = rp - rates;
 683     qsort( rates, nrates, sizeof (rates[0] ), dur_compare );
 684     return rates[nrates >> 1];
 685 }
 686
 687 static void hb_stream_duration(hb_stream_t *stream, hb_title_t *inTitle)
 688 {
 689     struct pts_pos ptspos[NDURSAMPLES];
 690     struct pts_pos *pp = ptspos;
 691     int i;
 692
 693     fseeko(stream->file_handle, 0, SEEK_END);
 694     uint64_t fsize = ftello(stream->file_handle);
 695     uint64_t fincr = fsize / NDURSAMPLES;
 696     uint64_t fpos = fincr / 2;
 697     for ( i = NDURSAMPLES; --i >= 0; fpos += fincr )
 698     {
 699         *pp++ = hb_sample_pts(stream, fpos);
 700     }
 701     uint64_t dur = compute_stream_rate( ptspos, pp - ptspos ) * (double)fsize;
 702     inTitle->duration = dur;
 703     dur /= 90000;
 704     inTitle->hours    = dur / 3600;
 705     inTitle->minutes  = ( dur % 3600 ) / 60;
 706     inTitle->seconds  = dur % 60;
 707
 708     rewind(stream->file_handle);
 709 }
 710
 711 /***********************************************************************
 712  * hb_stream_read
 713  ***********************************************************************
 714  *
 715  **********************************************************************/
 716 int hb_stream_read( hb_stream_t * src_stream, hb_buffer_t * b )
 717 {
 718     if ( src_stream->stream_type == hb_stream_type_program )
 719     {
 720         size_t amt_read = fread(b->data, HB_DVD_READ_BUFFER_SIZE, 1,
 721                                 src_stream->file_handle);
 722         return (amt_read > 0);
 723     }
 724     return hb_ts_stream_decode( src_stream, b->data );
 725 }
 726
 727 /***********************************************************************
 728  * hb_stream_seek
 729  ***********************************************************************
 730  *
 731  **********************************************************************/
 732 int hb_stream_seek( hb_stream_t * src_stream, float f )
 733 {
 734   off_t stream_size, cur_pos, new_pos;
 735   double pos_ratio = f;
 736   cur_pos = ftello(src_stream->file_handle);
 737   fseeko(src_stream->file_handle,0 ,SEEK_END);
 738   stream_size = ftello(src_stream->file_handle);
 739   new_pos = (off_t) ((double) (stream_size) * pos_ratio);
 740   new_pos &=~ (HB_DVD_READ_BUFFER_SIZE - 1);
 741   int r = fseeko(src_stream->file_handle, new_pos, SEEK_SET);
 742
 743   if (r == -1)
 744   {
 745     fseeko(src_stream->file_handle, cur_pos, SEEK_SET);
 746     return 0;
 747   }
 748
 749   if (src_stream->stream_type == hb_stream_type_transport)
 750   {
 751         // We need to drop the current decoder output and move
 752         // forwards to the next transport stream packet.
 753         hb_ts_stream_reset(src_stream);
 754   }
 755
 756   return 1;
 757 }
 758
 759 static void set_audio_description( hb_audio_t *audio, iso639_lang_t *lang )
 760 {
 761     /* XXX
 762      * This is a duplicate of code in dvd.c - it should get factored out
 763      * into a common routine. We probably should only be putting the lang
 764      * code or a lang pointer into the audio config & let the common description
 765      * formatting routine in scan.c do all the stuff below.
 766      */
 767     snprintf( audio->config.lang.description,
 768               sizeof( audio->config.lang.description ), "%s (%s)",
 769               strlen(lang->native_name) ? lang->native_name : lang->eng_name,
 770               audio->config.in.codec == HB_ACODEC_AC3 ? "AC3" :
 771                   audio->config.in.codec == HB_ACODEC_DCA ? "DTS" :
 772                       audio->config.in.codec == HB_ACODEC_MPGA ? "MPEG" : "LPCM" );
 773     snprintf( audio->config.lang.simple, sizeof( audio->config.lang.simple ), "%s",
 774               strlen(lang->native_name) ? lang->native_name : lang->eng_name );
 775     snprintf( audio->config.lang.iso639_2, sizeof( audio->config.lang.iso639_2 ),
 776               "%s", lang->iso639_2);
 777 }
 778
 779 static hb_audio_t *hb_ts_stream_set_audio_id_and_codec(hb_stream_t *stream,
 780                                                        int aud_pid_index)
 781 {
 782     off_t cur_pos = ftello(stream->file_handle);
 783     hb_audio_t *audio = calloc( sizeof( hb_audio_t ), 1 );
 784     const uint8_t *buf;
 785
 786     fseeko(stream->file_handle, 0, SEEK_SET);
 787     align_to_next_packet(stream->file_handle);
 788     buf = hb_ts_stream_getPEStype(stream, stream->ts_audio_pids[aud_pid_index]);
 789
 790     /* check that we found a PES header */
 791     if (buf && buf[0] == 0x00 && buf[1] == 0x00 && buf[2] == 0x01)
 792     {
 793         if (buf[3] == 0xbd)
 794         {
 795             audio->id = 0x80bd | (aud_pid_index << 8);
 796             audio->config.in.codec = HB_ACODEC_AC3;
 797             hb_log("transport stream pid 0x%x (type 0x%x) is AC-3 audio id 0x%x",
 798                    stream->ts_audio_pids[aud_pid_index],
 799                    stream->ts_audio_stream_type[1 + aud_pid_index],
 800                    audio->id);
 801             stream->ts_audio_stream_type[1 + aud_pid_index] = 0x81;
 802             stream->ts_streamid[1 + aud_pid_index] = buf[3];
 803         }
 804         else if ((buf[3] & 0xe0) == 0xc0)
 805         {
 806             audio->id = buf[3] | aud_pid_index;
 807             audio->config.in.codec = HB_ACODEC_MPGA;
 808             hb_log("transport stream pid 0x%x (type 0x%x) is MPEG audio id 0x%x",
 809                    stream->ts_audio_pids[aud_pid_index],
 810                    stream->ts_audio_stream_type[1 + aud_pid_index],
 811                    audio->id);
 812             stream->ts_audio_stream_type[1 + aud_pid_index] = 0x03;
 813             stream->ts_streamid[1 + aud_pid_index] = buf[3];
 814         }
 815     }
 816     fseeko(stream->file_handle, cur_pos, SEEK_SET);
 817     if ( audio->config.in.codec )
 818     {
 819                 set_audio_description( audio,
 820                   lang_for_code( stream->a52_info[aud_pid_index].lang_code ) );
 821     }
 822     else
 823     {
 824         hb_log("transport stream pid 0x%x (type 0x%x) isn't audio",
 825                 stream->ts_audio_pids[aud_pid_index],
 826                 stream->ts_audio_stream_type[1 + aud_pid_index]);
 827         }
 828     return audio;
 829 }
 830
 831 static void add_audio_to_title(hb_title_t *title, int id)
 832 {
 833     hb_audio_t *audio = calloc( sizeof( hb_audio_t ), 1 );
 834
 835     audio->id = id;
 836     switch ( id >> 12 )
 837     {
 838         case 0x0:
 839             audio->config.in.codec = HB_ACODEC_MPGA;
 840             hb_log("add_audio_to_title: added MPEG audio stream 0x%x", id);
 841             break;
 842         case 0x2:
 843             // type 2 is a DVD subtitle stream - just ignore it */
 844             free( audio );
 845             return;
 846         case 0x8:
 847             audio->config.in.codec = HB_ACODEC_AC3;
 848             hb_log("add_audio_to_title: added AC3 audio stream 0x%x", id);
 849             break;
 850         case 0xa:
 851             audio->config.in.codec = HB_ACODEC_LPCM;
 852             hb_log("add_audio_to_title: added LPCM audio stream 0x%x", id);
 853             break;
 854         default:
 855             hb_log("add_audio_to_title: unknown audio stream type 0x%x", id);
 856             free( audio );
 857             return;
 858
 859     }
 860     set_audio_description( audio, lang_for_code( 0 ) );
 861     hb_list_add( title->list_audio, audio );
 862 }
 863
 864 static void hb_ps_stream_find_audio_ids(hb_stream_t *stream, hb_title_t *title)
 865 {
 866     off_t cur_pos = ftello(stream->file_handle);
 867     hb_buffer_t *buf  = hb_buffer_init(HB_DVD_READ_BUFFER_SIZE);
 868     hb_list_t *list = hb_list_init();
 869     // how many blocks we read while searching for audio streams
 870     int blksleft = 4096;
 871     // there can be at most 16 unique streams in an MPEG PS (8 in a DVD)
 872     // so we use a bitmap to keep track of the ones we've already seen.
 873     // Bit 'i' of smap is set if we've already added the audio for
 874     // audio substream id 'i' to the title's audio list.
 875     uint32_t smap = 0;
 876
 877     // start looking 20% into the file since there's occasionally no
 878     // audio at the beginning (particularly for vobs).
 879     hb_stream_seek(stream, 0.2f);
 880
 881     while (--blksleft >= 0 && hb_stream_read(stream, buf) == 1)
 882     {
 883         hb_buffer_t *es;
 884
 885         // 'buf' contains an MPEG2 PACK - get a list of all it's elementary streams
 886         hb_demux_ps(buf, list);
 887
 888         while ( ( es = hb_list_item( list, 0 ) ) )
 889         {
 890             hb_list_rem( list, es );
 891             if ( (es->id & 0xff) == 0xbd || (es->id & 0xe0) == 0xc0 )
 892             {
 893                 // this PES contains some kind of audio - get the substream id
 894                 // and check if we've seen it already.
 895                 int ssid = (es->id > 0xff ? es->id >> 8 : es->id) & 0xf;
 896                 if ( (smap & (1 << ssid)) == 0 )
 897                 {
 898                     // we haven't seen this stream before - add it to the
 899                     // title's list of audio streams.
 900                     smap |= (1 << ssid);
 901                     add_audio_to_title(title, es->id);
 902                 }
 903             }
 904             hb_buffer_close( &es );
 905         }
 906     }
 907     hb_list_empty( &list );
 908     hb_buffer_close(&buf);
 909     fseeko(stream->file_handle, cur_pos, SEEK_SET);
 910 }
 911
 912 /***********************************************************************
 913  * hb_ts_stream_init
 914  ***********************************************************************
 915  *
 916  **********************************************************************/
 917
 918 static void hb_ts_stream_init(hb_stream_t *stream)
 919 {
 920         int i;
 921
 922         for (i=0; i < kMaxNumberDecodeStreams; i++)
 923         {
 924                 stream->ts_streamcont[i] = -1;
 925         }
 926         stream->ts_video_pids[0] = -1;
 927     for ( i = 0; i < stream->ts_number_audio_pids; i++ )
 928     {
 929         stream-> ts_audio_pids[i] = -1;
 930     }
 931
 932         // Find the audio and video pids in the stream
 933         hb_ts_stream_find_pids(stream);
 934
 935     stream->ts_streamid[0] = 0xE0;              // stream 0 must be video
 936
 937         for (i = 0; i < stream->ts_number_video_pids + stream->ts_number_audio_pids; i++)
 938         {
 939         // demuxing buffer for TS to PS conversion
 940                 stream->ts_buf[i] = malloc( HB_DVD_READ_BUFFER_SIZE );
 941         }
 942 }
 943
 944 // ------------------------------------------------------------------------------------
 945
 946 static off_t align_to_next_packet(FILE* f)
 947 {
 948         unsigned char buf[188*20];
 949
 950         off_t start = ftello(f);
 951         off_t pos = 0;
 952
 953         if (fread(buf, 188*20, 1, f) == 1)
 954         {
 955                 int found = 0;
 956                 while (!found && (pos < 188))
 957                 {
 958                         found = 1;
 959                         int i = 0;
 960                         for (i = 0; i < 188*20; i += 188)
 961                         {
 962                                 unsigned char c = buf[pos+i];
 963                                 // Check sync byte
 964                                 if ((c != 0x47) && (c != 0x72) && (c != 0x29))
 965                                 {
 966                                         // this offset failed, try next
 967                                         found = 0;
 968                                         pos++;
 969                                         break;
 970                                 }
 971                         }
 972                 }
 973         }
 974
 975         if (pos == 188)
 976                 pos = 0;                // failed to find anything!!!!!?
 977
 978     fseeko(f, start+pos, SEEK_SET);
 979
 980         return pos;
 981 }
 982
 983
 984 typedef struct {
 985     uint8_t *buf;
 986     uint32_t val;
 987     int pos;
 988 } bitbuf_t;
 989
 990 static const unsigned int bitmask[] = {
 991         0x0,0x1,0x3,0x7,0xf,0x1f,0x3f,0x7f,0xff,
 992         0x1ff,0x3ff,0x7ff,0xfff,0x1fff,0x3fff,0x7fff,0xffff,
 993         0x1ffff,0x3ffff,0x7ffff,0xfffff,0x1fffff,0x3fffff,0x7fffff,0xffffff,
 994         0x1ffffff,0x3ffffff,0x7ffffff,0xfffffff,0x1fffffff,0x3fffffff,0x7fffffff,0xffffffff};
 995
 996 static inline void set_buf(bitbuf_t *bb, uint8_t* buf, int bufsize, int clear)
 997 {
 998         bb->pos = 0;
 999         bb->buf = buf;
1000         bb->val = (bb->buf[0] << 24) | (bb->buf[1] << 16) |
1001               (bb->buf[2] << 8) | bb->buf[3];
1002         if (clear)
1003                 memset(bb->buf, 0, bufsize);
1004 }
1005
1006 static inline int buf_size(bitbuf_t *bb)
1007 {
1008         return bb->pos >> 3;
1009 }
1010
1011 static inline unsigned int get_bits(bitbuf_t *bb, int bits)
1012 {
1013         unsigned int val;
1014         int left = 32 - (bb->pos & 31);
1015
1016         if (bits < left)
1017         {
1018                 val = (bb->val >> (left - bits)) & bitmask[bits];
1019                 bb->pos += bits;
1020         }
1021         else
1022         {
1023                 val = (bb->val & bitmask[left]) << (bits - left);
1024                 bb->pos += left;
1025                 bits -= left;
1026
1027                 int pos = bb->pos >> 3;
1028                 bb->val = (bb->buf[pos] << 24) | (bb->buf[pos + 1] << 16) | (bb->buf[pos + 2] << 8) | bb->buf[pos + 3];
1029
1030                 if (bits > 0)
1031                 {
1032                         val |= (bb->val >> (32 - bits)) & bitmask[bits];
1033                         bb->pos += bits;
1034                 }
1035         }
1036
1037         return val;
1038 }
1039
1040 // extract what useful information we can from the elementary stream
1041 // descriptor list at 'dp' and add it to the stream at 'esindx'.
1042 // Descriptors with info we don't currently use are ignored.
1043 // The descriptor list & descriptor item formats are defined in
1044 // ISO 13818-1 (2000E) section 2.6 (pg. 62).
1045 static void decode_element_descriptors(hb_stream_t* stream, int esindx,
1046                                        const uint8_t *dp, uint8_t dlen)
1047 {
1048     const uint8_t *ep = dp + dlen;
1049
1050     while (dp < ep)
1051     {
1052         switch (dp[0])
1053         {
1054             case 10:    // ISO_639_language descriptor
1055                 stream->a52_info[esindx].lang_code = lang_to_code(lang_for_code2((const char *)&dp[2]));
1056                 break;
1057
1058             default:
1059                 break;
1060         }
1061         dp += dp[1] + 2;
1062     }
1063 }
1064
1065 int decode_program_map(hb_stream_t* stream)
1066 {
1067     bitbuf_t bb;
1068         set_buf(&bb, stream->pmt_info.tablebuf, stream->pmt_info.tablepos, 0);
1069
1070     get_bits(&bb, 8);  // table_id
1071     get_bits(&bb, 4);
1072     unsigned int section_length = get_bits(&bb, 12);
1073     stream->pmt_info.section_length = section_length;
1074
1075     unsigned int program_number = get_bits(&bb, 16);
1076     stream->pmt_info.program_number = program_number;
1077     get_bits(&bb, 2);
1078     get_bits(&bb, 5);  // version_number
1079     get_bits(&bb, 1);
1080     get_bits(&bb, 8);  // section_number
1081     get_bits(&bb, 8);  // last_section_number
1082     get_bits(&bb, 3);
1083     unsigned int PCR_PID = get_bits(&bb, 13);
1084     stream->pmt_info.PCR_PID = PCR_PID;
1085     get_bits(&bb, 4);
1086     unsigned int program_info_length = get_bits(&bb, 12);
1087     stream->pmt_info.program_info_length = program_info_length;
1088
1089         int i=0;
1090         unsigned char *descriptor_buf = (unsigned char *) malloc(program_info_length);
1091         for (i = 0; i < program_info_length; i++)
1092         {
1093           descriptor_buf[i] = get_bits(&bb, 8);
1094         }
1095
1096         int cur_pos =  9 /* data after the section length field*/ + program_info_length;
1097         int done_reading_stream_types = 0;
1098         while (!done_reading_stream_types)
1099         {
1100           unsigned char stream_type = get_bits(&bb, 8);
1101                   get_bits(&bb, 3);
1102           unsigned int elementary_PID = get_bits(&bb, 13);
1103                   get_bits(&bb, 4);
1104           unsigned int ES_info_length = get_bits(&bb, 12);
1105
1106           int i=0;
1107           unsigned char *ES_info_buf = (unsigned char *) malloc(ES_info_length);
1108           for (i=0; i < ES_info_length; i++)
1109           {
1110                 ES_info_buf[i] = get_bits(&bb, 8);
1111           }
1112
1113           if (stream_type == 0x02)
1114           {
1115                 if (stream->ts_number_video_pids <= kMaxNumberVideoPIDS)
1116                   stream->ts_number_video_pids++;
1117                 stream->ts_video_pids[stream->ts_number_video_pids-1] = elementary_PID;
1118           }
1119       else
1120       {
1121         // Defined audio stream types are 0x81 for AC-3/A52 audio and 0x03
1122         // for mpeg audio. But content producers seem to use other
1123         // values (0x04 and 0x06 have both been observed) so at this point
1124         // we say everything that isn't a video pid is audio then at the end
1125         // of hb_stream_title_scan we'll figure out which are really audio
1126         // by looking at the PES headers.
1127         i = stream->ts_number_audio_pids;
1128         if (i < kMaxNumberAudioPIDS)
1129             stream->ts_number_audio_pids++;
1130         stream->ts_audio_pids[i] = elementary_PID;
1131         stream->ts_audio_stream_type[1 + i] = stream_type;
1132
1133                 if (ES_info_length > 0)
1134                 {
1135             decode_element_descriptors(stream, i, ES_info_buf, ES_info_length);
1136                 }
1137           }
1138
1139           cur_pos += 5 /* stream header */ + ES_info_length;
1140
1141           free(ES_info_buf);
1142
1143           if (cur_pos >= section_length - 4 /* stop before the CRC */)
1144                 done_reading_stream_types = 1;
1145         }
1146
1147         free(descriptor_buf);
1148         return 1;
1149 }
1150
1151 // ------------------------------------------------------------------------------------
1152
1153 int build_program_map(unsigned char *buf, hb_stream_t *stream)
1154 {
1155     // Get adaption header info
1156     int adapt_len = 0;
1157     int adaption = (buf[3] & 0x30) >> 4;
1158     if (adaption == 0)
1159             return 0;
1160     else if (adaption == 0x2)
1161             adapt_len = 184;
1162     else if (adaption == 0x3)
1163             adapt_len = buf[4] + 1;
1164     if (adapt_len > 184)
1165             return 0;
1166
1167     // Get payload start indicator
1168     int start;
1169     start = (buf[1] & 0x40) != 0;
1170
1171     // Get pointer length - only valid in packets with a start flag
1172     int pointer_len = 0;
1173         if (start && stream->pmt_info.reading)
1174         {
1175                 // We just finished a bunch of packets - parse the program map details
1176                 int decode_ok = 0;
1177                 if (stream->pmt_info.tablebuf[0] == 0x02)
1178                         decode_ok = decode_program_map(stream);
1179                 free(stream->pmt_info.tablebuf);
1180                 stream->pmt_info.tablebuf = NULL;
1181                 stream->pmt_info.tablepos = 0;
1182         stream->pmt_info.reading = 0;
1183         if (decode_ok)
1184                         return decode_ok;
1185         }
1186
1187         if (start)
1188         {
1189                 pointer_len = buf[4 + adapt_len] + 1;
1190                 stream->pmt_info.tablepos = 0;
1191         }
1192         // Get Continuity Counter
1193         int continuity_counter = buf[3] & 0x0f;
1194         if (!start && (stream->pmt_info.current_continuity_counter + 1 != continuity_counter))
1195         {
1196                 hb_log("build_program_map - Continuity Counter %d out of sequence - expected %d", continuity_counter, stream->pmt_info.current_continuity_counter+1);
1197                 return 0;
1198         }
1199         stream->pmt_info.current_continuity_counter = continuity_counter;
1200         stream->pmt_info.reading |= start;
1201
1202     // Add the payload for this packet to the current buffer
1203         int amount_to_copy = 184 - adapt_len - pointer_len;
1204     if (stream->pmt_info.reading && (amount_to_copy > 0))
1205     {
1206                         stream->pmt_info.tablebuf = realloc(stream->pmt_info.tablebuf, stream->pmt_info.tablepos + amount_to_copy);
1207
1208             memcpy(stream->pmt_info.tablebuf + stream->pmt_info.tablepos, buf + 4 + adapt_len + pointer_len, amount_to_copy);
1209             stream->pmt_info.tablepos += amount_to_copy;
1210     }
1211
1212     return 0;
1213 }
1214
1215 int decode_PAT(unsigned char *buf, hb_stream_t *stream)
1216 {
1217     unsigned char tablebuf[1024];
1218     unsigned int tablepos = 0;
1219
1220     int reading = 0;
1221
1222
1223     // Get adaption header info
1224     int adapt_len = 0;
1225     int adaption = (buf[3] & 0x30) >> 4;
1226     if (adaption == 0)
1227             return 0;
1228     else if (adaption == 0x2)
1229             adapt_len = 184;
1230     else if (adaption == 0x3)
1231             adapt_len = buf[4] + 1;
1232     if (adapt_len > 184)
1233             return 0;
1234
1235     // Get pointer length
1236     int pointer_len = buf[4 + adapt_len] + 1;
1237
1238     // Get payload start indicator
1239     int start;
1240     start = (buf[1] & 0x40) != 0;
1241
1242     if (start)
1243             reading = 1;
1244
1245     // Add the payload for this packet to the current buffer
1246     if (reading && (184 - adapt_len) > 0)
1247     {
1248             if (tablepos + 184 - adapt_len - pointer_len > 1024)
1249             {
1250                     hb_log("decode_PAT - Bad program section length (> 1024)");
1251                     return 0;
1252             }
1253             memcpy(tablebuf + tablepos, buf + 4 + adapt_len + pointer_len, 184 - adapt_len - pointer_len);
1254             tablepos += 184 - adapt_len - pointer_len;
1255     }
1256
1257     if (start && reading)
1258     {
1259             memcpy(tablebuf + tablepos, buf + 4 + adapt_len + 1, pointer_len - 1);
1260
1261
1262             unsigned int pos = 0;
1263             //while (pos < tablepos)
1264             {
1265                     bitbuf_t bb;
1266                     set_buf(&bb, tablebuf + pos, tablepos - pos, 0);
1267
1268                     unsigned char section_id    = get_bits(&bb, 8);
1269                     get_bits(&bb, 4);
1270                     unsigned int section_len    = get_bits(&bb, 12);
1271                     get_bits(&bb, 16); // transport_id
1272                     get_bits(&bb, 2);
1273                     get_bits(&bb, 5);  // version_num
1274                     get_bits(&bb, 1);  // current_next
1275                     get_bits(&bb, 8);  // section_num
1276                     get_bits(&bb, 8);  // last_section
1277
1278                     switch (section_id)
1279                     {
1280                       case 0x00:
1281                         {
1282                           // Program Association Section
1283                           section_len -= 5;    // Already read transport stream ID, version num, section num, and last section num
1284                           section_len -= 4;   // Ignore the CRC
1285                           int curr_pos = 0;
1286                                                   stream->ts_number_pat_entries = 0;
1287                           while ((curr_pos < section_len) && (stream->ts_number_pat_entries < kMaxNumberPMTStreams))
1288                           {
1289                             unsigned int pkt_program_num = get_bits(&bb, 16);
1290                                                         stream->pat_info[stream->ts_number_pat_entries].program_number = pkt_program_num;
1291
1292                             get_bits(&bb, 3);  // Reserved
1293                             if (pkt_program_num == 0)
1294                             {
1295                               get_bits(&bb, 13); // pkt_network_id
1296                             }
1297                             else
1298                             {
1299                               unsigned int pkt_program_map_PID = get_bits(&bb, 13);
1300                                 stream->pat_info[stream->ts_number_pat_entries].program_map_PID = pkt_program_map_PID;
1301                             }
1302                             curr_pos += 4;
1303                                                         stream->ts_number_pat_entries++;
1304                           }
1305                         }
1306                         break;
1307                       case 0xC7:
1308                             {
1309                                     break;
1310                             }
1311                       case 0xC8:
1312                             {
1313                                     break;
1314                             }
1315                     }
1316
1317                     pos += 3 + section_len;
1318             }
1319
1320             tablepos = 0;
1321     }
1322     return 1;
1323 }
1324
1325 static void hb_ts_stream_find_pids(hb_stream_t *stream)
1326 {
1327         unsigned char buf[188];
1328
1329         // align to first packet
1330         align_to_next_packet(stream->file_handle);
1331
1332         // Read the Transport Stream Packets (188 bytes each) looking at first for PID 0 (the PAT PID), then decode that
1333         // to find the program map PID and then decode that to get the list of audio and video PIDs
1334
1335         int bytesReadInPacket = 0;
1336         for (;;)
1337         {
1338                 // Try to read packet..
1339                 int bytesRead;
1340                 if ((bytesRead = fread(buf+bytesReadInPacket, 1, 188-bytesReadInPacket, stream->file_handle)) != 188-bytesReadInPacket)
1341                 {
1342                         if (bytesRead < 0)
1343                                 bytesRead = 0;
1344                         bytesReadInPacket += bytesRead;
1345
1346                         hb_log("hb_ts_stream_find_pids - end of file");
1347                         break;
1348                 }
1349                 else
1350                 {
1351                         bytesReadInPacket = 0;
1352                 }
1353
1354                 // Check sync byte
1355                 if ((buf[0] != 0x47) && (buf[0] != 0x72) && (buf[0] != 0x29))
1356                 {
1357             off_t pos = ftello(stream->file_handle) - 188;
1358             off_t pos2 = align_to_next_packet(stream->file_handle);
1359             if ( pos2 == 0 )
1360             {
1361                 hb_log( "hb_ts_stream_find_pids: eof while re-establishing sync @ %lld",
1362                         pos );
1363                 break;
1364             }
1365             hb_log("hb_ts_stream_decode: sync lost @%lld, regained after %lld bytes",
1366                     pos, pos2 );
1367                         continue;
1368                 }
1369
1370                 // Get pid
1371                 int pid = (((buf[1] & 0x1F) << 8) | buf[2]) & 0x1FFF;
1372
1373         if ((pid == 0x0000) && (stream->ts_number_pat_entries == 0))
1374                 {
1375                   decode_PAT(buf, stream);
1376                   continue;
1377                 }
1378
1379                 int pat_index = 0;
1380                 for (pat_index = 0; pat_index < stream->ts_number_pat_entries; pat_index++)
1381                 {
1382                         // There are some streams where the PAT table has multiple entries as if their are
1383                         // multiple programs in the same transport stream, and yet there's actually only one
1384                         // program really in the stream. This seems to be true for transport streams that
1385                         // originate in the HDHomeRun but have been output by EyeTV's export utility. What I think
1386                         // is happening is that the HDHomeRun is sending the entire transport stream as broadcast,
1387                         // but the EyeTV is only recording a single (selected) program number and not rewriting the
1388                         // PAT info on export to match what's actually on the stream.
1389                         // Until we have a way of handling multiple programs per transport stream elegantly we'll match
1390                         // on the first pat entry for which we find a matching program map PID.  The ideal solution would
1391                         // be to build a title choice popup from the PAT program number details and then select from
1392                         // their - but right now the API's not capable of that.
1393                         if (pid == stream->pat_info[pat_index].program_map_PID)
1394                         {
1395                           if (build_program_map(buf, stream) > 0)
1396                                 break;
1397                         }
1398                 }
1399                 // Keep going  until we have a complete set of PIDs
1400                 if ((stream->ts_number_video_pids > 0) && (stream->ts_number_audio_pids > 0))
1401                   break;
1402         }
1403
1404         hb_log("hb_ts_stream_find_pids - found the following PIDS");
1405         hb_log("    Video PIDS : ");
1406         int i=0;
1407         for (i=0; i < stream->ts_number_video_pids; i++)
1408         {
1409                 hb_log("      0x%x (%d)", stream->ts_video_pids[i], stream->ts_video_pids[i]);
1410         }
1411         hb_log("    Audio PIDS : ");
1412         for (i = 0; i < stream->ts_number_audio_pids; i++)
1413         {
1414                 hb_log("      0x%x (%d)", stream->ts_audio_pids[i], stream->ts_audio_pids[i]);
1415         }
1416  }
1417
1418
1419 static void fwrite64( hb_stream_t *stream, void *buf, int size )
1420 {
1421     if ( (stream->fwrite_buf - stream->fwrite_buf_orig) + size > 2048 )
1422     {
1423         hb_log( "steam fwrite64 buffer overflow - writing %d with %d already",
1424                 size, stream->fwrite_buf - stream->fwrite_buf_orig );
1425         return;
1426     }
1427     memcpy( stream->fwrite_buf, buf, size );
1428     stream->fwrite_buf += size;
1429 }
1430
1431 static void write_pack(hb_stream_t* stream, uint64_t time, int stuffing)
1432 {
1433         uint8_t buf[24];
1434
1435     buf[0] = 0x00;      // pack id
1436     buf[1] = 0x00;
1437     buf[2] = 0x01;
1438     buf[3] = 0xba;
1439
1440     buf[4] = 0x44 |     // SCR
1441              ( ( ( time >> 30 ) & 7 ) << 3 ) |
1442              ( ( time >> 28 ) & 3 );
1443     buf[5] = time >> 20;
1444     buf[6] = 0x04 |
1445              ( ( ( time >> 15 ) & 0x1f ) << 3 ) |
1446              ( ( time >> 13 ) & 3 );
1447     buf[7] = time >> 5;
1448     buf[8] = 0x04 | ( time << 3 );
1449
1450     buf[9] = 0x01;      // SCR extension
1451
1452     buf[10] = 384000 >> (22 - 8);     // program mux rate
1453     buf[11] = (uint8_t)( 384000 >> (22 - 16) );
1454     buf[12] = (uint8_t)( 384000 << 2 ) | 0x03;
1455
1456     buf[13] = 0xf8 | stuffing;
1457
1458     int i;
1459     for (i = 0; i < stuffing; ++i )
1460         buf[14+i] = 0xff;
1461
1462         fwrite64(stream, buf, 14 + stuffing );
1463 }
1464
1465 static void pad_buffer(hb_stream_t* stream, int pad)
1466 {
1467         pad -= 6;
1468
1469         uint8_t buf[6];
1470         buf[0] = 0;
1471     buf[1] = 0;
1472     buf[2] = 0;
1473     buf[3] = 0xbe;
1474         buf[4] = pad >> 8;
1475     buf[5] = pad;
1476
1477         fwrite64(stream, buf, 6);
1478
1479         buf[0] = 0xff;
1480     while ( --pad >= 0 )
1481     {
1482                 fwrite64(stream, buf, 1);
1483         }
1484 }
1485
1486 static void make_pes_header(hb_stream_t* stream, int len, uint8_t streamid)
1487 {
1488         uint8_t buf[9];
1489
1490     memset(buf, 0, sizeof(buf) );
1491     buf[2] = 1;
1492     buf[3] = streamid;
1493     buf[4] = ( len + 3 ) >> 8;
1494     buf[5] = len + 3;
1495     buf[6] = 0x88;
1496
1497     fwrite64(stream, buf, 9);
1498 }
1499
1500 static void generate_output_data(hb_stream_t *stream, int curstream)
1501 {
1502     uint8_t *tdat = stream->ts_buf[curstream];
1503     int len;
1504
1505     // we always ship a PACK header plus all the data in our demux buf.
1506     // AC3 audio also always needs it substream header.
1507     len = 14 + stream->ts_pos[curstream];
1508     if ( stream->ts_audio_stream_type[curstream] == 0x81)
1509     {
1510         len += 4;
1511     }
1512
1513     if ( ! stream->ts_start[curstream] )
1514     {
1515         // we're in the middle of a chunk of PES data - we need to add
1516         // a 'continuation' PES header after the PACK header.
1517         len += 9;
1518     }
1519
1520     // Write out pack header
1521     // If we don't have 2048 bytes we need to pad to 2048. We can
1522     // add a padding frame after our data but we need at least 7
1523     // bytes of space to do it (6 bytes of header & 1 of pad). If
1524     // we have fewer than 7 bytes left we need to fill the excess
1525     // space with stuffing bytes added to the pack header.
1526     int stuffing = 0;
1527     if ( len > HB_DVD_READ_BUFFER_SIZE )
1528     {
1529         hb_log( "stream ts length botch %d", len );
1530     }
1531     if ( HB_DVD_READ_BUFFER_SIZE - len < 8)
1532     {
1533         stuffing = HB_DVD_READ_BUFFER_SIZE - len;
1534     }
1535     write_pack(stream, stream->ts_nextpcr, stuffing );
1536     stream->ts_nextpcr += 10;
1537
1538     if ( stream->ts_start[curstream] )
1539     {
1540         // Start frames already have a PES header but we have modify it
1541         // to map from TS PID to PS stream id. Also, if the stream is AC3
1542         // audio we have to insert an AC3 stream header between the end of
1543         // the PES header and the start of the stream data.
1544
1545         stream->ts_start[curstream] = 0;
1546         tdat[3] = stream->ts_streamid[curstream];
1547
1548         uint16_t plen = stream->ts_pos[curstream] - 6;
1549         if ( stream->ts_audio_stream_type[curstream] == 0x81)
1550         {
1551             // We have to add an AC3 header in front of the data. Add its
1552             // size to the PES packet length.
1553             plen += 4;
1554             tdat[4] = plen >> 8;
1555             tdat[5] = plen;
1556
1557             // Write out the PES header
1558             int hdrsize = 9 + tdat[8];
1559             fwrite64(stream, tdat, hdrsize);
1560
1561             // add a four byte DVD ac3 stream header
1562             uint8_t ac3_substream_id[4];
1563             int ssid = (curstream - stream->ts_number_video_pids) & 0xf;
1564             ac3_substream_id[0] = 0x80 | ssid;  // substream id
1565             ac3_substream_id[1] = 0x01;         // number of sync words
1566             ac3_substream_id[2] = 0x00;         // first offset (16 bits)
1567             ac3_substream_id[3] = 0x02;
1568             fwrite64(stream, ac3_substream_id, 4);
1569
1570             // add the rest of the data
1571             fwrite64(stream, tdat + hdrsize, stream->ts_pos[curstream] - hdrsize);
1572         }
1573         else
1574         {
1575             // not audio - don't need to modify the stream so write what we've got
1576             tdat[4] = plen >> 8;
1577             tdat[5] = plen;
1578             fwrite64( stream,  tdat, stream->ts_pos[curstream] );
1579         }
1580     }
1581     else
1582     {
1583         // data without a PES start header needs a simple 'continuation'
1584         // PES header. AC3 audio also needs its substream header.
1585         if ( stream->ts_audio_stream_type[curstream] != 0x81)
1586         {
1587             make_pes_header(stream, stream->ts_pos[curstream],
1588                             stream->ts_streamid[curstream]);
1589         }
1590         else
1591         {
1592             make_pes_header(stream, stream->ts_pos[curstream] + 4,
1593                             stream->ts_streamid[curstream]);
1594
1595             // add a four byte DVD ac3 stream header
1596             uint8_t ac3_substream_id[4];
1597             int ssid = (curstream - stream->ts_number_video_pids) & 0xf;
1598             ac3_substream_id[0] = 0x80 | ssid;  // substream id
1599             ac3_substream_id[1] = 0x01;         // number of sync words
1600             ac3_substream_id[2] = 0x00;         // first offset (16 bits)
1601             ac3_substream_id[3] = 0x02;
1602             fwrite64(stream, ac3_substream_id, 4);
1603         }
1604         fwrite64( stream, tdat, stream->ts_pos[curstream] );
1605     }
1606
1607     // Write padding
1608     int left = HB_DVD_READ_BUFFER_SIZE - len;
1609     if ( left >= 8 )
1610     {
1611         pad_buffer(stream, left);
1612     }
1613
1614     stream->ts_pos[curstream] = 0;
1615 }
1616
1617 static void ts_warn_helper( hb_stream_t *stream, char *log, va_list args )
1618 {
1619     // limit error printing to at most one per minute of video (at 30fps)
1620     ++stream->errors;
1621     if ( stream->frames - stream->last_error_frame >= 30*60 )
1622     {
1623         char msg[256];
1624
1625         vsnprintf( msg, sizeof(msg), log, args );
1626
1627         if ( stream->errors - stream->last_error_count < 10 )
1628         {
1629             hb_log( "stream: error near frame %d: %s", stream->frames, msg );
1630         }
1631         else
1632         {
1633             int Edelta = stream->errors - stream->last_error_count;
1634             double Epcnt = (double)Edelta * 100. /
1635                             (stream->frames - stream->last_error_frame);
1636             hb_log( "stream: %d new errors (%.0f%%) up to frame %d: %s",
1637                     Edelta, Epcnt, stream->frames, msg );
1638         }
1639         stream->last_error_frame = stream->frames;
1640         stream->last_error_count = stream->errors;
1641     }
1642 }
1643
1644 static void ts_warn( hb_stream_t *stream, char *log, ... )
1645 {
1646     va_list     args;
1647     va_start( args, log );
1648     ts_warn_helper( stream, log, args );
1649     va_end( args );
1650 }
1651
1652 static void ts_err( hb_stream_t *stream, int curstream, char *log, ... )
1653 {
1654     va_list     args;
1655     va_start( args, log );
1656     ts_warn_helper( stream, log, args );
1657     va_end( args );
1658
1659     stream->ts_skipbad[curstream] = 1;
1660     stream->ts_pos[curstream] = 0;
1661     stream->ts_streamcont[curstream] = -1;
1662 }
1663
1664 static int isIframe( const uint8_t *buf, int adapt_len )
1665 {
1666     // Look for the Group of Pictures packet
1667     int i;
1668     uint32_t strid = 0;
1669
1670     for (i = 4 + adapt_len; i < 188; i++)
1671     {
1672         strid = (strid << 8) | buf[i];
1673         switch ( strid )
1674         {
1675             case 0x000001B8: // group_start_code (GOP header)
1676             case 0x000001B3: // sequence_header code
1677                 return 1;
1678
1679             case 0x00000100: // picture_start_code
1680                 // picture_header, let's see if it's an I-frame
1681                 if (i<185)
1682                 {
1683                     // check if picture_coding_type == 1
1684                     if ((buf[i+2] & (0x7 << 3)) == (1 << 3))
1685                     {
1686                         // found an I-frame picture
1687                         return 1;
1688                     }
1689                 }
1690                 break;
1691         }
1692     }
1693     // didn't find an I frame
1694     return 0;
1695 }
1696
1697 /***********************************************************************
1698  * hb_ts_stream_decode
1699  ***********************************************************************
1700  *
1701  **********************************************************************/
1702 static int hb_ts_stream_decode( hb_stream_t *stream, uint8_t *obuf )
1703 {
1704     int64_t pcr = stream->ts_lastpcr;
1705         int curstream;
1706         uint8_t buf[188];
1707
1708     /*
1709      * stash the output buffer pointer in our stream so we don't have to
1710      * pass it & its original value to everything we call.
1711      */
1712     stream->fwrite_buf = obuf;
1713     stream->fwrite_buf_orig = obuf;
1714
1715         // spin until we get a packet of data from some stream or hit eof
1716         while ( 1 )
1717         {
1718         if ((fread(buf, 188, 1, stream->file_handle)) != 1)
1719                 {
1720             // end of file - we didn't finish filling our ps write buffer
1721             // so just discard the remainder (the partial buffer is useless)
1722             hb_log("hb_ts_stream_decode - eof");
1723             return 0;
1724                 }
1725
1726         /* This next section validates the packet */
1727
1728                 // Check sync byte
1729                 if ((buf[0] != 0x47) && (buf[0] != 0x72) && (buf[0] != 0x29))
1730                 {
1731             // lost sync - back up to where we started then try to
1732             // re-establish sync.
1733             off_t pos = ftello(stream->file_handle) - 188;
1734             off_t pos2 = align_to_next_packet(stream->file_handle);
1735             if ( pos2 == 0 )
1736             {
1737                 hb_log( "hb_ts_stream_decode: eof while re-establishing sync @ %lld",
1738                         pos );
1739                 return 0;
1740             }
1741             ts_warn( stream, "hb_ts_stream_decode: sync lost @%lld, "
1742                      "regained after %lld bytes", pos, pos2 );
1743                         continue;
1744                 }
1745
1746                 // Get pid and use it to find stream state.
1747                 int pid = ((buf[1] & 0x1F) << 8) | buf[2];
1748         if ( ( curstream = index_of_pid( pid, stream ) ) < 0 )
1749             continue;
1750
1751                 // Get error
1752                 int errorbit = (buf[1] & 0x80) != 0;
1753                 if (errorbit)
1754                 {
1755                         ts_err( stream, curstream,  "packet error bit set");
1756                         continue;
1757                 }
1758
1759                 // Get adaption header info
1760                 int adaption = (buf[3] & 0x30) >> 4;
1761                 int adapt_len = 0;
1762                 if (adaption == 0)
1763                 {
1764                         ts_err( stream, curstream,  "adaptation code 0");
1765                         continue;
1766                 }
1767                 else if (adaption == 0x2)
1768                         adapt_len = 184;
1769                 else if (adaption == 0x3)
1770                 {
1771                         adapt_len = buf[4] + 1;
1772                         if (adapt_len > 184)
1773                         {
1774                                 ts_err( stream, curstream,  "invalid adapt len %d", adapt_len);
1775                 continue;
1776                         }
1777                 }
1778
1779         // if there's an adaptation header & PCR_flag is set
1780         // get the PCR (Program Clock Reference)
1781         if ( adapt_len > 7 && ( buf[5] & 0x10 ) != 0 )
1782         {
1783             pcr = ( (uint64_t)buf[6] << (33 - 8) ) |
1784                   ( (uint64_t)buf[7] << (33 - 16) ) |
1785                   ( (uint64_t)buf[8] << (33 - 24) ) |
1786                   ( (uint64_t)buf[9] << (33 - 32) ) |
1787                   ( buf[10] >> 7 );
1788             stream->ts_nextpcr = pcr;
1789
1790             // remember the pcr across calls to this routine
1791             stream->ts_lastpcr = pcr;
1792         }
1793
1794                 if ( pcr == -1 )
1795                 {
1796             // don't accumulate data until we get a pcr
1797                     continue;
1798                 }
1799
1800                 // Get continuity
1801         // Continuity only increments for adaption values of 0x3 or 0x01
1802         // and is not checked for start packets.
1803
1804                 int start = (buf[1] & 0x40) != 0;
1805
1806         if ( (adaption & 0x01) != 0 )
1807                 {
1808             int continuity = (buf[3] & 0xF);
1809             if ( continuity == stream->ts_streamcont[curstream] )
1810             {
1811                 // we got a duplicate packet (usually used to introduce
1812                 // a PCR when one is needed). The only thing that can
1813                 // change in the dup is the PCR which we grabbed above
1814                 // so ignore the rest.
1815                 continue;
1816             }
1817             if ( !start && (stream->ts_streamcont[curstream] != -1) &&
1818                  (continuity != ( (stream->ts_streamcont[curstream] + 1) & 0xf ) ) )
1819                         {
1820                                 ts_err( stream, curstream,  "continuity error: got %d expected %d",
1821                         (int)continuity,
1822                         (stream->ts_streamcont[curstream] + 1) & 0xf );
1823                 stream->ts_streamcont[curstream] = continuity;
1824                                 continue;
1825                         }
1826                         stream->ts_streamcont[curstream] = continuity;
1827                 }
1828
1829         /* If we get here the packet is valid - process its data */
1830
1831         if ( start )
1832         {
1833             // Found a random access point (now we can start a frame/audio packet..)
1834
1835                         // If we were skipping a bad packet, start fresh on this new PES packet..
1836                         if (stream->ts_skipbad[curstream] == 1)
1837                         {
1838                 // video skips to an iframe after a bad packet to minimize
1839                 // screen corruption
1840                 if ( curstream == 0 && !isIframe( buf, adapt_len ) )
1841                 {
1842                     continue;
1843                 }
1844                                 stream->ts_skipbad[curstream] = 0;
1845                         }
1846
1847                         // If we don't have video yet, check to see if this is an
1848             // i_frame (group of picture start)
1849                         if ( curstream == 0 )
1850             {
1851                 if ( !stream->ts_foundfirst[0] )
1852                 {
1853                     if ( !isIframe( buf, adapt_len ) )
1854                     {
1855                         // didn't find an I frame
1856                         continue;
1857                     }
1858                     stream->ts_foundfirst[0] = 1;
1859                 }
1860                 ++stream->frames;
1861             }
1862                         else if ( ! stream->ts_foundfirst[curstream] )
1863             {
1864                 // start other streams only after first video frame found.
1865                 if ( ! stream->ts_foundfirst[0] )
1866                 {
1867                     continue;
1868                 }
1869                 stream->ts_foundfirst[curstream] = 1;
1870                         }
1871
1872             // If we have some data already on this stream, turn it into
1873             // a program stream packet. Then add the payload for this
1874             // packet to the current pid's buffer.
1875             if ( stream->ts_pos[curstream] )
1876             {
1877                 generate_output_data(stream, curstream);
1878                 stream->ts_start[curstream] = 1;
1879                 memcpy(stream->ts_buf[curstream],
1880                        buf + 4 + adapt_len, 184 - adapt_len);
1881                 stream->ts_pos[curstream] = 184 - adapt_len;
1882                 return 1;
1883             }
1884             stream->ts_start[curstream] = 1;
1885         }
1886
1887                 // Add the payload for this packet to the current buffer
1888                 if (!stream->ts_skipbad[curstream] && stream->ts_foundfirst[curstream] &&
1889             (184 - adapt_len) > 0)
1890                 {
1891                         memcpy(stream->ts_buf[curstream] + stream->ts_pos[curstream],
1892                    buf + 4 + adapt_len, 184 - adapt_len);
1893                         stream->ts_pos[curstream] += 184 - adapt_len;
1894
1895             // if the next TS packet could possibly overflow our 2K output buffer
1896             // we need to generate a packet now. Overflow would be 184 bytes of
1897             // data + the 9 byte PES hdr + the 14 byte PACK hdr = 211 bytes.
1898             if ( stream->ts_pos[curstream] >= (HB_DVD_READ_BUFFER_SIZE - 216) )
1899             {
1900                 // we have enough data to make a PS packet
1901                 generate_output_data(stream, curstream);
1902                 return 1;
1903             }
1904                 }
1905         }
1906 }
1907
1908 /***********************************************************************
1909  * hb_ts_stream_reset
1910  ***********************************************************************
1911  *
1912  **********************************************************************/
1913 static void hb_ts_stream_reset(hb_stream_t *stream)
1914 {
1915         int i;
1916
1917         for (i=0; i < kMaxNumberDecodeStreams; i++)
1918         {
1919                 stream->ts_pos[i] = 0;
1920                 stream->ts_foundfirst[i] = 0;
1921                 stream->ts_skipbad[i] = 0;
1922                 stream->ts_streamcont[i] = -1;
1923                 stream->ts_start[i] = 0;
1924         }
1925
1926     stream->ts_lastpcr = -1;
1927     stream->ts_nextpcr = -1;
1928
1929     stream->frames = 0;
1930     stream->errors = 0;
1931     stream->last_error_frame = -10000;
1932     stream->last_error_count = 0;
1933
1934         align_to_next_packet(stream->file_handle);
1935 }
1936