mp4.c 42.7 KB
Newer Older
1 2 3 4
/*****************************************************************************
 * mp4.c : MP4 file input module for vlc
 *****************************************************************************
 * Copyright (C) 2001 VideoLAN
5
 * $Id: mp4.c,v 1.17 2003/02/07 01:22:55 fenrir Exp $
6
 * Authors: Laurent Aimar <fenrir@via.ecp.fr>
7
 *
8 9 10 11
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
12
 *
13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA  02111, USA.
 *****************************************************************************/

/*****************************************************************************
 * Preamble
 *****************************************************************************/
#include <stdlib.h>                                      /* malloc(), free() */
#include <string.h>                                              /* strdup() */
#include <errno.h>
#include <sys/types.h>

#include <vlc/vlc.h>
#include <vlc/input.h>
33
#include "codecs.h"
34 35 36 37 38 39 40 41 42 43
#include "libmp4.h"
#include "mp4.h"

/*****************************************************************************
 * Local prototypes
 *****************************************************************************/
static int    MP4Init    ( vlc_object_t * );
static void __MP4End     ( vlc_object_t * );
static int    MP4Demux   ( input_thread_t * );

44 45 46
/* New input could have something like that... */
static int   MP4Seek     ( input_thread_t *, mtime_t );

47 48 49 50 51 52 53 54 55 56 57 58
#define MP4End(a) __MP4End(VLC_OBJECT(a))

/*****************************************************************************
 * Module descriptor
 *****************************************************************************/
vlc_module_begin();
    set_description( "MP4 demuxer" );
    set_capability( "demux", 242 );
    set_callbacks( MP4Init, __MP4End );
vlc_module_end();

/*****************************************************************************
59
 * Declaration of local function
60
 *****************************************************************************/
61 62 63

static int MP4_TrackSynchro( input_thread_t *p_input, track_data_mp4_t *p_track );

64 65 66 67 68 69 70 71 72 73 74 75
static void MP4_ParseTrack();

static int MP4_CreateChunksIndex();
static int MP4_CreateSamplesIndex();

static void MP4_StartDecoder();
static void MP4_StopDecoder();

static int  MP4_ReadSample();
static int  MP4_DecodeSample();

#define MP4_Set4BytesLE( p, dw ) \
76 77 78 79
    *((uint8_t*)p)   = ( (dw)&0xff ); \
    *((uint8_t*)p+1) = ( ((dw)>> 8)&0xff ); \
    *((uint8_t*)p+2) = ( ((dw)>>16)&0xff ); \
    *((uint8_t*)p+3) = ( ((dw)>>24)&0xff )
80 81

#define MP4_Set2BytesLE( p, dw ) \
82 83
    *((uint8_t*)p) = ( (dw)&0xff ); \
    *((uint8_t*)p+1) = ( ((dw)>> 8)&0xff )
84

85

86 87 88 89
/*****************************************************************************
 * MP4Init: check file and initializes MP4 structures
 *****************************************************************************/
static int MP4Init( vlc_object_t * p_this )
90
{
91 92
    input_thread_t  *p_input = (input_thread_t *)p_this;
    uint8_t         *p_peek;
93

94
    demux_sys_t     *p_demux;
95

96
    MP4_Box_t       *p_ftyp;
97 98


99 100
    MP4_Box_t       *p_mvhd;
    MP4_Box_t       *p_trak;
101

102
    unsigned int    i;
103 104 105 106 107
    /* I need to seek */
    if( !p_input->stream.b_seekable )
    {
        msg_Warn( p_input, "MP4 plugin discarded (unseekable)" );
        return( -1 );
108 109

    }
110 111 112 113 114 115 116 117 118 119 120 121 122 123 124
    /* Initialize access plug-in structures. */
    if( p_input->i_mtu == 0 )
    {
        /* Improve speed. */
        p_input->i_bufsize = INPUT_DEFAULT_BUFSIZE ;
    }

    p_input->pf_demux = MP4Demux;

    /* a little test to see if it could be a mp4 */
    if( input_Peek( p_input, &p_peek, 8 ) < 8 )
    {
        msg_Warn( p_input, "MP4 plugin discarded (cannot peek)" );
        return( -1 );
    }
125

126

127
    switch( VLC_FOURCC( p_peek[4], p_peek[5], p_peek[6], p_peek[7] ) )
128 129 130 131 132
    {
        case( FOURCC_ftyp ):
        case( FOURCC_moov ):
        case( FOURCC_moof ):
        case( FOURCC_mdat ):
133
        case( FOURCC_udta ):
134 135
        case( FOURCC_free ):
        case( FOURCC_skip ):
136
        case( FOURCC_wide ):
137 138 139 140 141 142 143
            break;
         default:
            msg_Warn( p_input, "MP4 plugin discarded (not a valid file)" );
            return( -1 );
    }

    /* create our structure that will contains all data */
144
    if( !( p_input->p_demux_data =
145
                p_demux = malloc( sizeof( demux_sys_t ) ) ) )
146 147 148 149
    {
        msg_Err( p_input, "out of memory" );
        return( -1 );
    }
150
    memset( p_demux, 0, sizeof( demux_sys_t ) );
151
    p_input->p_demux_data = p_demux;
152

153 154

    /* Now load all boxes ( except raw data ) */
155
    if( !MP4_BoxGetRoot( p_input, &p_demux->box_root ) )
156 157 158 159 160
    {
        msg_Warn( p_input, "MP4 plugin discarded (not a valid file)" );
        return( -1 );
    }

161
    MP4_BoxDumpStructure( p_input, &p_demux->box_root );
162

163
    if( ( p_ftyp = MP4_BoxGet( &p_demux->box_root, "/ftyp" ) ) )
164 165 166 167
    {
        switch( p_ftyp->data.p_ftyp->i_major_brand )
        {
            case( FOURCC_isom ):
168
                msg_Dbg( p_input,
169 170
                         "ISO Media file (isom) version %d.",
                         p_ftyp->data.p_ftyp->i_minor_version );
171 172
                break;
            default:
173
                msg_Dbg( p_input,
174 175
                         "unrecognized major file specification (%4.4s).",
                          (char*)&p_ftyp->data.p_ftyp->i_major_brand );
176 177 178 179 180
                break;
        }
    }
    else
    {
181
        msg_Dbg( p_input, "file type box missing (assuming ISO Media file)" );
182 183 184
    }

    /* the file need to have one moov box */
185
    if( MP4_BoxCount( &p_demux->box_root, "/moov" ) != 1 )
186
    {
187
        msg_Err( p_input,
188
                 "MP4 plugin discarded (%d moov boxes)",
189
                 MP4_BoxCount( &p_demux->box_root, "/moov" ) );
190 191
//        MP4End( p_input );
//        return( -1 );
192 193
    }

194
    if( !(p_mvhd = MP4_BoxGet( &p_demux->box_root, "/moov/mvhd" ) ) )
195
    {
196
        msg_Err( p_input, "cannot find /moov/mvhd" );
197 198 199 200 201 202
        MP4End( p_input );
        return( -1 );
    }
    else
    {
        p_demux->i_timescale = p_mvhd->data.p_mvhd->i_timescale;
203
        p_demux->i_duration = p_mvhd->data.p_mvhd->i_duration;
204
    }
205

206
    if( !( p_demux->i_tracks =
207
                MP4_BoxCount( &p_demux->box_root, "/moov/trak" ) ) )
208
    {
209
        msg_Err( p_input, "cannot find any /moov/trak" );
210 211 212
        MP4End( p_input );
        return( -1 );
    }
213 214 215
    msg_Dbg( p_input, "find %d track%c",
                        p_demux->i_tracks,
                        p_demux->i_tracks ? 's':' ' );
216 217 218 219 220 221 222

    /* allocate memory */
    p_demux->track = calloc( p_demux->i_tracks, sizeof( track_data_mp4_t ) );

    /* now process each track and extract all usefull informations */
    for( i = 0; i < p_demux->i_tracks; i++ )
    {
223
        p_trak = MP4_BoxGet( &p_demux->box_root, "/moov/trak[%d]", i );
224 225 226 227 228 229 230 231 232 233 234 235 236 237
        MP4_ParseTrack( p_input, &p_demux->track[i], p_trak );

        if( p_demux->track[i].b_ok )
        {
            char *psz_cat;
            switch( p_demux->track[i].i_cat )
            {
                case( VIDEO_ES ):
                    psz_cat = "video";
                    break;
                case( AUDIO_ES ):
                    psz_cat = "audio";
                    break;
                default:
238
                    psz_cat = "unknown";
239 240
                    break;
            }
241

242 243
            msg_Dbg( p_input, "adding track[Id 0x%x] %s (%s) language %c%c%c",
                            p_demux->track[i].i_track_ID,
244 245 246
                            psz_cat,
                            p_demux->track[i].b_enable ? "enable":"disable",
                            p_demux->track[i].i_language[0],
247
                            p_demux->track[i].i_language[1],
248 249 250 251
                            p_demux->track[i].i_language[2] );
        }
        else
        {
252
            msg_Dbg( p_input, "ignoring track[Id 0x%x]", p_demux->track[i].i_track_ID );
253 254 255
        }

    }
256

257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273
    /*  create one program */
    vlc_mutex_lock( &p_input->stream.stream_lock );
    if( input_InitStream( p_input, 0 ) == -1)
    {
        vlc_mutex_unlock( &p_input->stream.stream_lock );
        msg_Err( p_input, "cannot init stream" );
        MP4End( p_input );
        return( -1 );
    }
    if( input_AddProgram( p_input, 0, 0) == NULL )
    {
        vlc_mutex_unlock( &p_input->stream.stream_lock );
        msg_Err( p_input, "cannot add program" );
        MP4End( p_input );
        return( -1 );
    }
    p_input->stream.p_selected_program = p_input->stream.pp_programs[0];
274
    /* XXX beurk and beurk, see MP4Demux and MP4Seek */
275 276
    if( p_demux->i_duration/p_demux->i_timescale > 0 )
    {
277 278
        p_input->stream.i_mux_rate =
            p_input->stream.p_selected_area->i_size / 50 /
279 280 281 282 283 284
            ( p_demux->i_duration / p_demux->i_timescale );
    }
    else
    {
        p_input->stream.i_mux_rate = 0;
    }
285
    vlc_mutex_unlock( &p_input->stream.stream_lock );
286 287


288 289 290 291 292 293 294 295 296 297 298 299
    for( i = 0; i < p_demux->i_tracks; i++ )
    {
        /* start decoder for this track if enable by default*/
        if( p_demux->track[i].b_enable )
        {
            MP4_StartDecoder( p_input, &p_demux->track[i] );
        }
    }

    vlc_mutex_lock( &p_input->stream.stream_lock );
    p_input->stream.p_selected_program->b_is_ok = 1;
    vlc_mutex_unlock( &p_input->stream.stream_lock );
300 301

    return( 0 );
302 303 304 305

}

/*****************************************************************************
306
 * MP4Demux: read packet and send them to decoders
307 308
 *****************************************************************************
 * TODO check for newly selected track (ie audio upt to now )
309 310 311
 *****************************************************************************/
static int MP4Demux( input_thread_t *p_input )
{
312
    demux_sys_t *p_demux = p_input->p_demux_data;
313
    unsigned int i_track;
314

315
    /* XXX beurk, beuRK and BEURK,
316 317 318 319
       but only way I've found to detect seek from interface */
    if( p_input->stream.p_selected_program->i_synchro_state == SYNCHRO_REINIT )
    {
        mtime_t i_date;
320

321 322 323 324
        /* first wait for empty buffer, arbitrary time FIXME */
        msleep( DEFAULT_PTS_DELAY );
        /* *** calculate new date *** */

325
        i_date = (mtime_t)1000000 *
326
                 (mtime_t)p_demux->i_duration /
327
                 (mtime_t)p_demux->i_timescale *
328 329 330 331
                 (mtime_t)MP4_TellAbsolute( p_input ) /
                 (mtime_t)p_input->stream.p_selected_area->i_size;
        MP4Seek( p_input, i_date );
    }
332

333 334 335 336 337 338 339 340
    /* first wait for the good time to read a packet */
    input_ClockManageRef( p_input,
                          p_input->stream.p_selected_program,
                          p_demux->i_pcr );


    /* update pcr XXX in mpeg scale so in 90000 unit/s */
    p_demux->i_pcr = MP4_GetMoviePTS( p_demux ) * 9 / 100;
341

342 343 344

    /* we will read 100ms for each stream so ...*/
    p_demux->i_time += __MAX( p_demux->i_timescale / 10 , 1 );
345

346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370

    for( i_track = 0; i_track < p_demux->i_tracks; i_track++ )
    {
        if( ( !p_demux->track[i_track].b_ok )||
            ( !p_demux->track[i_track].p_es )||
            ( !p_demux->track[i_track].p_es->p_decoder_fifo )||
            ( MP4_GetTrackPTS( &p_demux->track[i_track] ) >=
                        MP4_GetMoviePTS( p_demux ) ) )
        {
            continue; /* no need to read something */
        }
        while( MP4_GetTrackPTS( &p_demux->track[i_track] ) <
                        MP4_GetMoviePTS( p_demux ) )
        {

            pes_packet_t *p_pes;

            /* read a sample */
            if( !MP4_ReadSample( p_input ,
                                 &p_demux->track[i_track],
                                 &p_pes ) )
            {
                break;
            }

371
            /* send it to decoder and update time of this track
372 373 374 375 376 377 378
                 it also launch a new decoder if needed */
            MP4_DecodeSample( p_input ,
                              &p_demux->track[i_track],
                              p_pes );
        }

    }
379

380
    /* now check if all tracks are finished or unhandled*/
381

382 383 384 385 386 387 388 389 390 391 392 393 394
    for( i_track = 0; i_track < p_demux->i_tracks; i_track++ )
    {
        if( ( p_demux->track[i_track].b_ok )&&
            ( p_demux->track[i_track].i_sample < p_demux->track[i_track].i_sample_count )&&
            ( p_demux->track[i_track].p_es )&&
            ( p_demux->track[i_track].p_es->p_decoder_fifo ) )
        {
            return( 1 );
        }
    }

    return( 0 ); /* EOF */
}
395 396 397 398 399 400
/*****************************************************************************
 * MP4Seek: Got to i_date
 ******************************************************************************/
static int   MP4Seek     ( input_thread_t *p_input, mtime_t i_date )
{
    demux_sys_t *p_demux = p_input->p_demux_data;
401
    unsigned int i_track;
402 403 404 405

    /* First update update global time */
    p_demux->i_time = i_date * p_demux->i_timescale / 1000000;
    p_demux->i_pcr = __MAX( MP4_GetMoviePTS( p_demux ) - DEFAULT_PTS_DELAY,
406 407
                            0 ) * 9 / 100;

408 409 410 411 412 413 414
    /* Now for each stream try to go to this time */
    for( i_track = 0; i_track < p_demux->i_tracks; i_track++ )
    {
        MP4_TrackSynchro( p_input, &p_demux->track[i_track] );
    }
    return( 1 );
}
415 416 417 418 419

/*****************************************************************************
 * MP4End: frees unused data
 *****************************************************************************/
static void __MP4End ( vlc_object_t * p_this )
420
{
421
#define FREE( p ) \
422 423
    if( p ) { free( p ); }
    unsigned int i_track;
424
    input_thread_t *  p_input = (input_thread_t *)p_this;
425
    demux_sys_t *p_demux = p_input->p_demux_data;
426

427
    msg_Dbg( p_input, "freeing all memory" );
428
    MP4_BoxFree( p_input, &p_demux->box_root );
429 430
    for( i_track = 0; i_track < p_demux->i_tracks; i_track++ )
    {
431 432
        unsigned int i_chunk;
        for( i_chunk = 0;
433 434 435 436 437 438 439 440
                i_chunk < p_demux->track[i_track].i_chunk_count; i_chunk++ )
        {
            if( p_demux->track[i_track].chunk )
            {
               FREE(p_demux->track[i_track].chunk[i_chunk].p_sample_count_dts);
               FREE(p_demux->track[i_track].chunk[i_chunk].p_sample_delta_dts );
            }
        }
441
        FREE( p_demux->track[i_track].chunk );
442 443 444 445 446 447 448

        if( !p_demux->track[i_track].i_sample_size )
        {
            FREE( p_demux->track[i_track].p_sample_size );
        }
    }
    FREE( p_demux->track );
449 450

    FREE( p_input->p_demux_data );
451 452 453 454 455 456 457 458
#undef FREE
}


/****************************************************************************
 * Local functions, specific to vlc
 ****************************************************************************/

459
/****************************************************************************
460
 * MP4_TrackSynchro : synchronize a track with movie time after seek or
461 462 463 464 465 466 467
 *                    for newly selected track
 *****************************************************************************
 * TODO add support of Edit List (edts/elts) and Shadow Sync Sample(stsh)
 ****************************************************************************/
static int MP4_TrackSynchro( input_thread_t *p_input, track_data_mp4_t *p_track )
{
    demux_sys_t *p_demux = p_input->p_demux_data;
468
    unsigned int i_chunk_last;
469 470 471 472 473 474 475 476 477 478 479 480 481 482 483
    MP4_Box_t   *p_stss;

    if( !p_track->b_ok ||
        !p_track->p_es ||
        !p_track->p_es->p_decoder_fifo )
    {
        return( 0 );
    }
    p_track->i_sample = 0;
    i_chunk_last = p_track->i_chunk;
    p_track->i_chunk = 0;
    for( ;; )
    {
        if( p_track->i_sample >= p_track->i_sample_count )
        {
484
            msg_Warn( p_input,
485 486 487 488 489 490 491 492 493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509
                        "track[Id 0x%x] will be disabled (seeking too far)",
                        p_track->i_track_ID );
            MP4_StopDecoder( p_input, p_track );
            break;
        }
        if( MP4_GetTrackPTS( p_track ) >= MP4_GetMoviePTS( p_demux ) )
        {
            break;
        }
        /* go one sample after */
        p_track->i_sample++;
        if( p_track->i_sample >= p_track->chunk[p_track->i_chunk].i_sample_first +
                p_track->chunk[p_track->i_chunk].i_sample_count )
        {
            p_track->i_chunk++;
        }
    }
    if( p_track->i_sample >= p_track->i_sample_count )
    {
        return( 0 );
    }

    /* *** Try to find nearest sync points *** */
    if( ( p_stss = MP4_BoxGet( p_track->p_stbl, "stss" ) ) )
    {
510 511 512
        unsigned int i_index;
        msg_Dbg( p_input,
                    "track[Id 0x%x] using Sync Sample Box (stss)",
513 514 515 516 517 518 519
                    p_track->i_track_ID );
        for( i_index = 0; i_index < p_stss->data.p_stss->i_entry_count; i_index++ )
        {
            if( p_stss->data.p_stss->i_sample_number[i_index] >= p_track->i_sample )
            {
                if( i_index > 0 )
                {
520 521
                    msg_Dbg( p_input, "stts gives %d --> %d (sample number)",
                            p_track->i_sample,
522 523 524
                            p_stss->data.p_stss->i_sample_number[i_index-1] );
                    p_track->i_sample = p_stss->data.p_stss->i_sample_number[i_index-1];
                    /* new track.i_sample is less than old so i_chunk can only decreased */
525
                    while( p_track->i_chunk > 0 &&
526 527 528 529 530 531 532
                            p_track->i_sample < p_track->chunk[p_track->i_chunk].i_sample_first )
                    {
                        p_track->i_chunk--;
                    }
                }
                else
                {
533 534
                    msg_Dbg( p_input, "stts gives %d --> %d (sample number)",
                            p_track->i_sample,
535 536 537 538 539 540 541 542 543 544 545 546 547 548 549 550
                            p_stss->data.p_stss->i_sample_number[i_index-1] );
                    p_track->i_sample = p_stss->data.p_stss->i_sample_number[i_index];
                    /* new track.i_sample is more than old so i_chunk can only increased */
                    while( p_track->i_chunk < p_track->i_chunk_count - 1 &&
                           p_track->i_sample >= p_track->chunk[p_track->i_chunk].i_sample_first +
                                                p_track->chunk[p_track->i_chunk].i_sample_count )
                    {
                        p_track->i_chunk++;
                    }
                }
                break;
            }
        }
    }
    else
    {
551 552
        msg_Dbg( p_input,
                    "track[Id 0x%x] does not provide Sync Sample Box (stss)",
553 554 555 556 557 558 559 560 561 562 563 564 565 566 567
                    p_track->i_track_ID );
    }

    /* *** If i_sample_description_index has changed restart decoder *** */
    if( p_track->chunk[i_chunk_last].i_sample_description_index !=
            p_track->chunk[p_track->i_chunk].i_sample_description_index )
    {
        msg_Warn( p_input,
                "SampleEntry has changed, restarting decoder" );
        MP4_StopDecoder( p_input, p_track );
        MP4_StartDecoder( p_input, p_track );
    }
    return( 1 );
}

568 569 570 571 572 573 574 575
/****************************************************************************
 * Parse track information and create all needed data to run a track
 * If it succeed b_ok is set to 1 else to 0
 ****************************************************************************/
static void MP4_ParseTrack( input_thread_t *p_input,
                     track_data_mp4_t *p_demux_track,
                     MP4_Box_t  * p_trak )
{
576
    unsigned int i;
577

578 579 580
    MP4_Box_t *p_tkhd = MP4_BoxGet( p_trak, "tkhd" );
    MP4_Box_t *p_tref = MP4_BoxGet( p_trak, "tref" );
    MP4_Box_t *p_elst;
581 582 583 584 585

    MP4_Box_t *p_mdhd;
    MP4_Box_t *p_hdlr;

    MP4_Box_t *p_vmhd;
586
    MP4_Box_t *p_smhd;
587 588 589 590 591 592 593 594

    /* hint track unsuported */

    /* by default, track isn't usable */
    p_demux_track->b_ok = 0;

    /* by default, we don't known the categorie */
    p_demux_track->i_cat = UNKNOWN_ES;
595

596
    if( !p_tkhd )
597 598 599 600 601
    {
        return;
    }

    /* do we launch this track by default ? */
602
    p_demux_track->b_enable =
603
        ( ( p_tkhd->data.p_tkhd->i_flags&MP4_TRACK_ENABLED ) != 0 );
604 605 606 607

    p_demux_track->i_track_ID = p_tkhd->data.p_tkhd->i_track_ID;
    p_demux_track->i_width = p_tkhd->data.p_tkhd->i_width / 65536;
    p_demux_track->i_height = p_tkhd->data.p_tkhd->i_height / 65536;
608

609
    if( ( p_elst = MP4_BoxGet( p_trak, "edts/elst" ) ) )
610
    {
611
/*        msg_Warn( p_input, "unhandled box: edts --> FIXME" ); */
612 613
    }

614
    if( p_tref )
615
    {
616
/*        msg_Warn( p_input, "unhandled box: tref --> FIXME" ); */
617
    }
618

619 620
    p_mdhd = MP4_BoxGet( p_trak, "mdia/mdhd" );
    p_hdlr = MP4_BoxGet( p_trak, "mdia/hdlr" );
621

622
    if( ( !p_mdhd )||( !p_hdlr ) )
623 624 625 626 627 628
    {
        return;
    }

    p_demux_track->i_timescale = p_mdhd->data.p_mdhd->i_timescale;

629
    for( i = 0; i < 3; i++ )
630 631 632
    {
        p_demux_track->i_language[i] = p_mdhd->data.p_mdhd->i_language[i];
    }
633
    p_mdhd->data.p_mdhd->i_language[3] = 0;
634

635 636 637
    switch( p_hdlr->data.p_hdlr->i_handler_type )
    {
        case( FOURCC_soun ):
638
            if( !( p_smhd = MP4_BoxGet( p_trak, "mdia/minf/smhd" ) ) )
639 640 641 642 643 644 645
            {
                return;
            }
            p_demux_track->i_cat = AUDIO_ES;
            break;

        case( FOURCC_vide ):
646
            if( !( p_vmhd = MP4_BoxGet( p_trak, "mdia/minf/vmhd" ) ) )
647 648 649 650 651
            {
                return;
            }
            p_demux_track->i_cat = VIDEO_ES;
            break;
652

653 654 655
        default:
            return;
    }
656 657 658
/*  TODO
    add support for:
    p_dinf = MP4_BoxGet( p_minf, "dinf" );
659
*/
660
    if( !( p_demux_track->p_stbl = MP4_BoxGet( p_trak,"mdia/minf/stbl" ) ) )
661 662 663
    {
        return;
    }
664

665
    if( !( p_demux_track->p_stsd = MP4_BoxGet( p_trak,"mdia/minf/stbl/stsd") ) )
666 667 668
    {
        return;
    }
669

670 671 672 673 674
    /* Create chunk  index table */
    if( !MP4_CreateChunksIndex( p_input,p_demux_track  ) )
    {
        return; /* cannot create chunks index */
    }
675

676 677 678 679 680
    /* create sample index table needed for reading and seeking */
    if( !MP4_CreateSamplesIndex( p_input, p_demux_track ) )
    {
        return; /* cannot create samples index */
    }
681 682

    p_demux_track->b_ok = 1;
683 684 685 686 687 688 689 690 691 692
}


/* now create basic chunk data, the rest will be filled by MP4_CreateSamplesIndex */
static int MP4_CreateChunksIndex( input_thread_t *p_input,
                                   track_data_mp4_t *p_demux_track )
{
    MP4_Box_t *p_co64; /* give offset for each chunk, same for stco and co64 */
    MP4_Box_t *p_stsc;

693 694
    unsigned int i_chunk;
    unsigned int i_index, i_last;
695

696
    if( ( !(p_co64 = MP4_BoxGet( p_demux_track->p_stbl, "stco" ) )&&
697
          !(p_co64 = MP4_BoxGet( p_demux_track->p_stbl, "co64" ) ) )||
698
        ( !(p_stsc = MP4_BoxGet( p_demux_track->p_stbl, "stsc" ) ) ))
699 700 701
    {
        return( 0 );
    }
702

703 704 705
    p_demux_track->i_chunk_count = p_co64->data.p_co64->i_entry_count;
    if( !p_demux_track->i_chunk_count )
    {
706
        msg_Warn( p_input, "no chunk defined" );
707 708
        return( 0 );
    }
709
    p_demux_track->chunk = calloc( p_demux_track->i_chunk_count,
710 711 712 713 714
                                   sizeof( chunk_data_mp4_t ) );

    /* first we read chunk offset */
    for( i_chunk = 0; i_chunk < p_demux_track->i_chunk_count; i_chunk++ )
    {
715
        p_demux_track->chunk[i_chunk].i_offset =
716 717 718
                p_co64->data.p_co64->i_chunk_offset[i_chunk];
    }

719 720
    /* now we read index for SampleEntry( soun vide mp4a mp4v ...)
        to be used for the sample XXX begin to 1
721 722 723 724 725 726 727 728 729 730 731 732 733 734 735
        We construct it begining at the end */
    i_last = p_demux_track->i_chunk_count; /* last chunk proceded */
    i_index = p_stsc->data.p_stsc->i_entry_count;
    if( !i_index )
    {
        msg_Warn( p_input, "cannot read chunk table or table empty" );
        return( 0 );
    }

    while( i_index )
    {
        i_index--;
        for( i_chunk = p_stsc->data.p_stsc->i_first_chunk[i_index] - 1;
                i_chunk < i_last; i_chunk++ )
        {
736
            p_demux_track->chunk[i_chunk].i_sample_description_index =
737 738 739 740 741 742 743
                    p_stsc->data.p_stsc->i_sample_description_index[i_index];
            p_demux_track->chunk[i_chunk].i_sample_count =
                    p_stsc->data.p_stsc->i_samples_per_chunk[i_index];
        }
        i_last = p_stsc->data.p_stsc->i_first_chunk[i_index] - 1;
    }

744
    p_demux_track->chunk[0].i_sample_first = 0;
745 746 747
    for( i_chunk = 1; i_chunk < p_demux_track->i_chunk_count; i_chunk++ )
    {
        p_demux_track->chunk[i_chunk].i_sample_first =
748
            p_demux_track->chunk[i_chunk-1].i_sample_first +
749 750
                p_demux_track->chunk[i_chunk-1].i_sample_count;
    }
751 752

    msg_Dbg( p_input,
753 754 755
             "track[Id 0x%x] read %d chunk",
             p_demux_track->i_track_ID,
            p_demux_track->i_chunk_count );
756 757 758 759 760 761 762 763 764 765
    return( 1 );

}



static int MP4_CreateSamplesIndex( input_thread_t *p_input,
                                   track_data_mp4_t *p_demux_track )
{
    MP4_Box_t *p_stts; /* makes mapping between sample and decoding time,
766
                          ctts make same mapping but for composition time,
767
                          not yet used and probably not usefull */
768 769
    MP4_Box_t *p_stsz; /* gives sample size of each samples, there is also stz2
                          that uses a compressed form FIXME make them in libmp4
770 771 772
                          as a unique type */
    /* TODO use also stss and stsh table for seeking */
    /* FIXME use edit table */
773 774
    int64_t i_sample;
    int64_t i_chunk;
775

776 777
    int64_t i_index;
    int64_t i_index_sample_used;
778

779 780
    int64_t i_last_dts;

781 782
    p_stts = MP4_BoxGet( p_demux_track->p_stbl, "stts" );
    p_stsz = MP4_BoxGet( p_demux_track->p_stbl, "stsz" ); /* FIXME and stz2 */
783 784 785 786

    if( ( !p_stts )||( !p_stsz ) )
    {
        msg_Warn( p_input, "cannot read sample table" );
787
        return( 0 );
788
    }
789

790 791 792 793 794 795 796 797 798 799 800 801 802 803
    p_demux_track->i_sample_count = p_stsz->data.p_stsz->i_sample_count;


    /* for sample size, there are 2 case */
    if( p_stsz->data.p_stsz->i_sample_size )
    {
        /* 1: all sample have the same size, so no need to construct a table */
        p_demux_track->i_sample_size = p_stsz->data.p_stsz->i_sample_size;
        p_demux_track->p_sample_size = NULL;
    }
    else
    {
        /* 2: each sample can have a different size */
        p_demux_track->i_sample_size = 0;
804
        p_demux_track->p_sample_size =
805
            calloc( p_demux_track->i_sample_count, sizeof( uint32_t ) );
806

807 808
        for( i_sample = 0; i_sample < p_demux_track->i_sample_count; i_sample++ )
        {
809
            p_demux_track->p_sample_size[i_sample] =
810 811 812 813 814 815 816
                    p_stsz->data.p_stsz->i_entry_size[i_sample];
        }
    }
    /* we have extract all information from stsz,
        now use stts */

    /* if we don't want to waste too much memory, we can't expand
817
       the box !, so each chunk will contain an "extract" of this table
818
       for fast research */
819

820 821
    i_last_dts = 0;
    i_index = 0; i_index_sample_used =0;
822

823 824 825 826
    /* create and init last data for each chunk */
    for(i_chunk = 0 ; i_chunk < p_demux_track->i_chunk_count; i_chunk++ )
    {

827
        int64_t i_entry, i_sample_count, i;
828 829
        /* save last dts */
        p_demux_track->chunk[i_chunk].i_first_dts = i_last_dts;
830
    /* count how many entries needed for this chunk
831 832 833
       for p_sample_delta_dts and p_sample_count_dts */

        i_sample_count = p_demux_track->chunk[i_chunk].i_sample_count;
834 835

        i_entry = 0;
836 837 838 839 840
        while( i_sample_count > 0 )
        {
            i_sample_count -= p_stts->data.p_stts->i_sample_count[i_index+i_entry];
            if( i_entry == 0 )
            {
841
                i_sample_count += i_index_sample_used; /* don't count already used sample
842 843 844 845
                                                   int this entry */
            }
            i_entry++;
        }
846

847
        /* allocate them */
848
        p_demux_track->chunk[i_chunk].p_sample_count_dts =
849
            calloc( i_entry, sizeof( uint32_t ) );
850
        p_demux_track->chunk[i_chunk].p_sample_delta_dts =
851
            calloc( i_entry, sizeof( uint32_t ) );
852 853 854 855 856

        /* now copy */
        i_sample_count = p_demux_track->chunk[i_chunk].i_sample_count;
        for( i = 0; i < i_entry; i++ )
        {
857 858
            int64_t i_used;
            int64_t i_rest;
859

860 861 862 863 864
            i_rest = p_stts->data.p_stts->i_sample_count[i_index] - i_index_sample_used;

            i_used = __MIN( i_rest, i_sample_count );

            i_index_sample_used += i_used;
865
            i_sample_count -= i_used;
866 867 868 869 870

            p_demux_track->chunk[i_chunk].p_sample_count_dts[i] = i_used;

            p_demux_track->chunk[i_chunk].p_sample_delta_dts[i] =
                        p_stts->data.p_stts->i_sample_delta[i_index];
871 872

            i_last_dts += i_used *
873 874 875 876 877
                    p_demux_track->chunk[i_chunk].p_sample_delta_dts[i];

            if( i_index_sample_used >=
                             p_stts->data.p_stts->i_sample_count[i_index] )
            {
878

879 880 881 882
                i_index++;
                i_index_sample_used = 0;
            }
        }
883

884 885
    }

886 887
    msg_Dbg( p_input,
             "track[Id 0x%x] read %d samples length:"I64Fd"s",
888
             p_demux_track->i_track_ID,
889 890
             p_demux_track->i_sample_count,
             i_last_dts / p_demux_track->i_timescale );
891 892 893 894 895 896 897

    return( 1 );
}

static void MP4_StartDecoder( input_thread_t *p_input,
                                 track_data_mp4_t *p_demux_track )
{
898 899 900
    MP4_Box_t *  p_sample;
    unsigned int i;
    unsigned int i_chunk;
901

902 903
    unsigned int i_decoder_specific_info_len;
    uint8_t *    p_decoder_specific_info;
904 905
    pes_packet_t *p_pes_init;

906 907
    uint8_t             *p_init;
    BITMAPINFOHEADER    *p_bih;
908
    WAVEFORMATEX        *p_wf;
909

910
    MP4_Box_t   *p_esds;
911

912

913 914 915 916
    if( (!p_demux_track->b_ok )||( p_demux_track->i_cat == UNKNOWN_ES ) )
    {
        return;
    }
917

918
    msg_Dbg( p_input, "starting decoder for track[Id 0x%x]",
919 920 921 922 923 924 925
                      p_demux_track->i_track_ID );

    /* launch decoder according in chunk we are */
    i_chunk = p_demux_track->i_chunk;

    if( !p_demux_track->chunk[i_chunk].i_sample_description_index )
    {
926
        msg_Warn( p_input,
927
                  "invalid SampleEntry index (track[Id 0x%x])",
928 929
                  p_demux_track->i_track_ID );
        return;
930 931 932
    }
    p_sample = MP4_BoxGet(  p_demux_track->p_stsd,
                            "[%d]",
933
                p_demux_track->chunk[i_chunk].i_sample_description_index - 1 );
934 935 936

    if( ( !p_sample )||( !p_sample->data.p_data ) )
    {
937
        msg_Warn( p_input,
938
                  "cannot find SampleEntry (track[Id 0x%x])",
939 940 941 942 943 944
                  p_demux_track->i_track_ID );
        return;
    }

    vlc_mutex_lock( &p_input->stream.stream_lock );
    p_demux_track->p_es = input_AddES( p_input,
945
                                       p_input->stream.p_selected_program,
946 947 948 949 950 951 952 953
                                       p_demux_track->i_track_ID,
                                       0 );
    vlc_mutex_unlock( &p_input->stream.stream_lock );
    /* Initialise ES, first language as description */
    for( i = 0; i < 3; i++ )
    {
        p_demux_track->p_es->psz_desc[i] = p_demux_track->i_language[i];
    }
954
    p_demux_track->p_es->psz_desc[3] = '\0';
955

956 957 958 959 960 961 962 963 964 965 966 967 968
    p_demux_track->p_es->i_stream_id = p_demux_track->i_track_ID;

    /* It's a little ugly but .. there are special cases */
    switch( p_sample->i_type )
    {
        case( VLC_FOURCC( '.', 'm', 'p', '3' ) ):
        case( VLC_FOURCC( 'm', 's', 0x00, 0x55 ) ):
            p_demux_track->p_es->i_fourcc = VLC_FOURCC( 'm', 'p', 'g', 'a' );
            break;
        default:
            p_demux_track->p_es->i_fourcc = p_sample->i_type;
            break;
    }
969

970
    p_demux_track->p_es->i_cat = p_demux_track->i_cat;
971

972 973
    i_decoder_specific_info_len = 0;
    p_decoder_specific_info = NULL;
974
    p_pes_init = NULL;
975

976
    /* now see if esds is present and if so create a data packet
977 978
        with decoder_specific_info  */
#define p_decconfig p_esds->data.p_esds->es_descriptor.p_decConfigDescr
979
    if( ( p_esds = MP4_BoxGet( p_sample, "esds" ) )&&
980 981 982 983 984 985 986 987 988 989 990 991 992 993 994 995 996 997 998 999
        ( p_esds->data.p_esds )&&
        ( p_decconfig ) )
    {
        /* First update information based on i_objectTypeIndication */
        switch( p_decconfig->i_objectTypeIndication )
        {
            case( 0x20 ): /* MPEG4 VIDEO */
                p_demux_track->p_es->i_fourcc = VLC_FOURCC( 'm','p','4','v' );
                break;
            case( 0x40):
                p_demux_track->p_es->i_fourcc = VLC_FOURCC( 'm','p','4','a' );
                break;
            case( 0x60):
            case( 0x61):
            case( 0x62):
            case( 0x63):
            case( 0x64):
            case( 0x65): /* MPEG2 video */
                p_demux_track->p_es->i_fourcc = VLC_FOURCC( 'm','p','g','v' );
                break;
1000
            /* Theses are MPEG2-AAC */
1001 1002 1003 1004 1005 1006
            case( 0x66): /* main profile */
            case( 0x67): /* Low complexity profile */
            case( 0x68): /* Scaleable Sampling rate profile */
                p_demux_track->p_es->i_fourcc = VLC_FOURCC( 'm','p','4','a' );
                break;
            /* true MPEG 2 audio */
1007
            case( 0x69):
1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020
                p_demux_track->p_es->i_fourcc = VLC_FOURCC( 'm','p','g','a' );
                break;
            case( 0x6a): /* MPEG1 video */
                p_demux_track->p_es->i_fourcc = VLC_FOURCC( 'm','p','g','v' );
                break;
            case( 0x6b): /* MPEG1 audio */
                p_demux_track->p_es->i_fourcc = VLC_FOURCC( 'm','p','g','a' );
                break;
            case( 0x6c ): /* jpeg */
                p_demux_track->p_es->i_fourcc = VLC_FOURCC( 'j','p','e','g' );
                break;
            default:
                /* Unknown entry, but don't touch i_fourcc */
1021
                msg_Warn( p_input,
1022
                          "unknown objectTypeIndication(0x%x) (Track[ID 0x%x])",
1023 1024 1025 1026
                          p_decconfig->i_objectTypeIndication,
                          p_demux_track->i_track_ID );
                break;
        }
1027
        i_decoder_specific_info_len =
1028
                p_decconfig->i_decoder_specific_info_len;
1029
        p_decoder_specific_info =
1030 1031 1032 1033 1034 1035
                p_decconfig->p_decoder_specific_info;
    }

#undef p_decconfig

    /* some last initialisation */
1036 1037 1038
    /* XXX I create a bitmapinfoheader_t or
       waveformatex_t for each stream, up to now it's the best thing
       I've found but it could exist a better solution :) as something
1039 1040 1041
       like adding some new fields in p_es ...

       XXX I don't set all values, only thoses that are interesting or known
1042
        --> bitmapinfoheader_t : width and height
1043
        --> waveformatex_t : channels, samplerate, bitspersample
1044
        and at the end I add p_decoder_specific_info
1045

1046
        TODO set more values