movenc.c 46.6 KB
Newer Older
1 2 3
/*
 * MOV, 3GP, MP4 encoder.
 * Copyright (c) 2003 Thomas Raivio.
4
 * Copyright (c) 2004 Gildas Bazin <gbazin at videolan dot org>.
5 6 7 8 9 10 11 12 13 14 15 16 17
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
18
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19 20
 */
#include "avformat.h"
21
#include "avi.h"
22 23
#include "avio.h"

24 25 26
#undef NDEBUG
#include <assert.h>

27 28 29
#define MOV_INDEX_CLUSTER_SIZE 16384
#define globalTimescale 1000

30 31 32
#define MODE_MP4 0
#define MODE_MOV 1
#define MODE_3GP 2
33
#define MODE_PSP 3 // example working PSP command line:
34
// ffmpeg -i testinput.avi  -f psp -r 14.985 -s 320x240 -b 768 -ar 24000 -ab 32 M4V00001.MP4
35
#define MODE_3G2 4
36

37
typedef struct MOVIentry {
38 39
    unsigned int flags, pos, size;
    unsigned int samplesInChunk;
40
    char         key_frame;
41 42 43 44
    unsigned int entries;
} MOVIentry;

typedef struct MOVIndex {
45
    int         mode;
46 47 48 49 50
    int         entry;
    int         mdat_size;
    int         ents_allocated;
    long        timescale;
    long        time;
51
    long        trackDuration;
52 53
    long        sampleCount;
    long        sampleDuration;
54
    int         hasKeyframes;
55
    int         language;
56 57 58 59
    int         trackID;
    AVCodecContext *enc;

    int         vosLen;
60
    uint8_t     *vosData;
61 62 63
    MOVIentry** cluster;
} MOVTrack;

64
typedef struct MOVContext {
65
    int     mode;
66 67
    long    time;
    int     nb_streams;
68 69
    int     mdat_written;
    offset_t mdat_pos;
70 71 72 73
    long    timescale;
    MOVTrack tracks[MAX_STREAMS];
} MOVContext;

74 75
static int mov_write_esds_tag(ByteIOContext *pb, MOVTrack* track);

76 77 78
/* output language code from iso639 language name */
extern int ff_mov_iso639_to_lang(const char *lang, int mp4);

79 80 81 82 83 84 85
const CodecTag ff_mov_obj_type[] = {
    { CODEC_ID_MPEG4     ,  32 },
    { CODEC_ID_AAC       ,  64 },
    { CODEC_ID_MPEG1VIDEO, 106 },
    { CODEC_ID_MPEG2VIDEO,  96 },//mpeg2 profiles
    { CODEC_ID_MP2       , 107 },//FIXME mpeg2 mpeg audio -> 105
    { CODEC_ID_MP3       , 107 },//FIXME mpeg2 mpeg audio -> 105
86
    { CODEC_ID_H264      ,  33 },
87 88 89 90 91 92 93 94 95 96 97 98
    { CODEC_ID_H263      , 242 },
    { CODEC_ID_H261      , 243 },
    { CODEC_ID_MJPEG     , 108 },
    { CODEC_ID_PCM_S16LE , 224 },
    { CODEC_ID_VORBIS    , 225 },
    { CODEC_ID_AC3       , 226 },
    { CODEC_ID_PCM_ALAW  , 227 },
    { CODEC_ID_PCM_MULAW , 228 },
    { CODEC_ID_PCM_S16BE , 230 },
    { 0,0  },
};

99 100
//FIXME supprt 64bit varaint with wide placeholders
static int updateSize (ByteIOContext *pb, int pos)
101 102 103
{
    long curpos = url_ftell(pb);
    url_fseek(pb, pos, SEEK_SET);
104
    put_be32(pb, curpos - pos); /* rewrite size */
105
    url_fseek(pb, curpos, SEEK_SET);
106 107

    return curpos - pos;
108 109
}

110
/* Chunk offset atom */
111
static int mov_write_stco_tag(ByteIOContext *pb, MOVTrack* track)
112 113
{
    int i;
114 115
    int pos = url_ftell(pb);
    put_be32(pb, 0); /* size */
116 117 118 119 120 121 122 123
    put_tag(pb, "stco");
    put_be32(pb, 0); /* version & flags */
    put_be32(pb, track->entry); /* entry count */
    for (i=0; i<track->entry; i++) {
        int cl = i / MOV_INDEX_CLUSTER_SIZE;
        int id = i % MOV_INDEX_CLUSTER_SIZE;
        put_be32(pb, track->cluster[cl][id].pos);
    }
124
    return updateSize (pb, pos);
125 126
}

127
/* Sample size atom */
128
static int mov_write_stsz_tag(ByteIOContext *pb, MOVTrack* track)
129
{
130
    int equalChunks = 1;
131
    int i, j, entries = 0, tst = -1, oldtst = -1;
132

133 134
    int pos = url_ftell(pb);
    put_be32(pb, 0); /* size */
135 136 137
    put_tag(pb, "stsz");
    put_be32(pb, 0); /* version & flags */

138 139 140
    for (i=0; i<track->entry; i++) {
        int cl = i / MOV_INDEX_CLUSTER_SIZE;
        int id = i % MOV_INDEX_CLUSTER_SIZE;
141 142 143
        tst = track->cluster[cl][id].size/track->cluster[cl][id].entries;
        if(oldtst != -1 && tst != oldtst) {
            equalChunks = 0;
144 145
        }
        oldtst = tst;
146
        entries += track->cluster[cl][id].entries;
147
    }
148 149
    if (equalChunks) {
        int sSize = track->cluster[0][0].size/track->cluster[0][0].entries;
150
        put_be32(pb, sSize); // sample size
151
        put_be32(pb, entries); // sample count
152
    }
153
    else {
154 155
        put_be32(pb, 0); // sample size
        put_be32(pb, entries); // sample count
156
        for (i=0; i<track->entry; i++) {
157 158
            int cl = i / MOV_INDEX_CLUSTER_SIZE;
            int id = i % MOV_INDEX_CLUSTER_SIZE;
159 160 161 162
            for ( j=0; j<track->cluster[cl][id].entries; j++) {
                put_be32(pb, track->cluster[cl][id].size /
                         track->cluster[cl][id].entries);
            }
163 164
        }
    }
165
    return updateSize (pb, pos);
166 167
}

168
/* Sample to chunk atom */
169
static int mov_write_stsc_tag(ByteIOContext *pb, MOVTrack* track)
170
{
171 172 173 174
    int index = 0, oldval = -1, i, entryPos, curpos;

    int pos = url_ftell(pb);
    put_be32(pb, 0); /* size */
175
    put_tag(pb, "stsc");
176
    put_be32(pb, 0); // version & flags
177
    entryPos = url_ftell(pb);
178
    put_be32(pb, track->entry); // entry count
179 180 181
    for (i=0; i<track->entry; i++) {
        int cl = i / MOV_INDEX_CLUSTER_SIZE;
        int id = i % MOV_INDEX_CLUSTER_SIZE;
182
        if(oldval != track->cluster[cl][id].samplesInChunk)
183
        {
184
            put_be32(pb, i+1); // first chunk
185
            put_be32(pb, track->cluster[cl][id].samplesInChunk); // samples per chunk
186
            put_be32(pb, 0x1); // sample description index
187
            oldval = track->cluster[cl][id].samplesInChunk;
188
            index++;
189 190
        }
    }
191 192
    curpos = url_ftell(pb);
    url_fseek(pb, entryPos, SEEK_SET);
193
    put_be32(pb, index); // rewrite size
194
    url_fseek(pb, curpos, SEEK_SET);
195

196
    return updateSize (pb, pos);
197 198
}

199
/* Sync sample atom */
200
static int mov_write_stss_tag(ByteIOContext *pb, MOVTrack* track)
201
{
202 203 204
    long curpos;
    int i, index = 0, entryPos;
    int pos = url_ftell(pb);
205
    put_be32(pb, 0); // size
206
    put_tag(pb, "stss");
207
    put_be32(pb, 0); // version & flags
208
    entryPos = url_ftell(pb);
209
    put_be32(pb, track->entry); // entry count
210 211 212 213 214 215 216 217 218 219
    for (i=0; i<track->entry; i++) {
        int cl = i / MOV_INDEX_CLUSTER_SIZE;
        int id = i % MOV_INDEX_CLUSTER_SIZE;
        if(track->cluster[cl][id].key_frame == 1) {
            put_be32(pb, i+1);
            index++;
        }
    }
    curpos = url_ftell(pb);
    url_fseek(pb, entryPos, SEEK_SET);
220
    put_be32(pb, index); // rewrite size
221 222
    url_fseek(pb, curpos, SEEK_SET);
    return updateSize (pb, pos);
223 224
}

225
static int mov_write_damr_tag(ByteIOContext *pb)
226 227 228 229 230
{
    put_be32(pb, 0x11); /* size */
    put_tag(pb, "damr");
    put_tag(pb, "FFMP");
    put_byte(pb, 0);
231 232 233 234 235

    put_be16(pb, 0x80); /* Mode set (all modes for AMR_NB) */
    put_be16(pb, 0xa); /* Mode change period (no restriction) */
    //put_be16(pb, 0x81ff); /* Mode set (all modes for AMR_NB) */
    //put_be16(pb, 1); /* Mode change period (no restriction) */
236 237 238
    return 0x11;
}

239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265
static int mov_write_wave_tag(ByteIOContext *pb, MOVTrack* track)
{
    int pos = url_ftell(pb);

    put_be32(pb, 0);     /* size */
    put_tag(pb, "wave");

    put_be32(pb, 12);    /* size */
    put_tag(pb, "frma");
    put_tag(pb, "mp4a");

    put_be32(pb, 12);    /* size */
    put_tag(pb, "mp4a");
    put_be32(pb, 0);

    mov_write_esds_tag(pb, track);

    put_be32(pb, 12);    /* size */
    put_tag(pb, "srcq");
    put_be32(pb, 0x40);

    put_be32(pb, 8);     /* size */
    put_be32(pb, 0);     /* null tag */

    return updateSize (pb, pos);
}

266
static const CodecTag codec_movaudio_tags[] = {
267 268 269 270 271 272 273
    { CODEC_ID_PCM_MULAW, MKTAG('u', 'l', 'a', 'w') },
    { CODEC_ID_PCM_ALAW, MKTAG('a', 'l', 'a', 'w') },
    { CODEC_ID_ADPCM_IMA_QT, MKTAG('i', 'm', 'a', '4') },
    { CODEC_ID_MACE3, MKTAG('M', 'A', 'C', '3') },
    { CODEC_ID_MACE6, MKTAG('M', 'A', 'C', '6') },
    { CODEC_ID_AAC, MKTAG('m', 'p', '4', 'a') },
    { CODEC_ID_AMR_NB, MKTAG('s', 'a', 'm', 'r') },
274
    { CODEC_ID_AMR_WB, MKTAG('s', 'a', 'w', 'b') },
275 276 277 278 279 280
    { CODEC_ID_PCM_S16BE, MKTAG('t', 'w', 'o', 's') },
    { CODEC_ID_PCM_S16LE, MKTAG('s', 'o', 'w', 't') },
    { CODEC_ID_MP3, MKTAG('.', 'm', 'p', '3') },
    { 0, 0 },
};

281
static int mov_write_audio_tag(ByteIOContext *pb, MOVTrack* track)
282
{
283 284
    int pos = url_ftell(pb);
    int tag;
285

286
    put_be32(pb, 0); /* size */
287

288 289
    tag = track->enc->codec_tag;
    if (!tag)
290 291 292 293
    tag = codec_get_tag(codec_movaudio_tags, track->enc->codec_id);
    // if no mac fcc found, try with Microsoft tags
    if (!tag)
    {
294
        int tmp = codec_get_tag(codec_wav_tags, track->enc->codec_id);
295
        tag = MKTAG('m', 's', ((tmp >> 8) & 0xff), (tmp & 0xff));
296
    }
297
    put_le32(pb, tag); // store it byteswapped
298

299 300 301
    put_be32(pb, 0); /* Reserved */
    put_be16(pb, 0); /* Reserved */
    put_be16(pb, 1); /* Data-reference index, XXX  == 1 */
302

303
    /* SoundDescription */
304 305 306 307
    if(track->mode == MODE_MOV && track->enc->codec_id == CODEC_ID_AAC)
        put_be16(pb, 1); /* Version 1 */
    else
        put_be16(pb, 0); /* Version 0 */
308
    put_be16(pb, 0); /* Revision level */
309 310
    put_be32(pb, 0); /* Reserved */

311 312
    put_be16(pb, track->enc->channels); /* Number of channels */
    /* TODO: Currently hard-coded to 16-bit, there doesn't seem
313
                 to be a good way to get number of bits of audio */
314
    put_be16(pb, 0x10); /* Reserved */
315 316 317 318 319 320 321 322 323 324

    if(track->enc->codec_id == CODEC_ID_AAC ||
       track->enc->codec_id == CODEC_ID_MP3)
    {
        put_be16(pb, 0xfffe); /* compression ID (vbr)*/
    }
    else
    {
        put_be16(pb, 0); /* compression ID (= 0) */
    }
325
    put_be16(pb, 0); /* packet size (= 0) */
326 327 328
    put_be16(pb, track->timescale); /* Time scale */
    put_be16(pb, 0); /* Reserved */

329 330 331 332 333 334 335 336 337 338 339 340 341
    if(track->mode == MODE_MOV && track->enc->codec_id == CODEC_ID_AAC)
    {
        /* SoundDescription V1 extended info */
        put_be32(pb, track->enc->frame_size); /* Samples per packet  */
        put_be32(pb, 1536); /* Bytes per packet */
        put_be32(pb, 2); /* Bytes per frame */
        put_be32(pb, 2); /* Bytes per sample */
    }

    if(track->enc->codec_id == CODEC_ID_AAC) {
        if( track->mode == MODE_MOV ) mov_write_wave_tag(pb, track);
        else mov_write_esds_tag(pb, track);
    }
342 343
    if(track->enc->codec_id == CODEC_ID_AMR_NB)
        mov_write_damr_tag(pb);
344
    return updateSize (pb, pos);
345 346
}

347
static int mov_write_d263_tag(ByteIOContext *pb)
348 349 350 351 352 353 354 355 356
{
    put_be32(pb, 0xf); /* size */
    put_tag(pb, "d263");
    put_tag(pb, "FFMP");
    put_be16(pb, 0x0a);
    put_byte(pb, 0);
    return 0xf;
}

357 358
/* TODO: No idea about these values */
static int mov_write_svq3_tag(ByteIOContext *pb)
359
{
360 361 362 363 364 365
    put_be32(pb, 0x15);
    put_tag(pb, "SMI ");
    put_tag(pb, "SEQH");
    put_be32(pb, 0x5);
    put_be32(pb, 0xe2c0211d);
    put_be32(pb, 0xc0000000);
366
    put_byte(pb, 0);
367
    return 0x15;
368 369
}

370 371 372 373 374 375 376 377 378 379 380 381 382
static unsigned int descrLength(unsigned int len)
{
    if (len < 0x00000080)
        return 2 + len;
    else if (len < 0x00004000)
        return 3 + len;
    else if(len < 0x00200000)
        return 4 + len;
    else
        return 5 + len;
}

static void putDescr(ByteIOContext *pb, int tag, int size)
383
{
384 385 386 387 388 389
    uint32_t len;
    uint8_t  vals[4];

    len = size;
    vals[3] = (uint8_t)(len & 0x7f);
    len >>= 7;
390
    vals[2] = (uint8_t)((len & 0x7f) | 0x80);
391
    len >>= 7;
392
    vals[1] = (uint8_t)((len & 0x7f) | 0x80);
393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419
    len >>= 7;
    vals[0] = (uint8_t)((len & 0x7f) | 0x80);

    put_byte(pb, tag); // DescriptorTag

    if (size < 0x00000080)
    {
        put_byte(pb, vals[3]);
    }
    else if (size < 0x00004000)
    {
        put_byte(pb, vals[2]);
        put_byte(pb, vals[3]);
    }
    else if (size < 0x00200000)
    {
        put_byte(pb, vals[1]);
        put_byte(pb, vals[2]);
        put_byte(pb, vals[3]);
    }
    else if (size < 0x10000000)
    {
        put_byte(pb, vals[0]);
        put_byte(pb, vals[1]);
        put_byte(pb, vals[2]);
        put_byte(pb, vals[3]);
    }
420 421
}

422
static int mov_write_esds_tag(ByteIOContext *pb, MOVTrack* track) // Basic
423
{
424
    int decoderSpecificInfoLen;
425
    int pos = url_ftell(pb);
426 427
    void *vosDataBackup=track->vosData;
    int vosLenBackup=track->vosLen;
428

429 430 431
    // we should be able to have these passed in, via vosData, then we wouldn't need to attack this routine at all
    static const char PSPAACData[]={0x13,0x10};
    static const char PSPMP4Data[]={0x00,0x00,0x01,0xB0,0x03,0x00,0x00,0x01,0xB5,0x09,0x00,0x00,0x01,0x00,0x00,0x00,0x01,0x20,0x00,0x84,0x5D,0x4C,0x28,0x50,0x20,0xF0,0xA3,0x1F };
432 433


434 435 436 437 438
    if (track->mode == MODE_PSP)  // fails on psp if this is not here
    {
        if (track->enc->codec_id == CODEC_ID_AAC)
        {
            track->vosLen = 2;
439
            track->vosData = (uint8_t *) PSPAACData;
440 441 442 443 444
        }

        if (track->enc->codec_id == CODEC_ID_MPEG4)
        {
            track->vosLen = 28;
445
            track->vosData = (uint8_t *) PSPMP4Data;
446 447
        }
    }
448

449 450
    decoderSpecificInfoLen = track->vosLen ? descrLength(track->vosLen):0;

451
    put_be32(pb, 0);               // size
452
    put_tag(pb, "esds");
453
    put_be32(pb, 0);               // Version
454

455 456 457
    // ES descriptor
    putDescr(pb, 0x03, 3 + descrLength(13 + decoderSpecificInfoLen) +
             descrLength(1));
458
    put_be16(pb, track->trackID);
459 460
    put_byte(pb, 0x00);            // flags (= no flags)

461 462 463
    // DecoderConfig descriptor
    putDescr(pb, 0x04, 13 + decoderSpecificInfoLen);

464 465
    // Object type indication
    put_byte(pb, codec_get_tag(ff_mov_obj_type, track->enc->codec_id));
466

467 468
    // the following fields is made of 6 bits to identify the streamtype (4 for video, 5 for audio)
    // plus 1 bit to indicate upstream and 1 bit set to 1 (reserved)
469 470 471 472 473
    if(track->enc->codec_type == CODEC_TYPE_AUDIO)
        put_byte(pb, 0x15);            // flags (= Audiostream)
    else
        put_byte(pb, 0x11);            // flags (= Visualstream)

474 475
    put_byte(pb,  track->enc->rc_buffer_size>>(3+16));             // Buffersize DB (24 bits)
    put_be16(pb, (track->enc->rc_buffer_size>>3)&0xFFFF);          // Buffersize DB
476

477 478 479 480 481
    put_be32(pb, FFMAX(track->enc->bit_rate, track->enc->rc_max_rate));     // maxbitrate  (FIXME should be max rate in any 1 sec window)
    if(track->enc->rc_max_rate != track->enc->rc_min_rate || track->enc->rc_min_rate==0)
        put_be32(pb, 0);     // vbr
    else
        put_be32(pb, track->enc->rc_max_rate);     // avg bitrate
482

483 484 485 486 487 488 489
    if (track->vosLen)
    {
        // DecoderSpecific info descriptor
        putDescr(pb, 0x05, track->vosLen);
        put_buffer(pb, track->vosData, track->vosLen);
    }

490 491 492
    track->vosData = vosDataBackup;
    track->vosLen = vosLenBackup;

493
    // SL descriptor
494
    putDescr(pb, 0x06, 1);
495
    put_byte(pb, 0x02);
496
    return updateSize (pb, pos);
497 498
}

499
static const CodecTag codec_movvideo_tags[] = {
500 501 502 503
    { CODEC_ID_SVQ1, MKTAG('S', 'V', 'Q', '1') },
    { CODEC_ID_SVQ3, MKTAG('S', 'V', 'Q', '3') },
    { CODEC_ID_MPEG4, MKTAG('m', 'p', '4', 'v') },
    { CODEC_ID_H263, MKTAG('s', '2', '6', '3') },
504
    { CODEC_ID_H264, MKTAG('a', 'v', 'c', '1') },
505 506 507 508
    { CODEC_ID_DVVIDEO, MKTAG('d', 'v', 'c', ' ') },
    { 0, 0 },
};

509
static int mov_write_video_tag(ByteIOContext *pb, MOVTrack* track)
510
{
511
    int pos = url_ftell(pb);
512
    char compressor_name[32];
513
    int tag;
514

515
    put_be32(pb, 0); /* size */
516

517 518
    tag = track->enc->codec_tag;
    if (!tag)
519 520 521
    tag = codec_get_tag(codec_movvideo_tags, track->enc->codec_id);
    // if no mac fcc found, try with Microsoft tags
    if (!tag)
522
        tag = codec_get_tag(codec_bmp_tags, track->enc->codec_id);
523
    put_le32(pb, tag); // store it byteswapped
524

525 526 527 528
    put_be32(pb, 0); /* Reserved */
    put_be16(pb, 0); /* Reserved */
    put_be16(pb, 1); /* Data-reference index */

529 530 531 532 533 534 535 536 537 538
    put_be16(pb, 0); /* Codec stream version */
    put_be16(pb, 0); /* Codec stream revision (=0) */
    put_tag(pb, "FFMP"); /* Vendor */
    if(track->enc->codec_id == CODEC_ID_RAWVIDEO) {
        put_be32(pb, 0); /* Temporal Quality */
        put_be32(pb, 0x400); /* Spatial Quality = lossless*/
    } else {
        put_be32(pb, 0x200); /* Temporal Quality = normal */
        put_be32(pb, 0x200); /* Spatial Quality = normal */
    }
539 540
    put_be16(pb, track->enc->width); /* Video width */
    put_be16(pb, track->enc->height); /* Video height */
541 542
    put_be32(pb, 0x00480000); /* Horizontal resolution 72dpi */
    put_be32(pb, 0x00480000); /* Vertical resolution 72dpi */
543 544
    put_be32(pb, 0); /* Data size (= 0) */
    put_be16(pb, 1); /* Frame count (= 1) */
545

546
    memset(compressor_name,0,32);
547
    if (track->enc->codec && track->enc->codec->name)
548
        strncpy(compressor_name,track->enc->codec->name,31);
549
    put_byte(pb, strlen(compressor_name));
550
    put_buffer(pb, compressor_name, 31);
551

552 553 554 555 556 557 558
    put_be16(pb, 0x18); /* Reserved */
    put_be16(pb, 0xffff); /* Reserved */
    if(track->enc->codec_id == CODEC_ID_MPEG4)
        mov_write_esds_tag(pb, track);
    else if(track->enc->codec_id == CODEC_ID_H263)
        mov_write_d263_tag(pb);
    else if(track->enc->codec_id == CODEC_ID_SVQ3)
559
        mov_write_svq3_tag(pb);
560 561

    return updateSize (pb, pos);
562 563
}

564
static int mov_write_stsd_tag(ByteIOContext *pb, MOVTrack* track)
565
{
566
    int pos = url_ftell(pb);
567 568 569 570
    put_be32(pb, 0); /* size */
    put_tag(pb, "stsd");
    put_be32(pb, 0); /* version & flags */
    put_be32(pb, 1); /* entry count */
571 572 573 574
    if (track->enc->codec_type == CODEC_TYPE_VIDEO)
        mov_write_video_tag(pb, track);
    else if (track->enc->codec_type == CODEC_TYPE_AUDIO)
        mov_write_audio_tag(pb, track);
575
    return updateSize(pb, pos);
576 577
}

Michael Niedermayer's avatar
Michael Niedermayer committed
578
/* TODO: */
579
/* Time to sample atom */
580
static int mov_write_stts_tag(ByteIOContext *pb, MOVTrack* track)
581 582 583 584 585 586
{
    put_be32(pb, 0x18); /* size */
    put_tag(pb, "stts");
    put_be32(pb, 0); /* version & flags */
    put_be32(pb, 1); /* entry count */

587 588
    put_be32(pb, track->sampleCount); /* sample count */
    put_be32(pb, track->sampleDuration); /* sample duration */
589 590 591
    return 0x18;
}

592
static int mov_write_dref_tag(ByteIOContext *pb)
593 594 595 596 597 598 599 600 601 602 603 604 605
{
    put_be32(pb, 28); /* size */
    put_tag(pb, "dref");
    put_be32(pb, 0); /* version & flags */
    put_be32(pb, 1); /* entry count */

    put_be32(pb, 0xc); /* size */
    put_tag(pb, "url ");
    put_be32(pb, 1); /* version & flags */

    return 28;
}

606
static int mov_write_stbl_tag(ByteIOContext *pb, MOVTrack* track)
607
{
608
    int pos = url_ftell(pb);
609 610
    put_be32(pb, 0); /* size */
    put_tag(pb, "stbl");
611 612
    mov_write_stsd_tag(pb, track);
    mov_write_stts_tag(pb, track);
613 614 615
    if (track->enc->codec_type == CODEC_TYPE_VIDEO &&
        track->hasKeyframes)
        mov_write_stss_tag(pb, track);
616 617 618 619
    mov_write_stsc_tag(pb, track);
    mov_write_stsz_tag(pb, track);
    mov_write_stco_tag(pb, track);
    return updateSize(pb, pos);
620 621
}

622
static int mov_write_dinf_tag(ByteIOContext *pb)
623
{
624
    int pos = url_ftell(pb);
625 626
    put_be32(pb, 0); /* size */
    put_tag(pb, "dinf");
627 628
    mov_write_dref_tag(pb);
    return updateSize(pb, pos);
629 630
}

631
static int mov_write_smhd_tag(ByteIOContext *pb)
632 633 634 635 636 637 638 639 640
{
    put_be32(pb, 16); /* size */
    put_tag(pb, "smhd");
    put_be32(pb, 0); /* version & flags */
    put_be16(pb, 0); /* reserved (balance, normally = 0) */
    put_be16(pb, 0); /* reserved */
    return 16;
}

641
static int mov_write_vmhd_tag(ByteIOContext *pb)
642 643 644 645 646 647 648 649
{
    put_be32(pb, 0x14); /* size (always 0x14) */
    put_tag(pb, "vmhd");
    put_be32(pb, 0x01); /* version & flags */
    put_be64(pb, 0); /* reserved (graphics mode = copy) */
    return 0x14;
}

650
static int mov_write_hdlr_tag(ByteIOContext *pb, MOVTrack* track)
651
{
652
    char *descr, *hdlr, *hdlr_type;
653
    int pos = url_ftell(pb);
654

655
    if (!track) { /* no media --> data handler */
656 657 658
        hdlr = "dhlr";
        hdlr_type = "url ";
        descr = "DataHandler";
659
    } else {
660 661 662 663 664 665 666 667
        hdlr = (track->mode == MODE_MOV) ? "mhlr" : "\0\0\0\0";
        if (track->enc->codec_type == CODEC_TYPE_VIDEO) {
            hdlr_type = "vide";
            descr = "VideoHandler";
        } else {
            hdlr_type = "soun";
            descr = "SoundHandler";
        }
668
    }
669

670
    put_be32(pb, 0); /* size */
671 672
    put_tag(pb, "hdlr");
    put_be32(pb, 0); /* Version & flags */
673
    put_buffer(pb, hdlr, 4); /* handler */
674
    put_tag(pb, hdlr_type); /* handler type */
675 676 677
    put_be32(pb ,0); /* reserved */
    put_be32(pb ,0); /* reserved */
    put_be32(pb ,0); /* reserved */
678 679 680 681 682 683 684 685 686 687
    put_byte(pb, strlen(descr)); /* string counter */
    put_buffer(pb, descr, strlen(descr)); /* handler description */
    return updateSize(pb, pos);
}

static int mov_write_minf_tag(ByteIOContext *pb, MOVTrack* track)
{
    int pos = url_ftell(pb);
    put_be32(pb, 0); /* size */
    put_tag(pb, "minf");
688
    if(track->enc->codec_type == CODEC_TYPE_VIDEO)
689
        mov_write_vmhd_tag(pb);
690
    else
691 692 693 694 695
        mov_write_smhd_tag(pb);
    if (track->mode == MODE_MOV) /* FIXME: Why do it for MODE_MOV only ? */
        mov_write_hdlr_tag(pb, NULL);
    mov_write_dinf_tag(pb);
    mov_write_stbl_tag(pb, track);
696
    return updateSize(pb, pos);
697 698
}

699
static int mov_write_mdhd_tag(ByteIOContext *pb, MOVTrack* track)
700 701 702 703 704 705
{
    put_be32(pb, 32); /* size */
    put_tag(pb, "mdhd");
    put_be32(pb, 0); /* Version & flags */
    put_be32(pb, track->time); /* creation time */
    put_be32(pb, track->time); /* modification time */
706
    put_be32(pb, track->timescale); /* time scale (sample rate for audio) */
707
    put_be32(pb, track->trackDuration); /* duration */
708
    put_be16(pb, track->language); /* language */
709 710 711 712
    put_be16(pb, 0); /* reserved (quality) */
    return 32;
}

713
static int mov_write_mdia_tag(ByteIOContext *pb, MOVTrack* track)
714
{
715
    int pos = url_ftell(pb);
716 717
    put_be32(pb, 0); /* size */
    put_tag(pb, "mdia");
718 719 720 721
    mov_write_mdhd_tag(pb, track);
    mov_write_hdlr_tag(pb, track);
    mov_write_minf_tag(pb, track);
    return updateSize(pb, pos);
722 723
}

724
static int mov_write_tkhd_tag(ByteIOContext *pb, MOVTrack* track)
725 726 727
{
    put_be32(pb, 0x5c); /* size (always 0x5c) */
    put_tag(pb, "tkhd");
728
    put_be32(pb, 0xf); /* version & flags (track enabled) */
729 730 731 732
    put_be32(pb, track->time); /* creation time */
    put_be32(pb, track->time); /* modification time */
    put_be32(pb, track->trackID); /* track-id */
    put_be32(pb, 0); /* reserved */
Michael Niedermayer's avatar
Michael Niedermayer committed
733
    put_be32(pb, av_rescale_rnd(track->trackDuration, globalTimescale, track->timescale, AV_ROUND_UP)); /* duration */
734 735 736 737 738 739 740 741 742 743 744 745 746 747 748 749 750 751 752 753 754 755 756 757

    put_be32(pb, 0); /* reserved */
    put_be32(pb, 0); /* reserved */
    put_be32(pb, 0x0); /* reserved (Layer & Alternate group) */
    /* Volume, only for audio */
    if(track->enc->codec_type == CODEC_TYPE_AUDIO)
        put_be16(pb, 0x0100);
    else
        put_be16(pb, 0);
    put_be16(pb, 0); /* reserved */

    /* Matrix structure */
    put_be32(pb, 0x00010000); /* reserved */
    put_be32(pb, 0x0); /* reserved */
    put_be32(pb, 0x0); /* reserved */
    put_be32(pb, 0x0); /* reserved */
    put_be32(pb, 0x00010000); /* reserved */
    put_be32(pb, 0x0); /* reserved */
    put_be32(pb, 0x0); /* reserved */
    put_be32(pb, 0x0); /* reserved */
    put_be32(pb, 0x40000000); /* reserved */

    /* Track width and height, for visual only */
    if(track->enc->codec_type == CODEC_TYPE_VIDEO) {
758 759 760
        double sample_aspect_ratio = av_q2d(track->enc->sample_aspect_ratio);
        if( !sample_aspect_ratio ) sample_aspect_ratio = 1;
        put_be32(pb, sample_aspect_ratio * track->enc->width*0x10000);
761
        put_be32(pb, track->enc->height*0x10000);
762 763 764 765 766 767 768 769
    }
    else {
        put_be32(pb, 0);
        put_be32(pb, 0);
    }
    return 0x5c;
}

770 771 772 773 774 775 776 777 778 779
// This box seems important for the psp playback ... without it the movie seems to hang
static int mov_write_edts_tag(ByteIOContext *pb, MOVTrack *track)
{
    put_be32(pb, 0x24); /* size  */
    put_tag(pb, "edts");
    put_be32(pb, 0x1c); /* size  */
    put_tag(pb, "elst");
    put_be32(pb, 0x0);
    put_be32(pb, 0x1);

Michael Niedermayer's avatar
Michael Niedermayer committed
780
    put_be32(pb, av_rescale_rnd(track->trackDuration, globalTimescale, track->timescale, AV_ROUND_UP)); /* duration   ... doesn't seem to effect psp */
781 782 783 784 785 786 787 788 789 790 791 792 793 794 795 796 797 798 799 800 801 802 803 804 805

    put_be32(pb, 0x0);
    put_be32(pb, 0x00010000);
    return 0x24;
}

// goes at the end of each track!  ... Critical for PSP playback ("Incompatible data" without it)
static int mov_write_uuid_tag_psp(ByteIOContext *pb, MOVTrack *mov)
{
    put_be32(pb, 0x34); /* size ... reports as 28 in mp4box! */
    put_tag(pb, "uuid");
    put_tag(pb, "USMT");
    put_be32(pb, 0x21d24fce);
    put_be32(pb, 0xbb88695c);
    put_be32(pb, 0xfac9c740);
    put_be32(pb, 0x1c);     // another size here!
    put_tag(pb, "MTDT");
    put_be32(pb, 0x00010012);
    put_be32(pb, 0x0a);
    put_be32(pb, 0x55c40000);
    put_be32(pb, 0x1);
    put_be32(pb, 0x0);
    return 0x34;
}

806
static int mov_write_trak_tag(ByteIOContext *pb, MOVTrack* track)
807
{
808
    int pos = url_ftell(pb);
809 810
    put_be32(pb, 0); /* size */
    put_tag(pb, "trak");
811
    mov_write_tkhd_tag(pb, track);
812
    if (track->mode == MODE_PSP)
813
        mov_write_edts_tag(pb, track);  // PSP Movies require edts box
814
    mov_write_mdia_tag(pb, track);
815
    if (track->mode == MODE_PSP)
816
        mov_write_uuid_tag_psp(pb,track);  // PSP Movies require this uuid box
817
    return updateSize(pb, pos);
818 819
}

820
#if 0
821
/* TODO: Not sorted out, but not necessary either */
822
static int mov_write_iods_tag(ByteIOContext *pb, MOVContext *mov)
823 824 825 826 827 828 829 830 831 832 833
{
    put_be32(pb, 0x15); /* size */
    put_tag(pb, "iods");
    put_be32(pb, 0);    /* version & flags */
    put_be16(pb, 0x1007);
    put_byte(pb, 0);
    put_be16(pb, 0x4fff);
    put_be16(pb, 0xfffe);
    put_be16(pb, 0x01ff);
    return 0x15;
}
834
#endif
835

836
static int mov_write_mvhd_tag(ByteIOContext *pb, MOVContext *mov)
837 838
{
    int maxTrackID = 1, maxTrackLen = 0, i;
839
    int64_t maxTrackLenTemp;
840 841 842 843 844 845 846 847 848

    put_be32(pb, 0x6c); /* size (always 0x6c) */
    put_tag(pb, "mvhd");
    put_be32(pb, 0); /* version & flags */
    put_be32(pb, mov->time); /* creation time */
    put_be32(pb, mov->time); /* modification time */
    put_be32(pb, mov->timescale); /* timescale */
    for (i=0; i<MAX_STREAMS; i++) {
        if(mov->tracks[i].entry > 0) {
Michael Niedermayer's avatar
Michael Niedermayer committed
849
            maxTrackLenTemp = av_rescale_rnd(mov->tracks[i].trackDuration, globalTimescale, mov->tracks[i].timescale, AV_ROUND_UP);
850 851
            if(maxTrackLen < maxTrackLenTemp)
                maxTrackLen = maxTrackLenTemp;
852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869 870 871 872 873 874 875 876 877 878 879 880 881 882 883 884
            if(maxTrackID < mov->tracks[i].trackID)
                maxTrackID = mov->tracks[i].trackID;
        }
    }
    put_be32(pb, maxTrackLen); /* duration of longest track */

    put_be32(pb, 0x00010000); /* reserved (preferred rate) 1.0 = normal */
    put_be16(pb, 0x0100); /* reserved (preferred volume) 1.0 = normal */
    put_be16(pb, 0); /* reserved */
    put_be32(pb, 0); /* reserved */
    put_be32(pb, 0); /* reserved */

    /* Matrix structure */
    put_be32(pb, 0x00010000); /* reserved */
    put_be32(pb, 0x0); /* reserved */
    put_be32(pb, 0x0); /* reserved */
    put_be32(pb, 0x0); /* reserved */
    put_be32(pb, 0x00010000); /* reserved */
    put_be32(pb, 0x0); /* reserved */
    put_be32(pb, 0x0); /* reserved */
    put_be32(pb, 0x0); /* reserved */
    put_be32(pb, 0x40000000); /* reserved */

    put_be32(pb, 0); /* reserved (preview time) */
    put_be32(pb, 0); /* reserved (preview duration) */
    put_be32(pb, 0); /* reserved (poster time) */
    put_be32(pb, 0); /* reserved (selection time) */
    put_be32(pb, 0); /* reserved (selection duration) */
    put_be32(pb, 0); /* reserved (current time) */
    put_be32(pb, maxTrackID+1); /* Next track id */
    return 0x6c;
}

885 886 887 888 889 890 891 892 893 894 895 896 897 898 899 900 901 902 903 904 905 906 907 908 909 910 911 912