movenc.c 54.7 KB
Newer Older
1 2 3
/*
 * MOV, 3GP, MP4 encoder.
 * Copyright (c) 2003 Thomas Raivio.
4
 * Copyright (c) 2004 Gildas Bazin <gbazin at videolan dot org>.
5 6 7 8 9 10 11 12 13 14 15 16 17
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with this library; if not, write to the Free Software
18
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19 20
 */
#include "avformat.h"
21
#include "avi.h"
22
#include "avio.h"
23
#include "mov.h"
24

25 26 27
#undef NDEBUG
#include <assert.h>

28 29 30
#define MOV_INDEX_CLUSTER_SIZE 16384
#define globalTimescale 1000

31 32 33
#define MODE_MP4 0
#define MODE_MOV 1
#define MODE_3GP 2
34
#define MODE_PSP 3 // example working PSP command line:
35
// ffmpeg -i testinput.avi  -f psp -r 14.985 -s 320x240 -b 768 -ar 24000 -ab 32 M4V00001.MP4
36
#define MODE_3G2 4
37

38
typedef struct MOVIentry {
39 40
    unsigned int flags, size;
    uint64_t     pos;
41
    unsigned int samplesInChunk;
42
    char         key_frame;
43
    unsigned int entries;
44
    int64_t      cts;
45 46 47
} MOVIentry;

typedef struct MOVIndex {
48
    int         mode;
49
    int         entry;
50
    uint64_t    mdat_size;
51 52 53
    int         ents_allocated;
    long        timescale;
    long        time;
54
    int64_t     trackDuration;
55 56
    long        sampleCount;
    long        sampleDuration;
57
    int         hasKeyframes;
58
    int         hasBframes;
59
    int         language;
60 61 62 63
    int         trackID;
    AVCodecContext *enc;

    int         vosLen;
64
    uint8_t     *vosData;
65 66 67
    MOVIentry** cluster;
} MOVTrack;

68
typedef struct MOVContext {
69
    int     mode;
70
    int64_t time;
71
    int     nb_streams;
72
    offset_t mdat_pos;
73 74 75 76
    long    timescale;
    MOVTrack tracks[MAX_STREAMS];
} MOVContext;

77 78
static int mov_write_esds_tag(ByteIOContext *pb, MOVTrack* track);

79
//FIXME supprt 64bit varaint with wide placeholders
80
static offset_t updateSize (ByteIOContext *pb, offset_t pos)
81
{
82
    offset_t curpos = url_ftell(pb);
83
    url_fseek(pb, pos, SEEK_SET);
84
    put_be32(pb, curpos - pos); /* rewrite size */
85
    url_fseek(pb, curpos, SEEK_SET);
86 87

    return curpos - pos;
88 89
}

90
/* Chunk offset atom */
91
static int mov_write_stco_tag(ByteIOContext *pb, MOVTrack* track)
92 93
{
    int i;
Benjamin Larsson's avatar
Benjamin Larsson committed
94
    int mode64 = 0; //   use 32 bit size variant if possible
95
    offset_t pos = url_ftell(pb);
96
    put_be32(pb, 0); /* size */
97 98 99 100 101
    if (pos > UINT32_MAX) {
        mode64 = 1;
        put_tag(pb, "co64");
    } else
        put_tag(pb, "stco");
102 103 104 105 106
    put_be32(pb, 0); /* version & flags */
    put_be32(pb, track->entry); /* entry count */
    for (i=0; i<track->entry; i++) {
        int cl = i / MOV_INDEX_CLUSTER_SIZE;
        int id = i % MOV_INDEX_CLUSTER_SIZE;
107 108 109 110
        if(mode64 == 1)
            put_be64(pb, track->cluster[cl][id].pos);
        else
            put_be32(pb, track->cluster[cl][id].pos);
111
    }
112
    return updateSize (pb, pos);
113 114
}

115
/* Sample size atom */
116
static int mov_write_stsz_tag(ByteIOContext *pb, MOVTrack* track)
117
{
118
    int equalChunks = 1;
119
    int i, j, entries = 0, tst = -1, oldtst = -1;
120

121
    offset_t pos = url_ftell(pb);
122
    put_be32(pb, 0); /* size */
123 124 125
    put_tag(pb, "stsz");
    put_be32(pb, 0); /* version & flags */

126 127 128
    for (i=0; i<track->entry; i++) {
        int cl = i / MOV_INDEX_CLUSTER_SIZE;
        int id = i % MOV_INDEX_CLUSTER_SIZE;
129 130 131
        tst = track->cluster[cl][id].size/track->cluster[cl][id].entries;
        if(oldtst != -1 && tst != oldtst) {
            equalChunks = 0;
132 133
        }
        oldtst = tst;
134
        entries += track->cluster[cl][id].entries;
135
    }
136 137
    if (equalChunks) {
        int sSize = track->cluster[0][0].size/track->cluster[0][0].entries;
138
        put_be32(pb, sSize); // sample size
139
        put_be32(pb, entries); // sample count
140
    }
141
    else {
142 143
        put_be32(pb, 0); // sample size
        put_be32(pb, entries); // sample count
144
        for (i=0; i<track->entry; i++) {
145 146
            int cl = i / MOV_INDEX_CLUSTER_SIZE;
            int id = i % MOV_INDEX_CLUSTER_SIZE;
147 148 149 150
            for ( j=0; j<track->cluster[cl][id].entries; j++) {
                put_be32(pb, track->cluster[cl][id].size /
                         track->cluster[cl][id].entries);
            }
151 152
        }
    }
153
    return updateSize (pb, pos);
154 155
}

156
/* Sample to chunk atom */
157
static int mov_write_stsc_tag(ByteIOContext *pb, MOVTrack* track)
158
{
159 160
    int index = 0, oldval = -1, i;
    offset_t entryPos, curpos;
161

162
    offset_t pos = url_ftell(pb);
163
    put_be32(pb, 0); /* size */
164
    put_tag(pb, "stsc");
165
    put_be32(pb, 0); // version & flags
166
    entryPos = url_ftell(pb);
167
    put_be32(pb, track->entry); // entry count
168 169 170
    for (i=0; i<track->entry; i++) {
        int cl = i / MOV_INDEX_CLUSTER_SIZE;
        int id = i % MOV_INDEX_CLUSTER_SIZE;
171
        if(oldval != track->cluster[cl][id].samplesInChunk)
172
        {
173
            put_be32(pb, i+1); // first chunk
174
            put_be32(pb, track->cluster[cl][id].samplesInChunk); // samples per chunk
175
            put_be32(pb, 0x1); // sample description index
176
            oldval = track->cluster[cl][id].samplesInChunk;
177
            index++;
178 179
        }
    }
180 181
    curpos = url_ftell(pb);
    url_fseek(pb, entryPos, SEEK_SET);
182
    put_be32(pb, index); // rewrite size
183
    url_fseek(pb, curpos, SEEK_SET);
184

185
    return updateSize (pb, pos);
186 187
}

188
/* Sync sample atom */
189
static int mov_write_stss_tag(ByteIOContext *pb, MOVTrack* track)
190
{
191 192 193
    offset_t curpos, entryPos;
    int i, index = 0;
    offset_t pos = url_ftell(pb);
194
    put_be32(pb, 0); // size
195
    put_tag(pb, "stss");
196
    put_be32(pb, 0); // version & flags
197
    entryPos = url_ftell(pb);
198
    put_be32(pb, track->entry); // entry count
199 200 201 202 203 204 205 206 207 208
    for (i=0; i<track->entry; i++) {
        int cl = i / MOV_INDEX_CLUSTER_SIZE;
        int id = i % MOV_INDEX_CLUSTER_SIZE;
        if(track->cluster[cl][id].key_frame == 1) {
            put_be32(pb, i+1);
            index++;
        }
    }
    curpos = url_ftell(pb);
    url_fseek(pb, entryPos, SEEK_SET);
209
    put_be32(pb, index); // rewrite size
210 211
    url_fseek(pb, curpos, SEEK_SET);
    return updateSize (pb, pos);
212 213
}

214
static int mov_write_damr_tag(ByteIOContext *pb)
215 216 217 218 219
{
    put_be32(pb, 0x11); /* size */
    put_tag(pb, "damr");
    put_tag(pb, "FFMP");
    put_byte(pb, 0);
220

221 222 223 224
    //put_be16(pb, 0x80); /* Mode set (all modes for AMR_NB) */
    //put_be16(pb, 0xa); /* Mode change period (no restriction) */
    put_be16(pb, 0x81ff); /* Mode set (all modes for AMR_NB) */
    put_be16(pb, 1); /* Mode change period (no restriction) */
225 226 227
    return 0x11;
}

228 229
static int mov_write_wave_tag(ByteIOContext *pb, MOVTrack* track)
{
230
    offset_t pos = url_ftell(pb);
231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254

    put_be32(pb, 0);     /* size */
    put_tag(pb, "wave");

    put_be32(pb, 12);    /* size */
    put_tag(pb, "frma");
    put_tag(pb, "mp4a");

    put_be32(pb, 12);    /* size */
    put_tag(pb, "mp4a");
    put_be32(pb, 0);

    mov_write_esds_tag(pb, track);

    put_be32(pb, 12);    /* size */
    put_tag(pb, "srcq");
    put_be32(pb, 0x40);

    put_be32(pb, 8);     /* size */
    put_be32(pb, 0);     /* null tag */

    return updateSize (pb, pos);
}

255
static const CodecTag codec_movaudio_tags[] = {
256 257 258 259 260 261 262
    { CODEC_ID_PCM_MULAW, MKTAG('u', 'l', 'a', 'w') },
    { CODEC_ID_PCM_ALAW, MKTAG('a', 'l', 'a', 'w') },
    { CODEC_ID_ADPCM_IMA_QT, MKTAG('i', 'm', 'a', '4') },
    { CODEC_ID_MACE3, MKTAG('M', 'A', 'C', '3') },
    { CODEC_ID_MACE6, MKTAG('M', 'A', 'C', '6') },
    { CODEC_ID_AAC, MKTAG('m', 'p', '4', 'a') },
    { CODEC_ID_AMR_NB, MKTAG('s', 'a', 'm', 'r') },
263
    { CODEC_ID_AMR_WB, MKTAG('s', 'a', 'w', 'b') },
264 265 266
    { CODEC_ID_PCM_S16BE, MKTAG('t', 'w', 'o', 's') },
    { CODEC_ID_PCM_S16LE, MKTAG('s', 'o', 'w', 't') },
    { CODEC_ID_MP3, MKTAG('.', 'm', 'p', '3') },
267
    { CODEC_ID_NONE, 0 },
268 269
};

270
static int mov_write_audio_tag(ByteIOContext *pb, MOVTrack* track)
271
{
272
    offset_t pos = url_ftell(pb);
273
    int tag;
274

275
    put_be32(pb, 0); /* size */
276

277 278
    tag = track->enc->codec_tag;
    if (!tag)
279 280 281 282
    tag = codec_get_tag(codec_movaudio_tags, track->enc->codec_id);
    // if no mac fcc found, try with Microsoft tags
    if (!tag)
    {
283
        int tmp = codec_get_tag(codec_wav_tags, track->enc->codec_id);
284
        tag = MKTAG('m', 's', ((tmp >> 8) & 0xff), (tmp & 0xff));
285
    }
286
    put_le32(pb, tag); // store it byteswapped
287

288 289 290
    put_be32(pb, 0); /* Reserved */
    put_be16(pb, 0); /* Reserved */
    put_be16(pb, 1); /* Data-reference index, XXX  == 1 */
291

292
    /* SoundDescription */
293 294 295 296
    if(track->mode == MODE_MOV && track->enc->codec_id == CODEC_ID_AAC)
        put_be16(pb, 1); /* Version 1 */
    else
        put_be16(pb, 0); /* Version 0 */
297
    put_be16(pb, 0); /* Revision level */
298 299
    put_be32(pb, 0); /* Reserved */

300 301
    put_be16(pb, track->enc->channels); /* Number of channels */
    /* TODO: Currently hard-coded to 16-bit, there doesn't seem
302
                 to be a good way to get number of bits of audio */
303
    put_be16(pb, 0x10); /* Reserved */
304 305 306 307 308 309 310 311 312 313

    if(track->enc->codec_id == CODEC_ID_AAC ||
       track->enc->codec_id == CODEC_ID_MP3)
    {
        put_be16(pb, 0xfffe); /* compression ID (vbr)*/
    }
    else
    {
        put_be16(pb, 0); /* compression ID (= 0) */
    }
314
    put_be16(pb, 0); /* packet size (= 0) */
315 316 317
    put_be16(pb, track->timescale); /* Time scale */
    put_be16(pb, 0); /* Reserved */

318 319 320 321 322 323 324 325 326 327 328 329 330
    if(track->mode == MODE_MOV && track->enc->codec_id == CODEC_ID_AAC)
    {
        /* SoundDescription V1 extended info */
        put_be32(pb, track->enc->frame_size); /* Samples per packet  */
        put_be32(pb, 1536); /* Bytes per packet */
        put_be32(pb, 2); /* Bytes per frame */
        put_be32(pb, 2); /* Bytes per sample */
    }

    if(track->enc->codec_id == CODEC_ID_AAC) {
        if( track->mode == MODE_MOV ) mov_write_wave_tag(pb, track);
        else mov_write_esds_tag(pb, track);
    }
331 332
    if(track->enc->codec_id == CODEC_ID_AMR_NB)
        mov_write_damr_tag(pb);
333
    return updateSize (pb, pos);
334 335
}

336
static int mov_write_d263_tag(ByteIOContext *pb)
337 338 339 340 341 342 343 344 345
{
    put_be32(pb, 0xf); /* size */
    put_tag(pb, "d263");
    put_tag(pb, "FFMP");
    put_be16(pb, 0x0a);
    put_byte(pb, 0);
    return 0xf;
}

346 347
/* TODO: No idea about these values */
static int mov_write_svq3_tag(ByteIOContext *pb)
348
{
349 350 351 352 353 354
    put_be32(pb, 0x15);
    put_tag(pb, "SMI ");
    put_tag(pb, "SEQH");
    put_be32(pb, 0x5);
    put_be32(pb, 0xe2c0211d);
    put_be32(pb, 0xc0000000);
355
    put_byte(pb, 0);
356
    return 0x15;
357 358
}

359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376 377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410 411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439 440 441 442 443 444 445 446 447 448 449
static uint8_t *avc_find_startcode( uint8_t *p, uint8_t *end )
{
    uint8_t *a = p + 4 - ((int)p & 3);

    for( end -= 3; p < a && p < end; p++ ) {
        if( p[0] == 0 && p[1] == 0 && p[2] == 1 )
            return p;
    }

    for( end -= 3; p < end; p += 4 ) {
        uint32_t x = *(uint32_t*)p;
//      if( (x - 0x01000100) & (~x) & 0x80008000 ) // little endian
//      if( (x - 0x00010001) & (~x) & 0x00800080 ) // big endian
        if( (x - 0x01010101) & (~x) & 0x80808080 ) { // generic
            if( p[1] == 0 ) {
                if( p[0] == 0 && p[2] == 1 )
                    return p;
                if( p[2] == 0 && p[3] == 1 )
                    return p+1;
            }
            if( p[3] == 0 ) {
                if( p[2] == 0 && p[4] == 1 )
                    return p+2;
                if( p[4] == 0 && p[5] == 1 )
                    return p+3;
            }
        }
    }

    for( end += 3; p < end; p++ ) {
        if( p[0] == 0 && p[1] == 0 && p[2] == 1 )
            return p;
    }

    return end + 3;
}

static void avc_parse_nal_units(uint8_t **buf, int *size)
{
    ByteIOContext pb;
    uint8_t *p = *buf;
    uint8_t *end = p + *size;
    uint8_t *nal_start, *nal_end;

    url_open_dyn_buf(&pb);
    nal_start = avc_find_startcode(p, end);
    while (nal_start < end) {
        while(!*(nal_start++));
        nal_end = avc_find_startcode(nal_start, end);
        put_be32(&pb, nal_end - nal_start);
        put_buffer(&pb, nal_start, nal_end - nal_start);
        nal_start = nal_end;
    }
    av_freep(buf);
    *size = url_close_dyn_buf(&pb, buf);
}

static int mov_write_avcc_tag(ByteIOContext *pb, MOVTrack *track)
{
    offset_t pos = url_ftell(pb);

    put_be32(pb, 0);
    put_tag(pb, "avcC");
    if (track->vosLen > 6) {
        /* check for h264 start code */
        if (BE_32(track->vosData) == 0x00000001) {
            uint8_t *buf, *end;
            uint32_t sps_size=0, pps_size=0;
            uint8_t *sps=0, *pps=0;

            avc_parse_nal_units(&track->vosData, &track->vosLen);
            buf = track->vosData;
            end = track->vosData + track->vosLen;

            /* look for sps and pps */
            while (buf < end) {
                unsigned int size;
                uint8_t nal_type;
                size = BE_32(buf);
                nal_type = buf[4] & 0x1f;
                if (nal_type == 7) { /* SPS */
                    sps = buf + 4;
                    sps_size = size;
                } else if (nal_type == 8) { /* PPS */
                    pps = buf + 4;
                    pps_size = size;
                }
                buf += size + 4;
            }
            assert(sps);
            assert(pps);
450 451 452 453 454 455 456 457

            put_byte(pb, 1); /* version */
            put_byte(pb, sps[1]); /* profile */
            put_byte(pb, sps[2]); /* profile compat */
            put_byte(pb, sps[3]); /* level */
            put_byte(pb, 0xff); /* 6 bits reserved (111111) + 2 bits nal size length - 1 (11) */
            put_byte(pb, 0xe1); /* 3 bits reserved (111) + 5 bits number of sps (00001) */

458 459 460 461 462 463 464 465 466 467 468 469
            put_be16(pb, sps_size);
            put_buffer(pb, sps, sps_size);
            put_byte(pb, 1); /* number of pps */
            put_be16(pb, pps_size);
            put_buffer(pb, pps, pps_size);
        } else {
            put_buffer(pb, track->vosData, track->vosLen);
        }
    }
    return updateSize(pb, pos);
}

470 471 472 473 474 475 476 477 478 479 480 481 482
static unsigned int descrLength(unsigned int len)
{
    if (len < 0x00000080)
        return 2 + len;
    else if (len < 0x00004000)
        return 3 + len;
    else if(len < 0x00200000)
        return 4 + len;
    else
        return 5 + len;
}

static void putDescr(ByteIOContext *pb, int tag, int size)
483
{
484 485 486 487 488 489
    uint32_t len;
    uint8_t  vals[4];

    len = size;
    vals[3] = (uint8_t)(len & 0x7f);
    len >>= 7;
490
    vals[2] = (uint8_t)((len & 0x7f) | 0x80);
491
    len >>= 7;
492
    vals[1] = (uint8_t)((len & 0x7f) | 0x80);
493 494 495 496 497 498 499 500 501 502 503 504 505 506 507 508 509 510 511 512 513 514 515 516 517 518 519
    len >>= 7;
    vals[0] = (uint8_t)((len & 0x7f) | 0x80);

    put_byte(pb, tag); // DescriptorTag

    if (size < 0x00000080)
    {
        put_byte(pb, vals[3]);
    }
    else if (size < 0x00004000)
    {
        put_byte(pb, vals[2]);
        put_byte(pb, vals[3]);
    }
    else if (size < 0x00200000)
    {
        put_byte(pb, vals[1]);
        put_byte(pb, vals[2]);
        put_byte(pb, vals[3]);
    }
    else if (size < 0x10000000)
    {
        put_byte(pb, vals[0]);
        put_byte(pb, vals[1]);
        put_byte(pb, vals[2]);
        put_byte(pb, vals[3]);
    }
520 521
}

522
static int mov_write_esds_tag(ByteIOContext *pb, MOVTrack* track) // Basic
523
{
524
    int decoderSpecificInfoLen;
525
    offset_t pos = url_ftell(pb);
526

527 528
    decoderSpecificInfoLen = track->vosLen ? descrLength(track->vosLen):0;

529
    put_be32(pb, 0);               // size
530
    put_tag(pb, "esds");
531
    put_be32(pb, 0);               // Version
532

533 534 535
    // ES descriptor
    putDescr(pb, 0x03, 3 + descrLength(13 + decoderSpecificInfoLen) +
             descrLength(1));
536
    put_be16(pb, track->trackID);
537 538
    put_byte(pb, 0x00);            // flags (= no flags)

539 540 541
    // DecoderConfig descriptor
    putDescr(pb, 0x04, 13 + decoderSpecificInfoLen);

542 543
    // Object type indication
    put_byte(pb, codec_get_tag(ff_mov_obj_type, track->enc->codec_id));
544

545 546
    // the following fields is made of 6 bits to identify the streamtype (4 for video, 5 for audio)
    // plus 1 bit to indicate upstream and 1 bit set to 1 (reserved)
547 548 549 550 551
    if(track->enc->codec_type == CODEC_TYPE_AUDIO)
        put_byte(pb, 0x15);            // flags (= Audiostream)
    else
        put_byte(pb, 0x11);            // flags (= Visualstream)

552 553
    put_byte(pb,  track->enc->rc_buffer_size>>(3+16));             // Buffersize DB (24 bits)
    put_be16(pb, (track->enc->rc_buffer_size>>3)&0xFFFF);          // Buffersize DB
554

555 556 557 558 559
    put_be32(pb, FFMAX(track->enc->bit_rate, track->enc->rc_max_rate));     // maxbitrate  (FIXME should be max rate in any 1 sec window)
    if(track->enc->rc_max_rate != track->enc->rc_min_rate || track->enc->rc_min_rate==0)
        put_be32(pb, 0);     // vbr
    else
        put_be32(pb, track->enc->rc_max_rate);     // avg bitrate
560

561 562 563 564 565 566 567
    if (track->vosLen)
    {
        // DecoderSpecific info descriptor
        putDescr(pb, 0x05, track->vosLen);
        put_buffer(pb, track->vosData, track->vosLen);
    }

568

569
    // SL descriptor
570
    putDescr(pb, 0x06, 1);
571
    put_byte(pb, 0x02);
572
    return updateSize (pb, pos);
573 574
}

575
static const CodecTag codec_movvideo_tags[] = {
576 577 578 579
    { CODEC_ID_SVQ1, MKTAG('S', 'V', 'Q', '1') },
    { CODEC_ID_SVQ3, MKTAG('S', 'V', 'Q', '3') },
    { CODEC_ID_MPEG4, MKTAG('m', 'p', '4', 'v') },
    { CODEC_ID_H263, MKTAG('s', '2', '6', '3') },
580
    { CODEC_ID_H264, MKTAG('a', 'v', 'c', '1') },
581 582 583 584 585 586 587
    /* special handling in mov_find_video_codec_tag */
    { CODEC_ID_DVVIDEO, MKTAG('d', 'v', 'c', ' ') }, /* DV NTSC */
    { CODEC_ID_DVVIDEO, MKTAG('d', 'v', 'c', 'p') }, /* DV PAL */
    { CODEC_ID_DVVIDEO, MKTAG('d', 'v', 'p', 'p') }, /* DVCPRO PAL */
    { CODEC_ID_DVVIDEO, MKTAG('d', 'v', '5', 'n') }, /* DVCPRO50 NTSC */
    { CODEC_ID_DVVIDEO, MKTAG('d', 'v', '5', 'p') }, /* DVCPRO50 PAL */
    { CODEC_ID_NONE, 0 },
588 589
};

590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606
static int mov_find_video_codec_tag(MOVTrack* track)
{
    int tag;

    tag = track->enc->codec_tag;
    if (!tag) {
        if (track->enc->codec_id == CODEC_ID_DVVIDEO) {
            if (track->enc->height == 480) { /* NTSC */
                if (track->enc->pix_fmt == PIX_FMT_YUV422P)
                    tag = MKTAG('d', 'v', '5', 'n');
                else
                    tag = MKTAG('d', 'v', 'c', ' ');
            } else { /* assume PAL */
                if (track->enc->pix_fmt == PIX_FMT_YUV422P)
                    tag = MKTAG('d', 'v', '5', 'p');
                else if (track->enc->pix_fmt == PIX_FMT_YUV420P)
                    tag = MKTAG('d', 'v', 'c', 'p');
Baptiste Coudurier's avatar
Baptiste Coudurier committed
607 608
                else
                    tag = MKTAG('d', 'v', 'p', 'p');
609 610 611 612 613 614 615 616 617 618 619 620
            }
        } else {
            tag = codec_get_tag(codec_movvideo_tags, track->enc->codec_id);
        }
    }
    // if no mac fcc found, try with Microsoft tags
    if (!tag)
        tag = codec_get_tag(codec_bmp_tags, track->enc->codec_id);
    assert(tag);
    return tag;
}

621
static int mov_write_video_tag(ByteIOContext *pb, MOVTrack* track)
622
{
623
    offset_t pos = url_ftell(pb);
624
    char compressor_name[32];
625
    int tag;
626

627
    put_be32(pb, 0); /* size */
628

629
    tag = mov_find_video_codec_tag(track);
630
    put_le32(pb, tag); // store it byteswapped
631

632 633 634 635
    put_be32(pb, 0); /* Reserved */
    put_be16(pb, 0); /* Reserved */
    put_be16(pb, 1); /* Data-reference index */

636 637 638 639 640 641 642 643 644 645
    put_be16(pb, 0); /* Codec stream version */
    put_be16(pb, 0); /* Codec stream revision (=0) */
    put_tag(pb, "FFMP"); /* Vendor */
    if(track->enc->codec_id == CODEC_ID_RAWVIDEO) {
        put_be32(pb, 0); /* Temporal Quality */
        put_be32(pb, 0x400); /* Spatial Quality = lossless*/
    } else {
        put_be32(pb, 0x200); /* Temporal Quality = normal */
        put_be32(pb, 0x200); /* Spatial Quality = normal */
    }
646 647
    put_be16(pb, track->enc->width); /* Video width */
    put_be16(pb, track->enc->height); /* Video height */
648 649
    put_be32(pb, 0x00480000); /* Horizontal resolution 72dpi */
    put_be32(pb, 0x00480000); /* Vertical resolution 72dpi */
650 651
    put_be32(pb, 0); /* Data size (= 0) */
    put_be16(pb, 1); /* Frame count (= 1) */
652

653
    memset(compressor_name,0,32);
654
    if (track->enc->codec && track->enc->codec->name)
655
        strncpy(compressor_name,track->enc->codec->name,31);
656
    put_byte(pb, strlen(compressor_name));
657
    put_buffer(pb, compressor_name, 31);
658

659 660 661 662 663 664 665
    put_be16(pb, 0x18); /* Reserved */
    put_be16(pb, 0xffff); /* Reserved */
    if(track->enc->codec_id == CODEC_ID_MPEG4)
        mov_write_esds_tag(pb, track);
    else if(track->enc->codec_id == CODEC_ID_H263)
        mov_write_d263_tag(pb);
    else if(track->enc->codec_id == CODEC_ID_SVQ3)
666
        mov_write_svq3_tag(pb);
667 668
    else if(track->enc->codec_id == CODEC_ID_H264)
        mov_write_avcc_tag(pb, track);
669 670

    return updateSize (pb, pos);
671 672
}

673
static int mov_write_stsd_tag(ByteIOContext *pb, MOVTrack* track)
674
{
675
    offset_t pos = url_ftell(pb);
676 677 678 679
    put_be32(pb, 0); /* size */
    put_tag(pb, "stsd");
    put_be32(pb, 0); /* version & flags */
    put_be32(pb, 1); /* entry count */
680 681 682 683
    if (track->enc->codec_type == CODEC_TYPE_VIDEO)
        mov_write_video_tag(pb, track);
    else if (track->enc->codec_type == CODEC_TYPE_AUDIO)
        mov_write_audio_tag(pb, track);
684
    return updateSize(pb, pos);
685 686
}

687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710 711 712 713 714 715 716 717 718 719 720 721
static int mov_write_ctts_tag(ByteIOContext *pb, MOVTrack* track)
{
    Time2Sample *ctts_entries;
    uint32_t entries = 0;
    uint32_t atom_size;
    int i;

    ctts_entries = av_malloc((track->entry + 1) * sizeof(*ctts_entries)); /* worst case */
    ctts_entries[0].count = 1;
    ctts_entries[0].duration = track->cluster[0][0].cts;
    for (i=1; i<track->entry; i++) {
        int cl = i / MOV_INDEX_CLUSTER_SIZE;
        int id = i % MOV_INDEX_CLUSTER_SIZE;
        if (track->cluster[cl][id].cts == ctts_entries[entries].duration) {
            ctts_entries[entries].count++; /* compress */
        } else {
            entries++;
            ctts_entries[entries].duration = track->cluster[cl][id].cts;
            ctts_entries[entries].count = 1;
        }
    }
    entries++; /* last one */
    atom_size = 16 + (entries * 8);
    put_be32(pb, atom_size); /* size */
    put_tag(pb, "ctts");
    put_be32(pb, 0); /* version & flags */
    put_be32(pb, entries); /* entry count */
    for (i=0; i<entries; i++) {
        put_be32(pb, ctts_entries[i].count);
        put_be32(pb, ctts_entries[i].duration);
    }
    av_free(ctts_entries);
    return atom_size;
}

Michael Niedermayer's avatar
Michael Niedermayer committed
722
/* TODO: */
723
/* Time to sample atom */
724
static int mov_write_stts_tag(ByteIOContext *pb, MOVTrack* track)
725 726 727 728 729 730
{
    put_be32(pb, 0x18); /* size */
    put_tag(pb, "stts");
    put_be32(pb, 0); /* version & flags */
    put_be32(pb, 1); /* entry count */

731 732
    put_be32(pb, track->sampleCount); /* sample count */
    put_be32(pb, track->sampleDuration); /* sample duration */
733 734 735
    return 0x18;
}

736
static int mov_write_dref_tag(ByteIOContext *pb)
737 738 739 740 741 742 743 744 745 746 747 748 749
{
    put_be32(pb, 28); /* size */
    put_tag(pb, "dref");
    put_be32(pb, 0); /* version & flags */
    put_be32(pb, 1); /* entry count */

    put_be32(pb, 0xc); /* size */
    put_tag(pb, "url ");
    put_be32(pb, 1); /* version & flags */

    return 28;
}

750
static int mov_write_stbl_tag(ByteIOContext *pb, MOVTrack* track)
751
{
752
    offset_t pos = url_ftell(pb);
753 754
    put_be32(pb, 0); /* size */
    put_tag(pb, "stbl");
755 756
    mov_write_stsd_tag(pb, track);
    mov_write_stts_tag(pb, track);
757
    if (track->enc->codec_type == CODEC_TYPE_VIDEO &&
758
        track->hasKeyframes < track->entry)
759
        mov_write_stss_tag(pb, track);
760 761 762
    if (track->enc->codec_type == CODEC_TYPE_VIDEO &&
        track->hasBframes)
        mov_write_ctts_tag(pb, track);
763 764 765 766
    mov_write_stsc_tag(pb, track);
    mov_write_stsz_tag(pb, track);
    mov_write_stco_tag(pb, track);
    return updateSize(pb, pos);
767 768
}

769
static int mov_write_dinf_tag(ByteIOContext *pb)
770
{
771
    offset_t pos = url_ftell(pb);
772 773
    put_be32(pb, 0); /* size */
    put_tag(pb, "dinf");
774 775
    mov_write_dref_tag(pb);
    return updateSize(pb, pos);
776 777
}

778
static int mov_write_smhd_tag(ByteIOContext *pb)
779 780 781 782 783 784 785 786 787
{
    put_be32(pb, 16); /* size */
    put_tag(pb, "smhd");
    put_be32(pb, 0); /* version & flags */
    put_be16(pb, 0); /* reserved (balance, normally = 0) */
    put_be16(pb, 0); /* reserved */
    return 16;
}

788
static int mov_write_vmhd_tag(ByteIOContext *pb)
789 790 791 792 793 794 795 796
{
    put_be32(pb, 0x14); /* size (always 0x14) */
    put_tag(pb, "vmhd");
    put_be32(pb, 0x01); /* version & flags */
    put_be64(pb, 0); /* reserved (graphics mode = copy) */
    return 0x14;
}

797
static int mov_write_hdlr_tag(ByteIOContext *pb, MOVTrack* track)
798
{
799
    char *descr, *hdlr, *hdlr_type;
800
    offset_t pos = url_ftell(pb);
801

802
    if (!track) { /* no media --> data handler */
803 804 805
        hdlr = "dhlr";
        hdlr_type = "url ";
        descr = "DataHandler";
806
    } else {
807 808 809 810 811 812 813 814
        hdlr = (track->mode == MODE_MOV) ? "mhlr" : "\0\0\0\0";
        if (track->enc->codec_type == CODEC_TYPE_VIDEO) {
            hdlr_type = "vide";
            descr = "VideoHandler";
        } else {
            hdlr_type = "soun";
            descr = "SoundHandler";
        }
815
    }
816

817
    put_be32(pb, 0); /* size */
818 819
    put_tag(pb, "hdlr");
    put_be32(pb, 0); /* Version & flags */
820
    put_buffer(pb, hdlr, 4); /* handler */
821
    put_tag(pb, hdlr_type); /* handler type */
822 823 824
    put_be32(pb ,0); /* reserved */
    put_be32(pb ,0); /* reserved */
    put_be32(pb ,0); /* reserved */
825 826 827 828 829 830 831
    put_byte(pb, strlen(descr)); /* string counter */
    put_buffer(pb, descr, strlen(descr)); /* handler description */
    return updateSize(pb, pos);
}

static int mov_write_minf_tag(ByteIOContext *pb, MOVTrack* track)
{
832
    offset_t pos = url_ftell(pb);
833 834
    put_be32(pb, 0); /* size */
    put_tag(pb, "minf");
835
    if(track->enc->codec_type == CODEC_TYPE_VIDEO)
836
        mov_write_vmhd_tag(pb);
837
    else
838 839 840 841 842
        mov_write_smhd_tag(pb);
    if (track->mode == MODE_MOV) /* FIXME: Why do it for MODE_MOV only ? */
        mov_write_hdlr_tag(pb, NULL);
    mov_write_dinf_tag(pb);
    mov_write_stbl_tag(pb, track);
843
    return updateSize(pb, pos);
844 845
}

846
static int mov_write_mdhd_tag(ByteIOContext *pb, MOVTrack* track)
847
{
848 849 850
    int version = track->trackDuration < INT32_MAX ? 0 : 1;

    (version == 1) ? put_be32(pb, 44) : put_be32(pb, 32); /* size */
851
    put_tag(pb, "mdhd");
852 853 854 855 856 857 858 859 860
    put_byte(pb, version);
    put_be24(pb, 0); /* flags */
    if (version == 1) {
        put_be64(pb, track->time);
        put_be64(pb, track->time);
    } else {
        put_be32(pb, track->time); /* creation time */
        put_be32(pb, track->time); /* modification time */
    }
861
    put_be32(pb, track->timescale); /* time scale (sample rate for audio) */
862
    (version == 1) ? put_be64(pb, track->trackDuration) : put_be32(pb, track->trackDuration); /* duration */
863
    put_be16(pb, track->language); /* language */
864 865 866 867
    put_be16(pb, 0); /* reserved (quality) */
    return 32;
}

868
static int mov_write_mdia_tag(ByteIOContext *pb, MOVTrack* track)
869
{
870
    offset_t pos = url_ftell(pb);
871 872
    put_be32(pb, 0); /* size */
    put_tag(pb, "mdia");
873 874 875 876
    mov_write_mdhd_tag(pb, track);
    mov_write_hdlr_tag(pb, track);
    mov_write_minf_tag(pb, track);
    return updateSize(pb, pos);
877 878
}

879
static int mov_write_tkhd_tag(ByteIOContext *pb, MOVTrack* track)
880
{
881 882 883 884
    int64_t duration = av_rescale_rnd(track->trackDuration, globalTimescale, track->timescale, AV_ROUND_UP);
    int version = duration < INT32_MAX ? 0 : 1;

    (version == 1) ? put_be32(pb, 104) : put_be32(pb, 92); /* size */
885
    put_tag(pb, "tkhd");
886 887 888 889 890 891 892 893 894
    put_byte(pb, version);
    put_be24(pb, 0xf); /* flags (track enabled) */
    if (version == 1) {
        put_be64(pb, track->time);
        put_be64(pb, track->time);
    } else {
        put_be32(pb, track->time); /* creation time */
        put_be32(pb, track->time); /* modification time */
    }
895 896
    put_be32(pb, track->trackID); /* track-id */
    put_be32(pb, 0); /* reserved */
897
    (version == 1) ? put_be64(pb, duration) : put_be32(pb, duration);