/*
 * "Real" compatible muxer.
 * Copyright (c) 2000, 2001 Fabrice Bellard
 *
 * This file is part of Libav.
 *
 * Libav is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * Libav is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with Libav; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
#include <string.h>

#include "avformat.h"
#include "avio_internal.h"
#include "rm.h"
#include "libavutil/dict.h"
#include "libavutil/error.h"
#include "libavutil/log.h"

26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44
/* Per-stream muxing state and statistics. */
typedef struct {
    int nb_packets;        /* packets written so far (bumped in write_packet_header) */
    int packet_total_size; /* sum of the lengths passed to write_packet_header */
    int packet_max_size;   /* largest such length; seeded with a dummy value
                              in rm_write_header */
    /* codec related output */
    int bit_rate;          /* copy of the codec context's bit_rate */
    float frame_rate;      /* frames per second: sample_rate / frame_size for
                              audio, time_base.den / time_base.num for video */
    int nb_frames;    /* current frame number */
    int total_frames; /* total number of frames; set from nb_frames when the
                         trailer rewrites the header */
    int num;               /* stream index, written into every packet header */
    AVCodecContext *enc;   /* codec context of the stream */
} StreamInfo;

/* Private data of the RealMedia muxer. */
typedef struct {
    StreamInfo streams[2];  /* per-stream state, indexed by stream index */
    /* set in rm_write_header; point into streams[] */
    StreamInfo *audio_stream, *video_stream;
    int data_pos; /* position of the data after the header; computed in
                     rv10_write_header as the number of header bytes written
                     before the "DATA" chunk */
} RMMuxContext;

45 46 47 48
/* in ms */
#define BUFFER_DURATION 0


49
/**
 * Write a string preceded by its length as a 16-bit big-endian integer.
 * The terminating NUL is not written.
 *
 * @param s   output I/O context
 * @param tag NUL-terminated string to write
 */
static void put_str(AVIOContext *s, const char *tag)
{
    const char *p;

    avio_wb16(s, strlen(tag));
    for (p = tag; *p; p++)
        avio_w8(s, *p);
}

57
/**
 * Write a string preceded by its length as a single byte.
 * The terminating NUL is not written.
 *
 * @param s   output I/O context
 * @param tag NUL-terminated string to write
 */
static void put_str8(AVIOContext *s, const char *tag)
{
    const char *p;

    avio_w8(s, strlen(tag));
    for (p = tag; *p; p++)
        avio_w8(s, *p);
}

65
/**
 * Write the complete RealMedia header to ctx->pb: the ".RMF" file header,
 * the "PROP" properties chunk, the "CONT" metadata chunk, one "MDPR" chunk
 * per stream and the header of the "DATA" chunk.
 *
 * It is called from rm_write_header with placeholder values and again from
 * rm_write_trailer, after seeking back to the start of the output, so that
 * the final statistics get stored.
 *
 * @param ctx       muxer context; priv_data is an RMMuxContext
 * @param data_size value for the size field of the "DATA" chunk
 *                  (10 + 8 is added to it)
 * @param index_pos value stored in the "index offset" field of "PROP"
 * @return 0 on success, -1 if an audio stream has no codec tag
 */
static int rv10_write_header(AVFormatContext *ctx,
                             int data_size, int index_pos)
{
    RMMuxContext *mux = ctx->priv_data;
    AVIOContext *pb = ctx->pb;
    unsigned char *const header_start = pb->buf_ptr;
    unsigned char *data_offset_field;
    AVDictionaryEntry *entry;
    int total_bit_rate = 0, total_packets = 0, total_bytes = 0;
    int largest_packet = 0, longest_ms = 0;
    int avg_size, chunk_size, header_flags, data_pos, i;

    /* file header */
    ffio_wfourcc(pb, ".RMF");
    avio_wb32(pb, 18);                  /* header size */
    avio_wb16(pb, 0);
    avio_wb32(pb, 0);
    avio_wb32(pb, 4 + ctx->nb_streams); /* num headers */

    /* global properties */
    ffio_wfourcc(pb, "PROP");
    avio_wb32(pb, 50);
    avio_wb16(pb, 0);

    /* accumulate the per-stream statistics into file-wide totals */
    for (i = 0; i < ctx->nb_streams; i++) {
        const StreamInfo *st = &mux->streams[i];
        int ms = (int) (1000.0 * (float)st->total_frames / st->frame_rate);

        total_bit_rate += st->bit_rate;
        total_packets  += st->nb_packets;
        total_bytes    += st->packet_total_size;
        if (largest_packet < st->packet_max_size)
            largest_packet = st->packet_max_size;
        /* the file duration is the longest stream duration */
        if (longest_ms < ms)
            longest_ms = ms;
    }
    avg_size = total_packets > 0 ? total_bytes / total_packets : 0;

    avio_wb32(pb, total_bit_rate);  /* max bit rate */
    avio_wb32(pb, total_bit_rate);  /* avg bit rate */
    avio_wb32(pb, largest_packet);  /* max packet size */
    avio_wb32(pb, avg_size);        /* avg packet size */
    avio_wb32(pb, total_packets);   /* num packets */
    avio_wb32(pb, longest_ms);      /* duration */
    avio_wb32(pb, BUFFER_DURATION); /* preroll */
    avio_wb32(pb, index_pos);       /* index offset */

    /* Remember where the data offset lives inside the I/O buffer; it is
       only known once all the stream headers have been written. */
    data_offset_field = pb->buf_ptr;
    avio_wb32(pb, 0);               /* data offset: patched below */
    avio_wb16(pb, ctx->nb_streams); /* num streams */

    header_flags = 1 | 2;           /* save allowed & perfect play */
    if (!pb->seekable)
        header_flags |= 4;          /* live broadcast */
    avio_wb16(pb, header_flags);

    /* comments: the chunk size must be known before the strings are
       written, hence two passes over the metadata keys */
    ffio_wfourcc(pb, "CONT");
    chunk_size = 4 * 2 + 10;
    for (i = 0; i < FF_ARRAY_ELEMS(ff_rm_metadata); i++) {
        entry = av_dict_get(ctx->metadata, ff_rm_metadata[i], NULL, 0);
        if (entry)
            chunk_size += strlen(entry->value);
    }
    avio_wb32(pb, chunk_size);
    avio_wb16(pb, 0);
    for (i = 0; i < FF_ARRAY_ELEMS(ff_rm_metadata); i++) {
        entry = av_dict_get(ctx->metadata, ff_rm_metadata[i], NULL, 0);
        put_str(pb, entry ? entry->value : "");
    }

    /* one media properties chunk per stream */
    for (i = 0; i < ctx->nb_streams; i++) {
        StreamInfo *st = &mux->streams[i];
        const int is_audio = st->enc->codec_type == AVMEDIA_TYPE_AUDIO;
        const char *desc     = is_audio ? "The Audio Stream"
                                        : "The Video Stream";
        const char *mimetype = is_audio ? "audio/x-pn-realaudio"
                                        : "video/x-pn-realvideo";
        const int codec_data_size = is_audio ? 73 : 34;

        ffio_wfourcc(pb, "MDPR");
        chunk_size = 10 + 9 * 4 + strlen(desc) + strlen(mimetype) +
                     codec_data_size;
        avio_wb32(pb, chunk_size);
        avio_wb16(pb, 0);

        avg_size = st->nb_packets > 0
                 ? st->packet_total_size / st->nb_packets
                 : 0;

        avio_wb16(pb, i);                   /* stream number */
        avio_wb32(pb, st->bit_rate);        /* max bit rate */
        avio_wb32(pb, st->bit_rate);        /* avg bit rate */
        avio_wb32(pb, st->packet_max_size); /* max packet size */
        avio_wb32(pb, avg_size);            /* avg packet size */
        avio_wb32(pb, 0);                   /* start time */
        avio_wb32(pb, BUFFER_DURATION);     /* preroll */

        /* duration: one hour placeholder while the real one is unknown */
        if (pb->seekable && st->total_frames)
            avio_wb32(pb, (int)(st->total_frames * 1000 / st->frame_rate));
        else
            avio_wb32(pb, (int)(3600 * 1000));

        put_str8(pb, desc);
        put_str8(pb, mimetype);
        avio_wb32(pb, codec_data_size);

        if (is_audio) {
            const int sample_rate = st->enc->sample_rate;
            int coded_frame_size = (st->enc->bit_rate *
                                    st->enc->frame_size) / (8 * sample_rate);
            int fscode;

            /* audio codec info */
            avio_write(pb, ".ra", 3);
            avio_w8(pb, 0xfd);
            avio_wb32(pb, 0x00040000); /* version */
            ffio_wfourcc(pb, ".ra4");
            avio_wb32(pb, 0x01b53530); /* stream length */
            avio_wb16(pb, 4);          /* unknown */
            avio_wb32(pb, 0x39);       /* header size */

            switch (sample_rate) {
            case 48000:
            case 24000:
            case 12000:
                fscode = 1;
                break;
            case 32000:
            case 16000:
            case 8000:
                fscode = 3;
                break;
            default: /* 44100, 22050, 11025 and anything unrecognised */
                fscode = 2;
                break;
            }
            avio_wb16(pb, fscode); /* codec additional info, for AC-3, seems
                                      to be a frequency code */

            /* special hack to compensate rounding errors... */
            if (coded_frame_size == 557)
                coded_frame_size = 556;

            avio_wb32(pb, coded_frame_size); /* frame length */
            avio_wb32(pb, 0x51540);          /* unknown */
            avio_wb32(pb, 0x249f0);          /* unknown */
            avio_wb32(pb, 0x249f0);          /* unknown */
            avio_wb16(pb, 0x01);
            /* frame length : seems to be very important */
            avio_wb16(pb, coded_frame_size);
            avio_wb32(pb, 0);                /* unknown */
            avio_wb16(pb, st->enc->sample_rate); /* sample rate */
            avio_wb32(pb, 0x10);             /* unknown */
            avio_wb16(pb, st->enc->channels);
            put_str8(pb, "Int0");            /* codec name */

            if (!st->enc->codec_tag) {
                av_log(ctx, AV_LOG_ERROR, "Invalid codec tag\n");
                return -1;
            }
            avio_w8(pb, 4);                  /* tag length */
            avio_wl32(pb, st->enc->codec_tag);

            avio_wb16(pb, 0); /* title length */
            avio_wb16(pb, 0); /* author length */
            avio_wb16(pb, 0); /* copyright length */
            avio_w8(pb, 0);   /* end of header */
        } else {
            const int is_rv10 = st->enc->codec_id == CODEC_ID_RV10;

            /* video codec info */
            avio_wb32(pb, 34); /* size */
            ffio_wfourcc(pb, "VIDO");
            if (is_rv10)
                ffio_wfourcc(pb, "RV10");
            else
                ffio_wfourcc(pb, "RV20");
            avio_wb16(pb, st->enc->width);
            avio_wb16(pb, st->enc->height);
            avio_wb16(pb, (int) st->frame_rate); /* frames per seconds ? */
            avio_wb32(pb, 0);                    /* unknown meaning */
            avio_wb16(pb, (int) st->frame_rate); /* unknown meaning */
            avio_wb32(pb, 0);                    /* unknown meaning */
            avio_wb16(pb, 8);                    /* unknown meaning */
            /* Seems to be the codec version: only use basic H263. The next
               versions seems to add a diffential DC coding as in
               MPEG... nothing new under the sun */
            avio_wb32(pb, is_rv10 ? 0x10000000 : 0x20103001);
        }
    }

    /* Patch the data offset field, big-endian, directly in the I/O buffer.
       NOTE(review): this presumably relies on the header not having been
       flushed out of the buffer in the meantime - confirm. */
    data_pos = pb->buf_ptr - header_start;
    mux->data_pos = data_pos;
    data_offset_field[0] = data_pos >> 24;
    data_offset_field[1] = data_pos >> 16;
    data_offset_field[2] = data_pos >> 8;
    data_offset_field[3] = data_pos;

    /* data stream */
    ffio_wfourcc(pb, "DATA");
    avio_wb32(pb, data_size + 10 + 8);
    avio_wb16(pb, 0);

    avio_wb32(pb, total_packets); /* number of packets */
    avio_wb32(pb, 0);             /* next data header */
    return 0;
}

/**
 * Update the packet statistics of a stream and write the 12-byte header
 * that precedes every data packet.
 *
 * @param ctx       muxer context
 * @param stream    stream the packet belongs to; its counters are updated
 * @param length    payload length in bytes, not counting this header
 * @param key_frame non-zero if the packet is a key frame
 */
static void write_packet_header(AVFormatContext *ctx, StreamInfo *stream,
                                int length, int key_frame)
{
    AVIOContext *pb = ctx->pb;
    int timestamp_ms;

    /* bookkeeping used when the file header is rewritten */
    stream->nb_packets        += 1;
    stream->packet_total_size += length;
    if (stream->packet_max_size < length)
        stream->packet_max_size = length;

    /* the timestamp is derived from the frame counter, in milliseconds */
    timestamp_ms = (1000 * (float)stream->nb_frames) / stream->frame_rate;

    avio_wb16(pb, 0);                  /* version */
    avio_wb16(pb, length + 12);        /* length including this header */
    avio_wb16(pb, stream->num);        /* stream number */
    avio_wb32(pb, timestamp_ms);       /* timestamp */
    avio_w8(pb, 0);                    /* reserved */
    avio_w8(pb, key_frame ? 2 : 0);    /* flags */
}

/**
 * Muxer write_header callback: initialise the per-stream state and write a
 * first version of the file header (rewritten by the trailer when the
 * output is seekable).
 *
 * @param s muxer context; priv_data is an RMMuxContext
 * @return 0 on success, AVERROR_PATCHWELCOME if there are more streams than
 *         the private context can hold, -1 if a stream is neither audio
 *         nor video, AVERROR_INVALIDDATA if the header cannot be written
 */
static int rm_write_header(AVFormatContext *s)
{
    RMMuxContext *rm = s->priv_data;
    StreamInfo *stream;
    int n;
    AVCodecContext *codec;

    /* rm->streams[] is a fixed-size array indexed by stream index; refuse
       anything that would write past its end. */
    if (s->nb_streams > FF_ARRAY_ELEMS(rm->streams)) {
        av_log(s, AV_LOG_ERROR,
               "At most %d streams are currently supported for muxing in RM\n",
               (int)FF_ARRAY_ELEMS(rm->streams));
        return AVERROR_PATCHWELCOME;
    }

    for (n = 0; n < s->nb_streams; n++) {
        s->streams[n]->id = n;
        codec = s->streams[n]->codec;
        stream = &rm->streams[n];
        /* all counters (nb_packets, nb_frames, total_frames, ...) start at 0 */
        memset(stream, 0, sizeof(StreamInfo));
        stream->num = n;
        stream->bit_rate = codec->bit_rate;
        stream->enc = codec;

        switch (codec->codec_type) {
        case AVMEDIA_TYPE_AUDIO:
            rm->audio_stream = stream;
            /* audio "frames" per second */
            stream->frame_rate = (float)codec->sample_rate / (float)codec->frame_size;
            /* XXX: dummy value */
            stream->packet_max_size = 1024;
            break;
        case AVMEDIA_TYPE_VIDEO:
            rm->video_stream = stream;
            stream->frame_rate = (float)codec->time_base.den / (float)codec->time_base.num;
            /* XXX: dummy value */
            stream->packet_max_size = 4096;
            break;
        default:
            return -1;
        }
    }

    if (rv10_write_header(s, 0, 0))
        return AVERROR_INVALIDDATA;
    avio_flush(s->pb);
    return 0;
}

/**
 * Write one audio packet: packet header followed by the payload.
 *
 * For AC-3 the two bytes of every 16-bit word are swapped on output. The
 * swapped bytes are written straight to the I/O context, so no temporary
 * buffer (and no allocation that could fail) is needed. If size is odd,
 * the last byte has no partner and is written unchanged instead of
 * touching memory past the end of buf.
 *
 * @param s     muxer context; priv_data is an RMMuxContext
 * @param buf   packet payload
 * @param size  payload size in bytes
 * @param flags packet flags; AV_PKT_FLAG_KEY marks a key frame
 * @return 0
 */
static int rm_write_audio(AVFormatContext *s, const uint8_t *buf, int size, int flags)
{
    RMMuxContext *rm = s->priv_data;
    AVIOContext *pb = s->pb;
    StreamInfo *stream = rm->audio_stream;
    int i;

    write_packet_header(s, stream, size, !!(flags & AV_PKT_FLAG_KEY));

    if (stream->enc->codec_id == CODEC_ID_AC3) {
        /* for AC-3, the words seem to be reversed */
        for (i = 0; i + 1 < size; i += 2) {
            avio_w8(pb, buf[i + 1]);
            avio_w8(pb, buf[i]);
        }
        /* unpaired trailing byte of an odd-sized packet */
        if (i < size)
            avio_w8(pb, buf[i]);
    } else {
        avio_write(pb, buf, size);
    }
    avio_flush(pb);
    stream->nb_frames++;
    return 0;
}

/* Worst-case per-packet overhead for video: 12-byte packet header, 7-byte
   frame sub-header, plus 4 more bytes when 32-bit size fields are used. */
#define RM_VIDEO_MAX_HEADER_SIZE (7 + 4 + 12)
/* The packet length field is 16 bits wide and includes that overhead. */
#define RM_VIDEO_MAX_PACKET_SIZE (0xFFFF - RM_VIDEO_MAX_HEADER_SIZE)

/**
 * Write one video frame as a single packet: packet header, frame
 * sub-header, then the payload.
 *
 * Frames too large for the 16-bit packet length field are rejected
 * instead of being written with a truncated length.
 *
 * @param s     muxer context; priv_data is an RMMuxContext
 * @param buf   frame payload
 * @param size  payload size in bytes
 * @param flags packet flags; AV_PKT_FLAG_KEY marks a key frame
 * @return 0 on success, AVERROR_PATCHWELCOME if the frame is too large
 */
static int rm_write_video(AVFormatContext *s, const uint8_t *buf, int size, int flags)
{
    RMMuxContext *rm = s->priv_data;
    AVIOContext *pb = s->pb;
    StreamInfo *stream = rm->video_stream;
    int key_frame = !!(flags & AV_PKT_FLAG_KEY);

    if (size > RM_VIDEO_MAX_PACKET_SIZE) {
        av_log(s, AV_LOG_ERROR,
               "Muxing packets larger than 64 kB (%d) is not supported\n",
               size);
        return AVERROR_PATCHWELCOME;
    }

    /* XXX: this is incorrect: should be a parameter */

    /* Well, I spent some time finding the meaning of these bits. I am
       not sure I understood everything, but it works !! */
    write_packet_header(s, stream, size + 7 + (size >= 0x4000)*4, key_frame);
    /* bit 7: '1' if final packet of a frame converted in several packets */
    avio_w8(pb, 0x81);
    /* bit 7: '1' if I frame. bits 6..0 : sequence number in current
       frame starting from 1 */
    if (key_frame) {
        avio_w8(pb, 0x81);
    } else {
        avio_w8(pb, 0x01);
    }
    /* sizes below 0x4000 use 16-bit fields tagged with 0x4000, larger
       ones use plain 32-bit fields */
    if (size >= 0x4000) {
        avio_wb32(pb, size); /* total frame size */
        avio_wb32(pb, size); /* offset from the start or the end */
    } else {
        avio_wb16(pb, 0x4000 | size); /* total frame size */
        avio_wb16(pb, 0x4000 | size); /* offset from the start or the end */
    }
    avio_w8(pb, stream->nb_frames & 0xff);

    avio_write(pb, buf, size);
    avio_flush(pb);

    stream->nb_frames++;
    return 0;
}

/**
 * Muxer write_packet callback: hand the packet to the audio writer when it
 * belongs to an audio stream, and to the video writer otherwise.
 *
 * @param s   muxer context
 * @param pkt packet to write
 * @return the return value of the selected writer
 */
static int rm_write_packet(AVFormatContext *s, AVPacket *pkt)
{
    AVCodecContext *codec = s->streams[pkt->stream_index]->codec;

    if (codec->codec_type != AVMEDIA_TYPE_AUDIO)
        return rm_write_video(s, pkt->data, pkt->size, pkt->flags);

    return rm_write_audio(s, pkt->data, pkt->size, pkt->flags);
}

/**
 * Muxer write_trailer callback: write the end header and, when the output
 * is seekable, go back to the start of the file and rewrite the header
 * with the final frame counts and data size.
 *
 * @param s muxer context; priv_data is an RMMuxContext
 * @return 0
 */
static int rm_write_trailer(AVFormatContext *s)
{
    RMMuxContext *rm = s->priv_data;
    AVIOContext *pb = s->pb;
    const int can_seek = s->pb->seekable;
    int data_size = 0, index_pos, i;

    if (can_seek) {
        /* end of file: the data size must be measured before the end
           header is appended */
        index_pos = avio_tell(pb);
        data_size = index_pos - rm->data_pos;

        /* FIXME: write index */
    }

    /* undocumented end header */
    avio_wb32(pb, 0);
    avio_wb32(pb, 0);

    if (can_seek) {
        /* finish to write header */
        avio_seek(pb, 0, SEEK_SET);
        for (i = 0; i < s->nb_streams; i++)
            rm->streams[i].total_frames = rm->streams[i].nb_frames;
        rv10_write_header(s, data_size, 0);
    }

    avio_flush(pb);
    return 0;
}


463
AVOutputFormat ff_rm_muxer = {
464 465 466 467 468 469 470 471 472 473
    .name              = "rm",
    .long_name         = NULL_IF_CONFIG_SMALL("RealMedia format"),
    .mime_type         = "application/vnd.rn-realmedia",
    .extensions        = "rm,ra",
    .priv_data_size    = sizeof(RMMuxContext),
    .audio_codec       = CODEC_ID_AC3,
    .video_codec       = CODEC_ID_RV10,
    .write_header      = rm_write_header,
    .write_packet      = rm_write_packet,
    .write_trailer     = rm_write_trailer,
474
    .codec_tag= (const AVCodecTag* const []){ff_rm_codec_tags, 0},
475
};