avconv.c 80.6 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32
/*
 * avconv main
 * Copyright (c) 2000-2011 The libav developers.
 *
 * This file is part of Libav.
 *
 * Libav is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * Libav is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with Libav; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include "config.h"
#include <ctype.h>
#include <string.h>
#include <math.h>
#include <stdlib.h>
#include <errno.h>
#include <signal.h>
#include <limits.h>
#include "libavformat/avformat.h"
#include "libavdevice/avdevice.h"
#include "libswscale/swscale.h"
Justin Ruggles's avatar
Justin Ruggles committed
33
#include "libavresample/avresample.h"
34 35 36 37 38 39 40 41 42 43 44 45
#include "libavutil/opt.h"
#include "libavutil/audioconvert.h"
#include "libavutil/parseutils.h"
#include "libavutil/samplefmt.h"
#include "libavutil/colorspace.h"
#include "libavutil/fifo.h"
#include "libavutil/intreadwrite.h"
#include "libavutil/dict.h"
#include "libavutil/mathematics.h"
#include "libavutil/pixdesc.h"
#include "libavutil/avstring.h"
#include "libavutil/libm.h"
46
#include "libavutil/imgutils.h"
47
#include "libavutil/time.h"
48 49 50 51
#include "libavformat/os_support.h"

# include "libavfilter/avfilter.h"
# include "libavfilter/avfiltergraph.h"
52
# include "libavfilter/buffersrc.h"
53
# include "libavfilter/buffersink.h"
54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69

#if HAVE_SYS_RESOURCE_H
#include <sys/types.h>
#include <sys/resource.h>
#elif HAVE_GETPROCESSTIMES
#include <windows.h>
#endif
#if HAVE_GETPROCESSMEMORYINFO
#include <windows.h>
#include <psapi.h>
#endif

#if HAVE_SYS_SELECT_H
#include <sys/select.h>
#endif

70 71 72 73
#if HAVE_PTHREADS
#include <pthread.h>
#endif

74 75
#include <time.h>

76
#include "avconv.h"
77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92
#include "cmdutils.h"

#include "libavutil/avassert.h"

/* Program name and year constants (presumably consumed by the shared
 * cmdutils code for banners -- confirm against cmdutils.h). */
const char program_name[] = "avconv";
const int program_birth_year = 2000;

/* Video statistics output; opened on first use in do_video_stats() and
 * closed in exit_program(). */
static FILE *vstats_file;

/* video_size / audio_size: running sums of pkt.size added by do_video_out()
 * and do_audio_out() after each packet is handed to write_frame(). */
static int64_t video_size = 0;
static int64_t audio_size = 0;
/* NOTE(review): extra_size and nb_frames_dup are not updated in the part of
 * the file visible here; their meaning should be confirmed at their users. */
static int64_t extra_size = 0;
static int nb_frames_dup = 0;
/* Incremented by do_video_out() each time it discards a late frame. */
static int nb_frames_drop = 0;


93

94
#if HAVE_PTHREADS
95 96 97 98
/* signal to input threads that they should exit; set by the main thread */
static int transcoding_finished;
#endif

99 100
#define DEFAULT_PASS_LOGFILENAME_PREFIX "av2pass"

101 102 103 104
/* Global tables of input streams and input files together with their element
 * counts; both the entries and the arrays are released in exit_program(). */
InputStream **input_streams = NULL;
int        nb_input_streams = 0;
InputFile   **input_files   = NULL;
int        nb_input_files   = 0;
105

106 107 108 109
/* Global tables of output streams and output files together with their
 * element counts; both the entries and the arrays are released in
 * exit_program(). */
OutputStream **output_streams = NULL;
int         nb_output_streams = 0;
OutputFile   **output_files   = NULL;
int         nb_output_files   = 0;
110

111 112
/* Global table of filter graphs and its element count; torn down first in
 * exit_program(). */
FilterGraph **filtergraphs;
int        nb_filtergraphs;
113

114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131
/*
 * Emit an empty message at AV_LOG_QUIET level; called from sigterm_handler().
 * NOTE(review): the purpose of the empty av_log() call is not evident from
 * this file -- presumably it resets terminal/log state; confirm.
 */
static void term_exit(void)
{
    av_log(NULL, AV_LOG_QUIET, "");
}

/* Number of the most recent signal caught by sigterm_handler(); stays 0 until
 * a signal arrives. Read by exit_program() and poll_filters(). */
static volatile int received_sigterm = 0;
/* Count of signals caught so far; decode_interrupt_cb() returns non-zero once
 * this exceeds 1. */
static volatile int received_nb_signals = 0;

/*
 * Signal handler installed by term_init(): records the signal number, bumps
 * the signal counter, then calls term_exit().
 * NOTE(review): term_exit() calls av_log() from signal context -- confirm that
 * this is acceptable on the supported platforms.
 */
static void
sigterm_handler(int sig)
{
    received_sigterm = sig;
    received_nb_signals++;
    term_exit();
}

/* Register sigterm_handler() for every termination-type signal we react to. */
static void term_init(void)
{
    static const int handled_signals[] = {
        SIGINT,  /* Interrupt (ANSI).    */
        SIGTERM, /* Termination (ANSI).  */
#ifdef SIGXCPU
        SIGXCPU,
#endif
    };
    unsigned k;

    for (k = 0; k < sizeof(handled_signals) / sizeof(handled_signals[0]); k++)
        signal(handled_signals[k], sigterm_handler);
}

139
static int decode_interrupt_cb(void *ctx)
140 141 142 143
{
    return received_nb_signals > 1;
}

144
/* Interrupt callback descriptor built from decode_interrupt_cb() with NULL as
 * its second member. */
const AVIOInterruptCB int_cb = { decode_interrupt_cb, NULL };
145

146
static void exit_program(void)
147
{
148 149 150 151
    int i, j;

    for (i = 0; i < nb_filtergraphs; i++) {
        avfilter_graph_free(&filtergraphs[i]->graph);
152 153
        for (j = 0; j < filtergraphs[i]->nb_inputs; j++) {
            av_freep(&filtergraphs[i]->inputs[j]->name);
154
            av_freep(&filtergraphs[i]->inputs[j]);
155
        }
156
        av_freep(&filtergraphs[i]->inputs);
157 158
        for (j = 0; j < filtergraphs[i]->nb_outputs; j++) {
            av_freep(&filtergraphs[i]->outputs[j]->name);
159
            av_freep(&filtergraphs[i]->outputs[j]);
160
        }
161 162 163 164
        av_freep(&filtergraphs[i]->outputs);
        av_freep(&filtergraphs[i]);
    }
    av_freep(&filtergraphs);
165 166

    /* close files */
Aneesh Dogra's avatar
Aneesh Dogra committed
167
    for (i = 0; i < nb_output_files; i++) {
168
        AVFormatContext *s = output_files[i]->ctx;
169 170 171
        if (!(s->oformat->flags & AVFMT_NOFILE) && s->pb)
            avio_close(s->pb);
        avformat_free_context(s);
172 173
        av_dict_free(&output_files[i]->opts);
        av_freep(&output_files[i]);
174
    }
Janne Grunau's avatar
Janne Grunau committed
175
    for (i = 0; i < nb_output_streams; i++) {
176
        AVBitStreamFilterContext *bsfc = output_streams[i]->bitstream_filters;
Janne Grunau's avatar
Janne Grunau committed
177 178 179 180 181
        while (bsfc) {
            AVBitStreamFilterContext *next = bsfc->next;
            av_bitstream_filter_close(bsfc);
            bsfc = next;
        }
182
        output_streams[i]->bitstream_filters = NULL;
183
        avcodec_free_frame(&output_streams[i]->filtered_frame);
184

Anton Khirnov's avatar
Anton Khirnov committed
185
        av_freep(&output_streams[i]->forced_keyframes);
186
        av_freep(&output_streams[i]->avfilter);
187
        av_freep(&output_streams[i]->logfile_prefix);
188
        av_freep(&output_streams[i]);
Janne Grunau's avatar
Janne Grunau committed
189
    }
Aneesh Dogra's avatar
Aneesh Dogra committed
190
    for (i = 0; i < nb_input_files; i++) {
191 192
        avformat_close_input(&input_files[i]->ctx);
        av_freep(&input_files[i]);
193
    }
194
    for (i = 0; i < nb_input_streams; i++) {
195
        avcodec_free_frame(&input_streams[i]->decoded_frame);
196
        av_dict_free(&input_streams[i]->opts);
197
        free_buffer_pool(&input_streams[i]->buffer_pool);
198
        av_freep(&input_streams[i]->filters);
199
        av_freep(&input_streams[i]);
200
    }
201 202 203 204 205 206 207

    if (vstats_file)
        fclose(vstats_file);
    av_free(vstats_filename);

    av_freep(&input_streams);
    av_freep(&input_files);
208
    av_freep(&output_streams);
209
    av_freep(&output_files);
210 211 212 213

    uninit_opts();

    avfilter_uninit();
214
    avformat_network_deinit();
215 216

    if (received_sigterm) {
217 218
        av_log(NULL, AV_LOG_INFO, "Received signal %d: terminating.\n",
               (int) received_sigterm);
219 220 221 222
        exit (255);
    }
}

223
/*
 * Terminate the program if the dictionary m contains any entry: the first
 * entry's key is reported as an option that was not found.
 */
void assert_avoptions(AVDictionary *m)
{
    AVDictionaryEntry *leftover = av_dict_get(m, "", NULL, AV_DICT_IGNORE_SUFFIX);

    if (!leftover)
        return;

    av_log(NULL, AV_LOG_FATAL, "Option %s not found.\n", leftover->key);
    exit(1);
}

/*
 * Refuse to continue with an experimental codec unless the context's
 * strict_std_compliance allows experimental codecs.
 *
 * c       codec context whose codec is inspected
 * encoder non-zero when c is used for encoding, zero for decoding
 *
 * On refusal a hint is logged (including the default codec for the same id
 * when that one is not experimental) and the program exits with status 1.
 */
static void assert_codec_experimental(AVCodecContext *c, int encoder)
{
    const char *role;
    AVCodec *fallback;

    if (!(c->codec->capabilities & CODEC_CAP_EXPERIMENTAL))
        return;
    if (c->strict_std_compliance <= FF_COMPLIANCE_EXPERIMENTAL)
        return;

    role = encoder ? "encoder" : "decoder";
    av_log(NULL, AV_LOG_FATAL, "%s '%s' is experimental and might produce bad "
            "results.\nAdd '-strict experimental' if you want to use it.\n",
            role, c->codec->name);

    if (encoder)
        fallback = avcodec_find_encoder(c->codec->id);
    else
        fallback = avcodec_find_decoder(c->codec->id);

    if (!(fallback->capabilities & CODEC_CAP_EXPERIMENTAL))
        av_log(NULL, AV_LOG_FATAL, "Or use the non experimental %s '%s'.\n",
               role, fallback->name);
    exit(1);
}

/**
 * Pick the sample format to request from the decoder, given the format the
 * encoder wants.
 *
 * Nothing is done when the formats already agree, when a request has already
 * been made, or when the decoder advertises fewer than two formats. Otherwise
 * an exact match is requested if the decoder lists one; failing that, the
 * nearest format at or above the encoder's (in packed-format order) is
 * preferred over the nearest one below it.
 *
 * This is currently only used to request float output from decoders which
 * support multiple sample formats, one of which is AV_SAMPLE_FMT_FLT.
 * Ideally this will be removed in the future when decoders do not do format
 * conversion and only output in their native format.
 */
static void update_sample_fmt(AVCodecContext *dec, AVCodec *dec_codec,
                              AVCodecContext *enc)
{
    const enum AVSampleFormat *cand;
    enum AVSampleFormat best_higher = AV_SAMPLE_FMT_NONE;
    enum AVSampleFormat best_lower  = AV_SAMPLE_FMT_NONE;
    enum AVSampleFormat enc_packed;
    int higher_cost = INT_MAX, lower_cost = INT_MAX;
    int enc_planar;

    /* formats already agree */
    if (enc->sample_fmt == dec->sample_fmt)
        return;
    /* a decoder sample format has already been requested */
    if (dec->request_sample_fmt > AV_SAMPLE_FMT_NONE)
        return;

    /* the decoder must offer at least two formats to have a choice */
    if (!dec_codec || !dec_codec->sample_fmts)
        return;
    if (dec_codec->sample_fmts[0] == AV_SAMPLE_FMT_NONE ||
        dec_codec->sample_fmts[1] == AV_SAMPLE_FMT_NONE)
        return;

    enc_packed = av_get_packed_sample_fmt(enc->sample_fmt);
    enc_planar = av_sample_fmt_is_planar(enc->sample_fmt);

    for (cand = dec_codec->sample_fmts; *cand != AV_SAMPLE_FMT_NONE; cand++) {
        enum AVSampleFormat cand_packed;
        int cost;

        /* exact match with the encoder: take it right away */
        if (*cand == enc->sample_fmt) {
            dec->request_sample_fmt = *cand;
            return;
        }

        /* distance between packed formats dominates; a planar/packed
           mismatch only breaks ties */
        cand_packed = av_get_packed_sample_fmt(*cand);
        cost        = 32 * abs(cand_packed - enc_packed);
        if (av_sample_fmt_is_planar(*cand) != enc_planar)
            cost++;

        if (cand_packed == enc_packed ||
            (cand_packed > enc_packed && cost < higher_cost)) {
            higher_cost = cost;
            best_higher = *cand;
        } else if (cand_packed < enc_packed && cost < lower_cost) {
            lower_cost = cost;
            best_lower = *cand;
        }
    }

    /* if none match, provide the one that matches quality closest */
    if (higher_cost != INT_MAX)
        dec->request_sample_fmt = best_higher;
    else
        dec->request_sample_fmt = best_lower;
}

308
/*
 * Run a packet through the stream's bitstream filter chain and pass it to
 * av_interleaved_write_frame().
 *
 * s   muxer context the packet is written to
 * pkt packet to write; its contents are replaced by the filtered packet
 * ost output stream the packet belongs to
 *
 * Exits with status 1 when muxing fails, or when a bitstream filter fails and
 * exit_on_error is set.
 */
static void write_frame(AVFormatContext *s, AVPacket *pkt, OutputStream *ost)
{
    AVCodecContext *codec_ctx = ost->st->codec;
    AVBitStreamFilterContext *bsf;
    int status;

    /*
     * Audio encoders may split the packets --  #frames in != #packets out.
     * But there is no reordering, so we can limit the number of output packets
     * by simply dropping them here.
     * Counting encoded video frames needs to be done separately because of
     * reordering, see do_video_out()
     */
    if (!(codec_ctx->codec_type == AVMEDIA_TYPE_VIDEO && codec_ctx->codec)) {
        if (ost->frame_number >= ost->max_frames) {
            av_free_packet(pkt);
            return;
        }
        ost->frame_number++;
    }

    for (bsf = ost->bitstream_filters; bsf; bsf = bsf->next) {
        AVPacket filtered = *pkt;

        status = av_bitstream_filter_filter(bsf, codec_ctx, NULL,
                                            &filtered.data, &filtered.size,
                                            pkt->data, pkt->size,
                                            pkt->flags & AV_PKT_FLAG_KEY);
        if (status < 0) {
            av_log(NULL, AV_LOG_ERROR, "%s failed for stream %d, codec %s",
                   bsf->filter->name, pkt->stream_index,
                   codec_ctx->codec ? codec_ctx->codec->name : "copy");
            print_error("", status);
            if (exit_on_error)
                exit(1);
        } else if (status > 0) {
            /* positive result: release the input packet and give the
               filtered one a destructor */
            av_free_packet(pkt);
            filtered.destruct = av_destruct_packet;
        }

        *pkt = filtered;
    }

    pkt->stream_index = ost->index;

    status = av_interleaved_write_frame(s, pkt);
    if (status < 0) {
        print_error("av_interleaved_write_frame()", status);
        exit(1);
    }
}

359 360
/*
 * Check whether the stream is still within its output file's recording time.
 *
 * Returns 1 while more data may be written. Returns 0, and marks the stream
 * as finished, once the time elapsed since first_pts has reached the limit.
 * A recording_time of INT64_MAX means no limit.
 */
static int check_recording_time(OutputStream *ost)
{
    OutputFile *of = output_files[ost->file_index];

    if (of->recording_time == INT64_MAX)
        return 1;

    if (av_compare_ts(ost->sync_opts - ost->first_pts, ost->st->codec->time_base,
                      of->recording_time, AV_TIME_BASE_Q) < 0)
        return 1;

    ost->finished = 1;
    return 0;
}

372 373
/*
 * Encode one audio frame and write the resulting packet, if any.
 *
 * s     muxer context of the output file
 * ost   output stream being encoded
 * frame audio frame to encode; its pts may be overwritten with the stream's
 *       running sample position
 *
 * Exits with status 1 when the encoder reports an error.
 */
static void do_audio_out(AVFormatContext *s, OutputStream *ost,
                         AVFrame *frame)
{
    AVCodecContext *enc = ost->st->codec;
    AVPacket pkt;
    int got_packet = 0;

    if (!check_recording_time(ost))
        return;

    av_init_packet(&pkt);
    pkt.data = NULL;
    pkt.size = 0;

    /* frames without a usable timestamp continue at the expected position */
    if (frame->pts == AV_NOPTS_VALUE || audio_sync_method < 0)
        frame->pts = ost->sync_opts;
    ost->sync_opts = frame->pts + frame->nb_samples;

    if (avcodec_encode_audio2(enc, &pkt, frame, &got_packet) < 0) {
        av_log(NULL, AV_LOG_FATAL, "Audio encoding failed\n");
        exit(1);
    }

    if (!got_packet)
        return;

    /* convert timing from the encoder time base to the stream time base */
    if (pkt.pts != AV_NOPTS_VALUE)
        pkt.pts      = av_rescale_q(pkt.pts,      enc->time_base, ost->st->time_base);
    if (pkt.dts != AV_NOPTS_VALUE)
        pkt.dts      = av_rescale_q(pkt.dts,      enc->time_base, ost->st->time_base);
    if (pkt.duration > 0)
        pkt.duration = av_rescale_q(pkt.duration, enc->time_base, ost->st->time_base);

    write_frame(s, &pkt, ost);

    audio_size += pkt.size;
}

/*
 * Optionally deinterlace a decoded picture in place.
 *
 * ist     input stream; its codec context supplies pixel format and size
 * picture picture to process; on successful deinterlacing it is overwritten
 *         with a picture whose planes live in a newly allocated buffer
 * bufp    receives that buffer (to be released by the caller with av_free())
 *         or NULL when no buffer was allocated
 *
 * *bufp is written on every path, including allocation failure, so the
 * caller never sees an indeterminate pointer. When do_deinterlace is unset,
 * or when any step fails, the picture is left untouched.
 */
static void pre_process_video_frame(InputStream *ist, AVPicture *picture, void **bufp)
{
    AVCodecContext *dec = ist->st->codec;
    AVPicture deinterlaced;
    uint8_t *buf;
    int size;

    *bufp = NULL;

    /* deinterlace : must be done before any resize */
    if (!do_deinterlace)
        return;

    /* create temporary picture */
    size = avpicture_get_size(dec->pix_fmt, dec->width, dec->height);
    if (size < 0)
        return; /* invalid format/dimensions: do not hand a negative size to av_malloc() */

    buf = av_malloc(size);
    if (!buf)
        return;

    avpicture_fill(&deinterlaced, buf, dec->pix_fmt, dec->width, dec->height);

    if (avpicture_deinterlace(&deinterlaced, picture,
                              dec->pix_fmt, dec->width, dec->height) < 0) {
        /* if error, do not deinterlace */
        av_log(NULL, AV_LOG_WARNING, "Deinterlacing failed\n");
        av_free(buf);
        return;
    }

    *picture = deinterlaced;
    *bufp    = buf;
}

/*
 * Encode one subtitle and write the resulting packet(s).
 *
 * s   muxer context of the output file
 * ost output stream being encoded
 * ist input stream the subtitle came from (supplies the time base of pts)
 * sub subtitle to encode; its pts and display times are rewritten
 * pts subtitle timestamp in the input stream's time base
 *
 * A subtitle without a timestamp is rejected (fatal only if exit_on_error is
 * set). Encoder failure and failure to allocate the encode buffer exit with
 * status 1.
 */
static void do_subtitle_out(AVFormatContext *s,
                            OutputStream *ost,
                            InputStream *ist,
                            AVSubtitle *sub,
                            int64_t pts)
{
    /* encode buffer, allocated on first use and kept for later calls */
    static uint8_t *subtitle_out = NULL;
    int subtitle_out_max_size = 1024 * 1024;
    int subtitle_out_size, nb, i;
    AVCodecContext *enc;
    AVPacket pkt;

    if (pts == AV_NOPTS_VALUE) {
        av_log(NULL, AV_LOG_ERROR, "Subtitle packets must have a pts\n");
        if (exit_on_error)
            exit(1);
        return;
    }

    enc = ost->st->codec;

    if (!subtitle_out) {
        subtitle_out = av_malloc(subtitle_out_max_size);
        if (!subtitle_out) {
            /* never pass a NULL buffer to the encoder */
            av_log(NULL, AV_LOG_FATAL, "Failed to allocate subtitle_out\n");
            exit(1);
        }
    }

    /* Note: DVB subtitle need one packet to draw them and one other
       packet to clear them */
    /* XXX: signal it in the codec context ? */
    if (enc->codec_id == AV_CODEC_ID_DVB_SUBTITLE)
        nb = 2;
    else
        nb = 1;

    for (i = 0; i < nb; i++) {
        ost->sync_opts = av_rescale_q(pts, ist->st->time_base, enc->time_base);
        if (!check_recording_time(ost))
            return;

        sub->pts = av_rescale_q(pts, ist->st->time_base, AV_TIME_BASE_Q);
        // start_display_time is required to be 0
        sub->pts               += av_rescale_q(sub->start_display_time, (AVRational){ 1, 1000 }, AV_TIME_BASE_Q);
        sub->end_display_time  -= sub->start_display_time;
        sub->start_display_time = 0;
        subtitle_out_size = avcodec_encode_subtitle(enc, subtitle_out,
                                                    subtitle_out_max_size, sub);
        if (subtitle_out_size < 0) {
            av_log(NULL, AV_LOG_FATAL, "Subtitle encoding failed\n");
            exit(1);
        }

        av_init_packet(&pkt);
        pkt.data = subtitle_out;
        pkt.size = subtitle_out_size;
        pkt.pts  = av_rescale_q(sub->pts, AV_TIME_BASE_Q, ost->st->time_base);
        if (enc->codec_id == AV_CODEC_ID_DVB_SUBTITLE) {
            /* XXX: the pts correction is handled here. Maybe handling
               it in the codec would be better */
            /* start_display_time was zeroed above, so the i == 0 offset is 0 */
            if (i == 0)
                pkt.pts += 90 * sub->start_display_time;
            else
                pkt.pts += 90 * sub->end_display_time;
        }
        write_frame(s, &pkt, ost);
    }
}

514 515 516
/*
 * Encode one video frame (or wrap it as a raw picture) and pass the packet
 * to write_frame().
 *
 * s          muxer context of the output file
 * ost        output stream being encoded
 * in_picture frame to encode; a missing pts is filled in from the stream's
 *            expected position
 * frame_size set to the packet size read after write_frame() when the
 *            encoder produced a packet, 0 in every other case
 *
 * Late frames are dropped and counted in nb_frames_drop. Exits with status 1
 * when the encoder reports an error.
 */
static void do_video_out(AVFormatContext *s,
                         OutputStream *ost,
                         AVFrame *in_picture,
                         int *frame_size)
{
    AVCodecContext *enc = ost->st->codec;
    AVPacket pkt;
    int sync_mode = video_sync_method;
    int status;

    *frame_size = 0;

    /* resolve the automatic sync mode from the muxer's capabilities */
    if (sync_mode == VSYNC_AUTO) {
        if (s->oformat->flags & AVFMT_NOTIMESTAMPS)
            sync_mode = VSYNC_PASSTHROUGH;
        else if (s->oformat->flags & AVFMT_VARIABLE_FPS)
            sync_mode = VSYNC_VFR;
        else
            sync_mode = VSYNC_CFR;
    }

    /* outside passthrough mode, a frame after the first one whose timestamp
       lies before the expected position is dropped */
    if (sync_mode != VSYNC_PASSTHROUGH &&
        ost->frame_number &&
        in_picture->pts != AV_NOPTS_VALUE &&
        in_picture->pts < ost->sync_opts) {
        nb_frames_drop++;
        av_log(NULL, AV_LOG_VERBOSE, "*** drop!\n");
        return;
    }

    if (in_picture->pts == AV_NOPTS_VALUE)
        in_picture->pts = ost->sync_opts;
    ost->sync_opts = in_picture->pts;

    if (!ost->frame_number)
        ost->first_pts = in_picture->pts;

    av_init_packet(&pkt);
    pkt.data = NULL;
    pkt.size = 0;

    if (!check_recording_time(ost))
        return;
    if (ost->frame_number >= ost->max_frames)
        return;

    if ((s->oformat->flags & AVFMT_RAWPICTURE) &&
        enc->codec->id == AV_CODEC_ID_RAWVIDEO) {
        /* raw pictures are written as AVPicture structure to
           avoid any copies. We support temporarily the older
           method. */
        enc->coded_frame->interlaced_frame = in_picture->interlaced_frame;
        enc->coded_frame->top_field_first  = in_picture->top_field_first;
        pkt.data   = (uint8_t *)in_picture;
        pkt.size   =  sizeof(AVPicture);
        pkt.pts    = av_rescale_q(in_picture->pts, enc->time_base, ost->st->time_base);
        pkt.flags |= AV_PKT_FLAG_KEY;

        write_frame(s, &pkt, ost);
    } else {
        AVFrame enc_frame = *in_picture;
        int got_packet;

        /* better than nothing: use input picture interlaced
           settings */
        enc_frame.interlaced_frame = in_picture->interlaced_frame;
        if (enc->flags & (CODEC_FLAG_INTERLACED_DCT|CODEC_FLAG_INTERLACED_ME))
            enc_frame.top_field_first = ost->top_field_first == -1
                                      ? in_picture->top_field_first
                                      : !!ost->top_field_first;

        enc_frame.quality = enc->global_quality;
        if (!enc->me_threshold)
            enc_frame.pict_type = 0;

        /* force a keyframe once the next requested keyframe time is reached */
        if (ost->forced_kf_index < ost->forced_kf_count &&
            enc_frame.pts >= ost->forced_kf_pts[ost->forced_kf_index]) {
            enc_frame.pict_type = AV_PICTURE_TYPE_I;
            ost->forced_kf_index++;
        }

        status = avcodec_encode_video2(enc, &pkt, &enc_frame, &got_packet);
        if (status < 0) {
            av_log(NULL, AV_LOG_FATAL, "Video encoding failed\n");
            exit(1);
        }

        if (got_packet) {
            if (pkt.pts != AV_NOPTS_VALUE)
                pkt.pts = av_rescale_q(pkt.pts, enc->time_base, ost->st->time_base);
            if (pkt.dts != AV_NOPTS_VALUE)
                pkt.dts = av_rescale_q(pkt.dts, enc->time_base, ost->st->time_base);

            write_frame(s, &pkt, ost);
            *frame_size = pkt.size;
            video_size += pkt.size;

            /* if two pass, output log */
            if (ost->logfile && enc->stats_out)
                fprintf(ost->logfile, "%s", enc->stats_out);
        }
    }

    ost->sync_opts++;
    /*
     * For video, number of frames in == number of packets out.
     * But there may be reordering, so we can't throw away frames on encoder
     * flush, we need to limit them here, before they go into encoder.
     */
    ost->frame_number++;
}

Aneesh Dogra's avatar
Aneesh Dogra committed
621 622 623
static double psnr(double d)
{
    return -10.0 * log(d) / log(10.0);
624 625 626 627 628 629 630 631 632 633 634 635 636 637
}

/*
 * Append one line of per-frame statistics to the vstats file.
 *
 * os         not used by this function
 * ost        video output stream the frame belongs to
 * frame_size size of the packet just written
 *
 * The file named by vstats_filename is opened on the first call; failure to
 * open it exits with status 1. Nothing is written for non-video streams.
 */
static void do_video_stats(AVFormatContext *os, OutputStream *ost,
                           int frame_size)
{
    AVCodecContext *enc;
    double seconds_per_tick, elapsed, bitrate, avg_bitrate;
    int frame_number;

    /* this is executed just the first time do_video_stats is called */
    if (!vstats_file) {
        vstats_file = fopen(vstats_filename, "w");
        if (!vstats_file) {
            perror("fopen");
            exit(1);
        }
    }

    enc = ost->st->codec;
    if (enc->codec_type != AVMEDIA_TYPE_VIDEO)
        return;

    frame_number = ost->frame_number;
    fprintf(vstats_file, "frame= %5d q= %2.1f ", frame_number, enc->coded_frame->quality / (float)FF_QP2LAMBDA);
    if (enc->flags & CODEC_FLAG_PSNR)
        fprintf(vstats_file, "PSNR= %6.2f ", psnr(enc->coded_frame->error[0] / (enc->width * enc->height * 255.0 * 255.0)));

    fprintf(vstats_file,"f_size= %6d ", frame_size);

    /* compute pts value; clamped so the average below never divides by ~0 */
    seconds_per_tick = av_q2d(enc->time_base);
    elapsed          = ost->sync_opts * seconds_per_tick;
    if (elapsed < 0.01)
        elapsed = 0.01;

    bitrate     = (frame_size * 8) / seconds_per_tick / 1000.0;
    avg_bitrate = (double)(video_size * 8) / elapsed / 1000.0;
    fprintf(vstats_file, "s_size= %8.0fkB time= %0.3f br= %7.1fkbits/s avg_br= %7.1fkbits/s ",
           (double)video_size / 1024, elapsed, bitrate, avg_bitrate);
    fprintf(vstats_file, "type= %c\n", av_get_picture_type_char(enc->coded_frame->pict_type));
}

663 664 665 666
/**
 * Pull one frame from the buffer sink feeding ost and encode it.
 *
 * @return 0 when a frame was handled (or skipped because it lies before the
 *         output file's start time), AVERROR(ENOMEM) when the reusable frame
 *         cannot be allocated, otherwise the negative value returned by the
 *         buffer sink read.
 */
static int poll_filter(OutputStream *ost)
{
    OutputFile        *of = output_files[ost->file_index];
    AVFilterContext   *sink;
    AVFilterLink      *inlink;
    AVFilterBufferRef *picref;
    AVFrame           *frame;
    int frame_size, status;

    /* the frame is allocated once per stream and reset before every use */
    if (!ost->filtered_frame) {
        ost->filtered_frame = avcodec_alloc_frame();
        if (!ost->filtered_frame)
            return AVERROR(ENOMEM);
    }
    avcodec_get_frame_defaults(ost->filtered_frame);
    frame = ost->filtered_frame;

    sink = ost->filter->filter;

    /* audio encoders without the variable-frame-size capability are fed
       exactly frame_size samples per read */
    if (ost->enc->type == AVMEDIA_TYPE_AUDIO &&
        !(ost->enc->capabilities & CODEC_CAP_VARIABLE_FRAME_SIZE))
        status = av_buffersink_read_samples(sink, &picref,
                                            ost->st->codec->frame_size);
    else
        status = av_buffersink_read(sink, &picref);

    if (status < 0)
        return status;

    inlink = sink->inputs[0];

    avfilter_copy_buf_props(frame, picref);
    if (picref->pts != AV_NOPTS_VALUE) {
        /* timestamp in encoder time base, relative to the file start time */
        frame->pts = av_rescale_q(picref->pts,
                                  inlink->time_base,
                                  ost->st->codec->time_base) -
                     av_rescale_q(of->start_time,
                                  AV_TIME_BASE_Q,
                                  ost->st->codec->time_base);

        if (of->start_time && frame->pts < 0) {
            avfilter_unref_buffer(picref);
            return 0;
        }
    }

    if (inlink->type == AVMEDIA_TYPE_VIDEO) {
        if (!ost->frame_aspect_ratio)
            ost->st->codec->sample_aspect_ratio = picref->video->pixel_aspect;

        do_video_out(of->ctx, ost, frame, &frame_size);
        if (vstats_filename && frame_size)
            do_video_stats(of->ctx, ost, frame_size);
    } else if (inlink->type == AVMEDIA_TYPE_AUDIO) {
        do_audio_out(of->ctx, ost, frame);
    } else {
        // TODO support subtitle filters
        av_assert0(0);
    }

    avfilter_unref_buffer(picref);

    return 0;
}

726 727 728 729 730 731 732 733 734 735
/**
 * Read as many frames from possible from lavfi and encode them.
 *
 * Always read from the active stream with the lowest timestamp. If no frames
 * are available for it then return EAGAIN and wait for more input. This way we
 * can use lavfi sources that generate unlimited amount of frames without memory
 * usage exploding.
 */
static int poll_filters(void)
{
736
    int i, j, ret = 0;
737 738 739 740 741 742 743 744 745

    while (ret >= 0 && !received_sigterm) {
        OutputStream *ost = NULL;
        int64_t min_pts = INT64_MAX;

        /* choose output stream with the lowest timestamp */
        for (i = 0; i < nb_output_streams; i++) {
            int64_t pts = output_streams[i]->sync_opts;

746
            if (!output_streams[i]->filter || output_streams[i]->finished)
747 748 749 750 751 752 753 754 755 756 757 758 759 760 761 762
                continue;

            pts = av_rescale_q(pts, output_streams[i]->st->codec->time_base,
                               AV_TIME_BASE_Q);
            if (pts < min_pts) {
                min_pts = pts;
                ost = output_streams[i];
            }
        }

        if (!ost)
            break;

        ret = poll_filter(ost);

        if (ret == AVERROR_EOF) {
763 764
            OutputFile *of = output_files[ost->file_index];

765
            ost->finished = 1;
766

767 768 769 770
            if (of->shortest) {
                for (j = 0; j < of->ctx->nb_streams; j++)
                    output_streams[of->ost_index + j]->finished = 1;
            }
771 772 773 774 775 776 777 778 779

            ret = 0;
        } else if (ret == AVERROR(EAGAIN))
            return 0;
    }

    return ret;
}

780
static void print_report(int is_last_report, int64_t timer_start)
781 782 783 784 785 786 787 788 789 790 791
{
    char buf[1024];
    OutputStream *ost;
    AVFormatContext *oc;
    int64_t total_size;
    AVCodecContext *enc;
    int frame_number, vid, i;
    double bitrate, ti1, pts;
    static int64_t last_time = -1;
    static int qp_histogram[52];

792 793 794
    if (!print_stats && !is_last_report)
        return;

795 796 797 798 799 800 801 802 803 804 805 806 807 808
    if (!is_last_report) {
        int64_t cur_time;
        /* display the report every 0.5 seconds */
        cur_time = av_gettime();
        if (last_time == -1) {
            last_time = cur_time;
            return;
        }
        if ((cur_time - last_time) < 500000)
            return;
        last_time = cur_time;
    }


809
    oc = output_files[0]->ctx;
810 811

    total_size = avio_size(oc->pb);
Aneesh Dogra's avatar
Aneesh Dogra committed
812 813
    if (total_size < 0) // FIXME improve avio_size() so it works with non seekable output too
        total_size = avio_tell(oc->pb);
814 815 816 817

    buf[0] = '\0';
    ti1 = 1e10;
    vid = 0;
818
    for (i = 0; i < nb_output_streams; i++) {
819
        float q = -1;
820
        ost = output_streams[i];
821
        enc = ost->st->codec;
822
        if (!ost->stream_copy && enc->coded_frame)
Aneesh Dogra's avatar
Aneesh Dogra committed
823
            q = enc->coded_frame->quality / (float)FF_QP2LAMBDA;
824 825 826 827
        if (vid && enc->codec_type == AVMEDIA_TYPE_VIDEO) {
            snprintf(buf + strlen(buf), sizeof(buf) - strlen(buf), "q=%2.1f ", q);
        }
        if (!vid && enc->codec_type == AVMEDIA_TYPE_VIDEO) {
Aneesh Dogra's avatar
Aneesh Dogra committed
828
            float t = (av_gettime() - timer_start) / 1000000.0;
829 830 831

            frame_number = ost->frame_number;
            snprintf(buf + strlen(buf), sizeof(buf) - strlen(buf), "frame=%5d fps=%3d q=%3.1f ",
Aneesh Dogra's avatar
Aneesh Dogra committed
832 833
                     frame_number, (t > 1) ? (int)(frame_number / t + 0.5) : 0, q);
            if (is_last_report)
834
                snprintf(buf + strlen(buf), sizeof(buf) - strlen(buf), "L");
Aneesh Dogra's avatar
Aneesh Dogra committed
835
            if (qp_hist) {
836 837
                int j;
                int qp = lrintf(q);
Aneesh Dogra's avatar
Aneesh Dogra committed
838
                if (qp >= 0 && qp < FF_ARRAY_ELEMS(qp_histogram))
839
                    qp_histogram[qp]++;
Aneesh Dogra's avatar
Aneesh Dogra committed
840
                for (j = 0; j < 32; j++)
841
                    snprintf(buf + strlen(buf), sizeof(buf) - strlen(buf), "%X", (int)lrintf(log2(qp_histogram[j] + 1)));
842
            }
Aneesh Dogra's avatar
Aneesh Dogra committed
843
            if (enc->flags&CODEC_FLAG_PSNR) {
844
                int j;
Aneesh Dogra's avatar
Aneesh Dogra committed
845 846 847
                double error, error_sum = 0;
                double scale, scale_sum = 0;
                char type[3] = { 'Y','U','V' };
848
                snprintf(buf + strlen(buf), sizeof(buf) - strlen(buf), "PSNR=");
Aneesh Dogra's avatar
Aneesh Dogra committed
849 850 851 852 853 854 855
                for (j = 0; j < 3; j++) {
                    if (is_last_report) {
                        error = enc->error[j];
                        scale = enc->width * enc->height * 255.0 * 255.0 * frame_number;
                    } else {
                        error = enc->coded_frame->error[j];
                        scale = enc->width * enc->height * 255.0 * 255.0;
856
                    }
Aneesh Dogra's avatar
Aneesh Dogra committed
857 858
                    if (j)
                        scale /= 4;
859 860
                    error_sum += error;
                    scale_sum += scale;
Aneesh Dogra's avatar
Aneesh Dogra committed
861
                    snprintf(buf + strlen(buf), sizeof(buf) - strlen(buf), "%c:%2.2f ", type[j], psnr(error / scale));
862
                }
Aneesh Dogra's avatar
Aneesh Dogra committed
863
                snprintf(buf + strlen(buf), sizeof(buf) - strlen(buf), "*:%2.2f ", psnr(error_sum / scale_sum));
864 865 866 867 868 869 870 871 872 873 874
            }
            vid = 1;
        }
        /* compute min output value */
        pts = (double)ost->st->pts.val * av_q2d(ost->st->time_base);
        if ((pts < ti1) && (pts > 0))
            ti1 = pts;
    }
    if (ti1 < 0.01)
        ti1 = 0.01;

875
    bitrate = (double)(total_size * 8) / ti1 / 1000.0;
876

877
    snprintf(buf + strlen(buf), sizeof(buf) - strlen(buf),
878 879 880
            "size=%8.0fkB time=%0.2f bitrate=%6.1fkbits/s",
            (double)total_size / 1024, ti1, bitrate);

881 882 883
    if (nb_frames_dup || nb_frames_drop)
        snprintf(buf + strlen(buf), sizeof(buf) - strlen(buf), " dup=%d drop=%d",
                nb_frames_dup, nb_frames_drop);
884

885
    av_log(NULL, AV_LOG_INFO, "%s    \r", buf);
886

887
    fflush(stderr);
888

889
    if (is_last_report) {
890
        int64_t raw= audio_size + video_size + extra_size;
891 892
        av_log(NULL, AV_LOG_INFO, "\n");
        av_log(NULL, AV_LOG_INFO, "video:%1.0fkB audio:%1.0fkB global headers:%1.0fkB muxing overhead %f%%\n",
Aneesh Dogra's avatar
Aneesh Dogra committed
893 894 895 896
               video_size / 1024.0,
               audio_size / 1024.0,
               extra_size / 1024.0,
               100.0 * (total_size - raw) / raw
897 898 899 900
        );
    }
}

901
static void flush_encoders(void)
902 903 904
{
    int i, ret;

905
    for (i = 0; i < nb_output_streams; i++) {
906
        OutputStream   *ost = output_streams[i];
907
        AVCodecContext *enc = ost->st->codec;
908
        AVFormatContext *os = output_files[ost->file_index]->ctx;
909
        int stop_encoding = 0;
910

911
        if (!ost->encoding_needed)
912 913
            continue;

Aneesh Dogra's avatar
Aneesh Dogra committed
914
        if (ost->st->codec->codec_type == AVMEDIA_TYPE_AUDIO && enc->frame_size <= 1)
915
            continue;
916
        if (ost->st->codec->codec_type == AVMEDIA_TYPE_VIDEO && (os->oformat->flags & AVFMT_RAWPICTURE) && enc->codec->id == AV_CODEC_ID_RAWVIDEO)
917 918
            continue;

Aneesh Dogra's avatar
Aneesh Dogra committed
919
        for (;;) {
920 921 922
            int (*encode)(AVCodecContext*, AVPacket*, const AVFrame*, int*) = NULL;
            const char *desc;
            int64_t *size;
923 924 925

            switch (ost->st->codec->codec_type) {
            case AVMEDIA_TYPE_AUDIO:
926 927 928
                encode = avcodec_encode_audio2;
                desc   = "Audio";
                size   = &audio_size;
929 930
                break;
            case AVMEDIA_TYPE_VIDEO:
931 932 933 934 935 936 937 938 939 940 941 942 943 944 945 946
                encode = avcodec_encode_video2;
                desc   = "Video";
                size   = &video_size;
                break;
            default:
                stop_encoding = 1;
            }

            if (encode) {
                AVPacket pkt;
                int got_packet;
                av_init_packet(&pkt);
                pkt.data = NULL;
                pkt.size = 0;

                ret = encode(enc, &pkt, NULL, &got_packet);
947
                if (ret < 0) {
948
                    av_log(NULL, AV_LOG_FATAL, "%s encoding failed\n", desc);
949
                    exit(1);
950
                }
951
                *size += ret;
952 953 954
                if (ost->logfile && enc->stats_out) {
                    fprintf(ost->logfile, "%s", enc->stats_out);
                }
955
                if (!got_packet) {
956 957 958
                    stop_encoding = 1;
                    break;
                }
959 960 961 962
                if (pkt.pts != AV_NOPTS_VALUE)
                    pkt.pts = av_rescale_q(pkt.pts, enc->time_base, ost->st->time_base);
                if (pkt.dts != AV_NOPTS_VALUE)
                    pkt.dts = av_rescale_q(pkt.dts, enc->time_base, ost->st->time_base);
963
                write_frame(os, &pkt, ost);
964
            }
965

966
            if (stop_encoding)
967
                break;
968 969 970 971
        }
    }
}

972 973 974 975 976
/*
 * Decide whether a packet read from ist may be written to ost right now.
 *
 * Returns 1 when ist is the source stream of ost and, if the output file has
 * a non-zero start time, ist->last_dts is not before that start time;
 * returns 0 otherwise.
 */
static int check_output_constraints(InputStream *ist, OutputStream *ost)
{
    const OutputFile *outfile = output_files[ost->file_index];
    /* index of ist in the global input stream numbering */
    const int global_index    = input_files[ist->file_index]->ist_index +
                                ist->st->index;
    const int from_source     = ost->source_index == global_index;
    const int before_start    = outfile->start_time &&
                                ist->last_dts < outfile->start_time;

    return from_source && !before_start;
}

static void do_streamcopy(InputStream *ist, OutputStream *ost, const AVPacket *pkt)
{
991
    OutputFile *of = output_files[ost->file_index];
992 993 994 995 996 997 998 999 1000
    int64_t ost_tb_start_time = av_rescale_q(of->start_time, AV_TIME_BASE_Q, ost->st->time_base);
    AVPacket opkt;

    av_init_packet(&opkt);

    if ((!ost->frame_number && !(pkt->flags & AV_PKT_FLAG_KEY)) &&
        !ost->copy_initial_nonkeyframes)
        return;

1001
    if (of->recording_time != INT64_MAX &&
1002
        ist->last_dts >= of->recording_time + of->start_time) {
1003
        ost->finished = 1;
1004 1005 1006
        return;
    }

1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018 1019 1020
    /* force the input stream PTS */
    if (ost->st->codec->codec_type == AVMEDIA_TYPE_AUDIO)
        audio_size += pkt->size;
    else if (ost->st->codec->codec_type == AVMEDIA_TYPE_VIDEO) {
        video_size += pkt->size;
        ost->sync_opts++;
    }

    if (pkt->pts != AV_NOPTS_VALUE)
        opkt.pts = av_rescale_q(pkt->pts, ist->st->time_base, ost->st->time_base) - ost_tb_start_time;
    else
        opkt.pts = AV_NOPTS_VALUE;

    if (pkt->dts == AV_NOPTS_VALUE)
1021
        opkt.dts = av_rescale_q(ist->last_dts, AV_TIME_BASE_Q, ost->st->time_base);
1022 1023 1024 1025 1026 1027 1028
    else
        opkt.dts = av_rescale_q(pkt->dts, ist->st->time_base, ost->st->time_base);
    opkt.dts -= ost_tb_start_time;

    opkt.duration = av_rescale_q(pkt->duration, ist->st->time_base, ost->st->time_base);
    opkt.flags    = pkt->flags;

Aneesh Dogra's avatar
Aneesh Dogra committed
1029
    // FIXME remove the following 2 lines they shall be replaced by the bitstream filters
1030 1031 1032 1033
    if (  ost->st->codec->codec_id != AV_CODEC_ID_H264
       && ost->st->codec->codec_id != AV_CODEC_ID_MPEG1VIDEO
       && ost->st->codec->codec_id != AV_CODEC_ID_MPEG2VIDEO
       && ost->st->codec->codec_id != AV_CODEC_ID_VC1