We are currently experiencing downtime impacting viewing & cloning the Mesa repo, and some GitLab pages returning 503. Please see #freedesktop on IRC for more updates.

gstffmpegcodecmap.c 102 KB
Newer Older
1 2
/* GStreamer
 * Copyright (C) <1999> Erik Walthinsen <omega@cse.ogi.edu>
3
 * This file:
4
 * Copyright (c) 2002-2004 Ronald Bultje <rbultje@ronald.bitfreak.net>
5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Library General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Library General Public License for more details.
 *
 * You should have received a copy of the GNU Library General Public
 * License along with this library; if not, write to the
 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
 * Boston, MA 02111-1307, USA.
 */

22
#ifdef HAVE_CONFIG_H
23
#include "config.h"
24
#endif
25
#include <gst/gst.h>
26 27 28
#ifdef HAVE_FFMPEG_UNINSTALLED
#include <avcodec.h>
#else
29
#include <libavcodec/avcodec.h>
30
#endif
31
#include <string.h>
32

33
#include "gstffmpeg.h"
34 35
#include "gstffmpegcodecmap.h"

36 37
#include <gst/pbutils/codec-utils.h>

38 39 40 41 42
/*
 * Read a palette from a caps.
 */

static void
43
gst_ffmpeg_get_palette (const GstCaps * caps, AVCodecContext * context)
44 45 46
{
  GstStructure *str = gst_caps_get_structure (caps, 0);
  const GValue *palette_v;
Wim Taymans's avatar
Wim Taymans committed
47
  GstBuffer *palette;
48 49

  /* do we have a palette? */
50
  if ((palette_v = gst_structure_get_value (str, "palette_data")) && context) {
51
    palette = gst_value_get_buffer (palette_v);
Wim Taymans's avatar
Wim Taymans committed
52
    if (gst_buffer_get_size (palette) >= AVPALETTE_SIZE) {
53 54 55 56
      if (context->palctrl)
        av_free (context->palctrl);
      context->palctrl = av_malloc (sizeof (AVPaletteControl));
      context->palctrl->palette_changed = 1;
Wim Taymans's avatar
Wim Taymans committed
57
      gst_buffer_extract (palette, 0, context->palctrl->palette,
58 59 60 61 62 63
          AVPALETTE_SIZE);
    }
  }
}

static void
64
gst_ffmpeg_set_palette (GstCaps * caps, AVCodecContext * context)
65 66
{
  if (context->palctrl) {
67
    GstBuffer *palette = gst_buffer_new_and_alloc (AVPALETTE_SIZE);
68

Wim Taymans's avatar
Wim Taymans committed
69
    gst_buffer_fill (palette, 0, context->palctrl->palette, AVPALETTE_SIZE);
70
    gst_caps_set_simple (caps, "palette_data", GST_TYPE_BUFFER, palette, NULL);
71 72 73
  }
}

74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142
/* Pairs each ffmpeg channel mask with the GStreamer channel position used
 * for it. Masks paired with GST_AUDIO_CHANNEL_POSITION_NONE make
 * gst_ff_channel_layout_to_gst() fall back to its NONE-layout handling.
 *
 * IMPORTANT: Keep this sorted by the ffmpeg channel masks */
static const struct
{
  guint64 ff;
  GstAudioChannelPosition gst;
} _ff_to_gst_layout[] = {
  {CH_FRONT_LEFT, GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT},
  {CH_FRONT_RIGHT, GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT},
  {CH_FRONT_CENTER, GST_AUDIO_CHANNEL_POSITION_FRONT_CENTER},
  {CH_LOW_FREQUENCY, GST_AUDIO_CHANNEL_POSITION_LFE},
  {CH_BACK_LEFT, GST_AUDIO_CHANNEL_POSITION_REAR_LEFT},
  {CH_BACK_RIGHT, GST_AUDIO_CHANNEL_POSITION_REAR_RIGHT},
  {CH_FRONT_LEFT_OF_CENTER, GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT_OF_CENTER},
  {CH_FRONT_RIGHT_OF_CENTER, GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT_OF_CENTER},
  {CH_BACK_CENTER, GST_AUDIO_CHANNEL_POSITION_REAR_CENTER},
  {CH_SIDE_LEFT, GST_AUDIO_CHANNEL_POSITION_SIDE_LEFT},
  {CH_SIDE_RIGHT, GST_AUDIO_CHANNEL_POSITION_SIDE_RIGHT},
  {CH_TOP_CENTER, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_TOP_FRONT_LEFT, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_TOP_FRONT_CENTER, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_TOP_FRONT_RIGHT, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_TOP_BACK_LEFT, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_TOP_BACK_CENTER, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_TOP_BACK_RIGHT, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_STEREO_LEFT, GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT},
  {CH_STEREO_RIGHT, GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT}
};

/*
 * Translate an ffmpeg channel layout mask into GStreamer channel positions.
 *
 * @channel_layout: ffmpeg channel mask, or 0 when no layout is known.
 * @channels: number of channels the stream has.
 *
 * Returns a g_new()-allocated array with one position per channel, or NULL
 * when:
 *  - the number of bits set in a non-zero mask differs from @channels,
 *  - no mask is given and there are neither 1 nor 2 channels,
 *  - the result is mono with FRONT_CENTER, or stereo with
 *    FRONT_LEFT/FRONT_RIGHT (no positions are reported for those).
 *
 * A layout that is unknown, contains positions mapped to NONE, or fails
 * gst_audio_check_channel_positions() is replaced by FRONT_MONO (1 channel),
 * FRONT_LEFT/FRONT_RIGHT (2 channels) or all-NONE positions.
 */
static GstAudioChannelPosition *
gst_ff_channel_layout_to_gst (guint64 channel_layout, guint channels)
{
  GstAudioChannelPosition *positions = NULL;
  gboolean use_none = FALSE;
  guint count = 0, filled = 0, idx;
  guint64 bits;

  /* count the bits set in the mask; each iteration clears the lowest one */
  for (bits = channel_layout; bits != 0; bits &= bits - 1)
    count++;

  /* without a mask we can only go by the channel count */
  if (channel_layout == 0) {
    count = channels;
    use_none = TRUE;
  }

  if (count != channels) {
    GST_ERROR ("Number of channels is different (%u != %u)", channels,
        count);
    return NULL;
  }

  positions = g_new (GstAudioChannelPosition, count);

  /* collect the position of every known mask present in the layout */
  for (idx = 0; idx < G_N_ELEMENTS (_ff_to_gst_layout); idx++) {
    if ((channel_layout & _ff_to_gst_layout[idx].ff) == 0)
      continue;

    positions[filled] = _ff_to_gst_layout[idx].gst;
    filled++;

    if (_ff_to_gst_layout[idx].gst == GST_AUDIO_CHANNEL_POSITION_NONE)
      use_none = TRUE;
  }

  if (filled != count) {
    GST_WARNING ("Unknown channels in channel layout - assuming NONE layout");
    use_none = TRUE;
  }

  if (!use_none && !gst_audio_check_channel_positions (positions, count)) {
    GST_ERROR ("Invalid channel layout %" G_GUINT64_FORMAT
        " - assuming NONE layout", channel_layout);
    use_none = TRUE;
  }

  if (use_none) {
    switch (count) {
      case 1:
        positions[0] = GST_AUDIO_CHANNEL_POSITION_FRONT_MONO;
        break;
      case 2:
        positions[0] = GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT;
        positions[1] = GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT;
        break;
      default:
        if (channel_layout == 0) {
          /* nothing sensible to report */
          g_free (positions);
          positions = NULL;
        } else {
          for (idx = 0; idx < count; idx++)
            positions[idx] = GST_AUDIO_CHANNEL_POSITION_NONE;
        }
        break;
    }
  }

  if (count == 1 && positions[0] == GST_AUDIO_CHANNEL_POSITION_FRONT_CENTER) {
    GST_DEBUG ("mono common case; won't set channel positions");
    g_free (positions);
    positions = NULL;
  } else if (count == 2
      && positions[0] == GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT
      && positions[1] == GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT) {
    GST_DEBUG ("stereo common case; won't set channel positions");
    g_free (positions);
    positions = NULL;
  }

  return positions;
}

178 179 180 181
/* this macro makes a caps width fixed or unfixed width/height
 * properties depending on whether we've got a context.
 *
 * See below for why we use this.
182 183 184
 *
 * We should actually do this stuff at the end, like in riff-media.c,
 * but I'm too lazy today. Maybe later.
185
 */
186
static GstCaps *
187 188
gst_ff_vid_caps_new (AVCodecContext * context, enum CodecID codec_id,
    const char *mimetype, const char *fieldname, ...)
189 190 191 192
{
  GstStructure *structure = NULL;
  GstCaps *caps = NULL;
  va_list var_args;
193
  gint i;
194

195 196
  GST_LOG ("context:%p, codec_id:%d, mimetype:%s", context, codec_id, mimetype);

197 198
  /* fixed, non probing context */
  if (context != NULL && context->width != -1) {
199 200
    gint num, denom;

201 202
    caps = gst_caps_new_simple (mimetype,
        "width", G_TYPE_INT, context->width,
203 204 205 206 207
        "height", G_TYPE_INT, context->height, NULL);

    num = context->time_base.den / context->ticks_per_frame;
    denom = context->time_base.num;

208 209 210 211
    if (!denom) {
      GST_LOG ("invalid framerate: %d/0, -> %d/1", num, num);
      denom = 1;
    }
212 213 214 215 216 217 218 219
    if (gst_util_fraction_compare (num, denom, 1000, 1) > 0) {
      GST_LOG ("excessive framerate: %d/%d, -> 0/1", num, denom);
      num = 0;
      denom = 1;
    }
    GST_LOG ("setting framerate: %d/%d", num, denom);
    gst_caps_set_simple (caps,
        "framerate", GST_TYPE_FRACTION, num, denom, NULL);
220
  } else {
221
    /* so we are after restricted caps in this case */
222
    switch (codec_id) {
223 224 225 226 227 228 229 230 231 232 233 234
      case CODEC_ID_H261:
      {
        caps = gst_caps_new_simple (mimetype,
            "width", G_TYPE_INT, 352,
            "height", G_TYPE_INT, 288,
            "framerate", GST_TYPE_FRACTION_RANGE, 0, 1, G_MAXINT, 1, NULL);
        gst_caps_append (caps, gst_caps_new_simple (mimetype,
                "width", G_TYPE_INT, 176,
                "height", G_TYPE_INT, 144,
                "framerate", GST_TYPE_FRACTION_RANGE, 0, 1, G_MAXINT, 1, NULL));
        break;
      }
235 236 237 238 239 240 241 242 243
      case CODEC_ID_H263:
      {
        /* 128x96, 176x144, 352x288, 704x576, and 1408x1152. slightly reordered
         * because we want automatic negotiation to go as close to 320x240 as
         * possible. */
        const static gint widths[] = { 352, 704, 176, 1408, 128 };
        const static gint heights[] = { 288, 576, 144, 1152, 96 };
        GstCaps *temp;
        gint n_sizes = G_N_ELEMENTS (widths);
244

245 246 247 248 249 250
        caps = gst_caps_new_empty ();
        for (i = 0; i < n_sizes; i++) {
          temp = gst_caps_new_simple (mimetype,
              "width", G_TYPE_INT, widths[i],
              "height", G_TYPE_INT, heights[i],
              "framerate", GST_TYPE_FRACTION_RANGE, 0, 1, G_MAXINT, 1, NULL);
251

252 253 254 255
          gst_caps_append (caps, temp);
        }
        break;
      }
256 257
      case CODEC_ID_DVVIDEO:
      {
258 259 260 261 262 263 264 265 266 267 268 269 270 271 272
        static struct
        {
          guint32 csp;
          gint width, height;
          gint par_n, par_d;
          gint framerate_n, framerate_d;
        } profiles[] = {
          {
          GST_MAKE_FOURCC ('Y', '4', '1', 'B'), 720, 480, 10, 11, 30000, 1001}, {
          GST_MAKE_FOURCC ('Y', '4', '1', 'B'), 720, 480, 40, 33, 30000, 1001}, {
          GST_MAKE_FOURCC ('I', '4', '2', '0'), 720, 576, 59, 54, 25, 1}, {
          GST_MAKE_FOURCC ('I', '4', '2', '0'), 720, 576, 118, 81, 25, 1}, {
          GST_MAKE_FOURCC ('Y', '4', '1', 'B'), 720, 576, 59, 54, 25, 1}, {
          GST_MAKE_FOURCC ('Y', '4', '1', 'B'), 720, 576, 118, 81, 25, 1}
        };
273
        GstCaps *temp;
274
        gint n_sizes = G_N_ELEMENTS (profiles);
275 276 277 278

        caps = gst_caps_new_empty ();
        for (i = 0; i < n_sizes; i++) {
          temp = gst_caps_new_simple (mimetype,
279 280 281 282 283
              "width", G_TYPE_INT, profiles[i].width,
              "height", G_TYPE_INT, profiles[i].height,
              "framerate", GST_TYPE_FRACTION, profiles[i].framerate_n,
              profiles[i].framerate_d, "pixel-aspect-ratio", GST_TYPE_FRACTION,
              profiles[i].par_n, profiles[i].par_d, NULL);
284 285

          gst_caps_append (caps, temp);
286
        }
287 288
        break;
      }
289 290
      case CODEC_ID_DNXHD:
      {
291
        caps = gst_caps_new_simple (mimetype,
292 293
            "width", G_TYPE_INT, 1920,
            "height", G_TYPE_INT, 1080,
294
            "framerate", GST_TYPE_FRACTION_RANGE, 0, 1, G_MAXINT, 1, NULL);
295 296 297 298 299 300 301
        gst_caps_append (caps, gst_caps_new_simple (mimetype,
                "width", G_TYPE_INT, 1280,
                "height", G_TYPE_INT, 720,
                "framerate", GST_TYPE_FRACTION_RANGE, 0, 1, G_MAXINT, 1, NULL));
        break;
      }
      default:
302 303 304 305
        break;
    }
  }

306 307
  /* no fixed caps or special restrictions applied;
   * default unfixed setting */
308 309
  if (!caps) {
    GST_DEBUG ("Creating default caps");
310 311 312 313
    caps = gst_caps_new_simple (mimetype,
        "width", GST_TYPE_INT_RANGE, 16, 4096,
        "height", GST_TYPE_INT_RANGE, 16, 4096,
        "framerate", GST_TYPE_FRACTION_RANGE, 0, 1, G_MAXINT, 1, NULL);
314
  }
315

316
  for (i = 0; i < gst_caps_get_size (caps); i++) {
317
    va_start (var_args, fieldname);
318
    structure = gst_caps_get_structure (caps, i);
319 320 321 322 323 324
    gst_structure_set_valist (structure, fieldname, var_args);
    va_end (var_args);
  }

  return caps;
}
325 326 327

/* same for audio - now with channels/sample rate
 */
328
static GstCaps *
329 330
gst_ff_aud_caps_new (AVCodecContext * context, enum CodecID codec_id,
    const char *mimetype, const char *fieldname, ...)
331 332 333
{
  GstCaps *caps = NULL;
  GstStructure *structure = NULL;
334
  gint i;
335 336
  va_list var_args;

337 338
  /* fixed, non-probing context */
  if (context != NULL && context->channels != -1) {
339
    GstAudioChannelPosition *pos;
340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359
    guint64 channel_layout = context->channel_layout;

    if (channel_layout == 0) {
      const guint64 default_channel_set[] = {
        0, 0, CH_LAYOUT_SURROUND, CH_LAYOUT_QUAD, CH_LAYOUT_5POINT0,
        CH_LAYOUT_5POINT1, 0, CH_LAYOUT_7POINT1
      };

      switch (codec_id) {
        case CODEC_ID_EAC3:
        case CODEC_ID_AC3:
        case CODEC_ID_DTS:
          if (context->channels > 0
              && context->channels < G_N_ELEMENTS (default_channel_set))
            channel_layout = default_channel_set[context->channels - 1];
          break;
        default:
          break;
      }
    }
360

361 362
    caps = gst_caps_new_simple (mimetype,
        "rate", G_TYPE_INT, context->sample_rate,
363
        "channels", G_TYPE_INT, context->channels, NULL);
364

365
    pos = gst_ff_channel_layout_to_gst (channel_layout, context->channels);
366 367 368 369
    if (pos != NULL) {
      gst_audio_set_channel_positions (gst_caps_get_structure (caps, 0), pos);
      g_free (pos);
    }
370
  } else {
371 372 373
    gint maxchannels = 2;
    const gint *rates = NULL;
    gint n_rates = 0;
374

375
    if (context) {
376 377 378 379 380 381 382 383 384 385
      /* so we must be after restricted caps in this particular case */
      switch (codec_id) {
        case CODEC_ID_MP2:
        {
          const static gint l_rates[] =
              { 48000, 44100, 32000, 24000, 22050, 16000 };
          n_rates = G_N_ELEMENTS (l_rates);
          rates = l_rates;
          break;
        }
386
        case CODEC_ID_EAC3:
387 388 389 390 391 392 393 394 395 396 397 398 399 400 401 402 403 404 405 406 407 408 409 410
        case CODEC_ID_AC3:
        {
          const static gint l_rates[] = { 48000, 44100, 32000 };
          n_rates = G_N_ELEMENTS (l_rates);
          rates = l_rates;
          break;
        }
        case CODEC_ID_ADPCM_SWF:
        {
          const static gint l_rates[] = { 11025, 22050, 44100 };
          n_rates = G_N_ELEMENTS (l_rates);
          rates = l_rates;
          break;
        }
        case CODEC_ID_ROQ_DPCM:
        {
          const static gint l_rates[] = { 22050 };
          n_rates = G_N_ELEMENTS (l_rates);
          rates = l_rates;
          break;
        }
        case CODEC_ID_ADPCM_G726:
          maxchannels = 1;
          break;
411 412 413 414 415 416 417 418 419 420 421 422 423 424 425 426
        case CODEC_ID_AMR_NB:
        {
          const static gint l_rates[] = { 8000 };
          maxchannels = 1;
          n_rates = G_N_ELEMENTS (l_rates);
          rates = l_rates;
          break;
        }
        case CODEC_ID_AMR_WB:
        {
          const static gint l_rates[] = { 16000 };
          maxchannels = 1;
          n_rates = G_N_ELEMENTS (l_rates);
          rates = l_rates;
          break;
        }
427 428 429
        default:
          break;
      }
430 431 432 433 434

      /* TODO: handle context->channel_layouts here to set
       * the list of channel layouts supported by the encoder.
       * Unfortunately no encoder uses this yet....
       */
435 436 437 438 439 440 441
    }

    /* regardless of encode/decode, open up channels if applicable */
    /* Until decoders/encoders expose the maximum number of channels
     * they support, we whitelist them here. */
    switch (codec_id) {
      case CODEC_ID_AC3:
442
      case CODEC_ID_EAC3:
443
      case CODEC_ID_AAC:
444
      case CODEC_ID_AAC_LATM:
445 446 447
      case CODEC_ID_DTS:
        maxchannels = 6;
        break;
448 449 450 451
      case CODEC_ID_WMAPRO:
      case CODEC_ID_TRUEHD:
        maxchannels = 8;
        break;
452 453 454
      default:
        break;
    }
455

456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473 474 475 476 477 478
    if (maxchannels == 1)
      caps = gst_caps_new_simple (mimetype,
          "channels", G_TYPE_INT, maxchannels, NULL);
    else
      caps = gst_caps_new_simple (mimetype,
          "channels", GST_TYPE_INT_RANGE, 1, maxchannels, NULL);
    if (n_rates) {
      GValue list = { 0, };
      GstStructure *structure;

      g_value_init (&list, GST_TYPE_LIST);
      for (i = 0; i < n_rates; i++) {
        GValue v = { 0, };

        g_value_init (&v, G_TYPE_INT);
        g_value_set_int (&v, rates[i]);
        gst_value_list_append_value (&list, &v);
        g_value_unset (&v);
      }
      structure = gst_caps_get_structure (caps, 0);
      gst_structure_set_value (structure, "rate", &list);
      g_value_unset (&list);
    } else
479
      gst_caps_set_simple (caps, "rate", GST_TYPE_INT_RANGE, 4000, 96000, NULL);
480 481
  }

482
  for (i = 0; i < gst_caps_get_size (caps); i++) {
483
    va_start (var_args, fieldname);
484
    structure = gst_caps_get_structure (caps, i);
485 486 487 488 489 490
    gst_structure_set_valist (structure, fieldname, var_args);
    va_end (var_args);
  }

  return caps;
}
491 492 493 494 495 496

/* Convert a FFMPEG codec ID and optional AVCodecContext
 * to a GstCaps. If the context is omitted, no fixed values
 * for video/audio size will be included in the GstCaps
 *
 * CodecID is primarily meant for compressed data GstCaps!
 *
 * encode is a special parameter. gstffmpegdec will say
 * FALSE, gstffmpegenc will say TRUE. The output caps
 * depend on this, in such a way that it will be very
 * specific, defined, fixed and correct caps for encoders,
 * yet very wide, "forgiving" caps for decoders. Example
 * for mp3: decode: audio/mpeg,mpegversion=1,layer=[1-3]
 * but encode: audio/mpeg,mpegversion=1,layer=3,bitrate=x,
 * rate=x,channels=x.
 */

508
GstCaps *
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
509 510
gst_ffmpeg_codecid_to_caps (enum CodecID codec_id,
    AVCodecContext * context, gboolean encode)
511
{
512
  GstCaps *caps = NULL;
513
  gboolean buildcaps = FALSE;
514

515 516
  GST_LOG ("codec_id:%d, context:%p, encode:%d", codec_id, context, encode);

517
  switch (codec_id) {
518
    case CODEC_ID_MPEG1VIDEO:
519 520 521 522
      /* FIXME: bitrate */
      caps = gst_ff_vid_caps_new (context, codec_id, "video/mpeg",
          "mpegversion", G_TYPE_INT, 1,
          "systemstream", G_TYPE_BOOLEAN, FALSE, NULL);
523 524 525 526 527
      break;

    case CODEC_ID_MPEG2VIDEO:
      if (encode) {
        /* FIXME: bitrate */
528
        caps = gst_ff_vid_caps_new (context, codec_id, "video/mpeg",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
529 530
            "mpegversion", G_TYPE_INT, 2,
            "systemstream", G_TYPE_BOOLEAN, FALSE, NULL);
531 532 533 534
      } else {
        /* decode both MPEG-1 and MPEG-2; width/height/fps are all in
         * the MPEG video stream headers, so may be omitted from caps. */
        caps = gst_caps_new_simple ("video/mpeg",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
535 536
            "mpegversion", GST_TYPE_INT_RANGE, 1, 2,
            "systemstream", G_TYPE_BOOLEAN, FALSE, NULL);
537
      }
538
      break;
539 540 541 542 543 544

    case CODEC_ID_MPEG2VIDEO_XVMC:
      /* this is a special ID - don't need it in GStreamer, I think */
      break;

    case CODEC_ID_H263:
545
      if (encode) {
546
        caps = gst_ff_vid_caps_new (context, codec_id, "video/x-h263",
547 548 549
            "variant", G_TYPE_STRING, "itu",
            "h263version", G_TYPE_STRING, "h263", NULL);
      } else {
550 551 552 553
        /* don't pass codec_id, we can decode other variants with the H263
         * decoder that don't have specific size requirements
         */
        caps = gst_ff_vid_caps_new (context, CODEC_ID_NONE, "video/x-h263",
554 555
            "variant", G_TYPE_STRING, "itu", NULL);
      }
556 557 558
      break;

    case CODEC_ID_H263P:
559
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-h263",
560 561
          "variant", G_TYPE_STRING, "itu",
          "h263version", G_TYPE_STRING, "h263p", NULL);
562 563 564 565 566 567 568 569 570
      if (encode && context) {

        gst_caps_set_simple (caps,
            "annex-f", G_TYPE_BOOLEAN, context->flags & CODEC_FLAG_4MV,
            "annex-j", G_TYPE_BOOLEAN, context->flags & CODEC_FLAG_LOOP_FILTER,
            "annex-i", G_TYPE_BOOLEAN, context->flags & CODEC_FLAG_AC_PRED,
            "annex-t", G_TYPE_BOOLEAN, context->flags & CODEC_FLAG_AC_PRED,
            NULL);
      }
571
      break;
572

573
    case CODEC_ID_H263I:
574
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-intel-h263",
575
          "variant", G_TYPE_STRING, "intel", NULL);
576 577
      break;

578
    case CODEC_ID_H261:
579
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-h261", NULL);
580 581
      break;

582
    case CODEC_ID_RV10:
583
    case CODEC_ID_RV20:
584
    case CODEC_ID_RV30:
585
    case CODEC_ID_RV40:
586 587
    {
      gint version;
588

589 590 591 592
      switch (codec_id) {
        case CODEC_ID_RV40:
          version = 4;
          break;
593 594 595
        case CODEC_ID_RV30:
          version = 3;
          break;
596 597 598 599 600 601 602
        case CODEC_ID_RV20:
          version = 2;
          break;
        default:
          version = 1;
          break;
      }
603

604 605 606 607 608
      /* FIXME: context->sub_id must be filled in during decoding */
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-pn-realvideo",
          "systemstream", G_TYPE_BOOLEAN, FALSE,
          "rmversion", G_TYPE_INT, version, NULL);
      if (context) {
609
        gst_caps_set_simple (caps, "format", G_TYPE_INT, context->sub_id, NULL);
610 611
        if (context->extradata_size >= 8) {
          gst_caps_set_simple (caps,
612 613 614
              "subformat", G_TYPE_INT, GST_READ_UINT32_BE (context->extradata),
              NULL);
        }
615
      }
616
    }
617
      break;
618

619 620 621 622 623 624
    case CODEC_ID_MP1:
      /* FIXME: bitrate */
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/mpeg",
          "mpegversion", G_TYPE_INT, 1, "layer", G_TYPE_INT, 1, NULL);
      break;

625
    case CODEC_ID_MP2:
626 627 628
      /* FIXME: bitrate */
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/mpeg",
          "mpegversion", G_TYPE_INT, 1, "layer", G_TYPE_INT, 2, NULL);
629
      break;
630

631 632 633
    case CODEC_ID_MP3:
      if (encode) {
        /* FIXME: bitrate */
634
        caps = gst_ff_aud_caps_new (context, codec_id, "audio/mpeg",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
635
            "mpegversion", G_TYPE_INT, 1, "layer", G_TYPE_INT, 3, NULL);
636 637 638 639
      } else {
        /* Decodes MPEG-1 layer 1/2/3. Samplerate, channels et al are
         * in the MPEG audio header, so may be omitted from caps. */
        caps = gst_caps_new_simple ("audio/mpeg",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
640 641
            "mpegversion", G_TYPE_INT, 1,
            "layer", GST_TYPE_INT_RANGE, 1, 3, NULL);
642
      }
643
      break;
644

645 646 647 648 649 650 651
    case CODEC_ID_MUSEPACK7:
      caps =
          gst_ff_aud_caps_new (context, codec_id,
          "audio/x-ffmpeg-parsed-musepack", "streamversion", G_TYPE_INT, 7,
          NULL);
      break;

652 653 654 655 656 657 658
    case CODEC_ID_MUSEPACK8:
      caps =
          gst_ff_aud_caps_new (context, codec_id,
          "audio/x-ffmpeg-parsed-musepack", "streamversion", G_TYPE_INT, 8,
          NULL);
      break;

659 660 661
    case CODEC_ID_AC3:
      /* FIXME: bitrate */
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-ac3", NULL);
662
      break;
663

664 665 666 667 668
    case CODEC_ID_EAC3:
      /* FIXME: bitrate */
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-eac3", NULL);
      break;

669 670 671 672 673
    case CODEC_ID_TRUEHD:
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-true-hd", NULL);
      break;

    case CODEC_ID_ATRAC1:
674
      caps =
675
          gst_ff_aud_caps_new (context, codec_id, "audio/x-vnd.sony.atrac1",
676
          NULL);
677
      break;
678

679 680
    case CODEC_ID_ATRAC3:
      caps =
681
          gst_ff_aud_caps_new (context, codec_id, "audio/x-vnd.sony.atrac3",
682 683 684
          NULL);
      break;

685
    case CODEC_ID_DTS:
686
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-dts", NULL);
687
      break;
688

689 690 691 692 693 694
    case CODEC_ID_APE:
      caps =
          gst_ff_aud_caps_new (context, codec_id, "audio/x-ffmpeg-parsed-ape",
          NULL);
      if (context) {
        gst_caps_set_simple (caps,
695
            "depth", G_TYPE_INT, context->bits_per_coded_sample, NULL);
696 697 698
      }
      break;

699 700 701
    case CODEC_ID_MLP:
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-mlp", NULL);
      break;
702

703 704 705
    case CODEC_ID_IMC:
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-imc", NULL);
      break;
706

Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
707 708 709 710 711
      /* MJPEG is normal JPEG, Motion-JPEG and Quicktime MJPEG-A. MJPEGB
       * is Quicktime's MJPEG-B. LJPEG is lossless JPEG. I don't know what
       * sp5x is, but it's apparently something JPEG... We don't separate
       * between those in GStreamer. Should we (at least between MJPEG,
       * MJPEG-B and sp5x decoding...)? */
712
    case CODEC_ID_MJPEG:
713
    case CODEC_ID_LJPEG:
714
      caps = gst_ff_vid_caps_new (context, codec_id, "image/jpeg", NULL);
Wim Taymans's avatar
Wim Taymans committed
715
      break;
716

717
    case CODEC_ID_SP5X:
718
      caps = gst_ff_vid_caps_new (context, codec_id, "video/sp5x", NULL);
719 720
      break;

721
    case CODEC_ID_MJPEGB:
722
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-mjpeg-b", NULL);
723 724
      break;

725
    case CODEC_ID_MPEG4:
726
      if (encode && context != NULL) {
727 728
        /* I'm not exactly sure what ffmpeg outputs... ffmpeg itself uses
         * the AVI fourcc 'DIVX', but 'mp4v' for Quicktime... */
729
        switch (context->codec_tag) {
730
          case GST_MAKE_FOURCC ('D', 'I', 'V', 'X'):
731
            caps = gst_ff_vid_caps_new (context, codec_id, "video/x-divx",
Thomas Vander Stichele's avatar
Thomas Vander Stichele committed
732
                "divxversion", G_TYPE_INT, 5, NULL);
733 734 735 736
            break;
          case GST_MAKE_FOURCC ('m', 'p', '4', 'v'):
          default:
            /* FIXME: bitrate */
737
            caps = gst_ff_vid_caps_new (context, codec_id, "video/mpeg",
738 739 740 741
                "systemstream", G_TYPE_BOOLEAN, FALSE,
                "mpegversion", G_TYPE_INT, 4, NULL);
            break;
        }
742 743
      } else {
        /* The trick here is to separate xvid, divx, mpeg4, 3ivx et al */
744
        caps = gst_ff_vid_caps_new (context, codec_id, "video/mpeg",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
745 746
            "mpegversion", G_TYPE_INT, 4,
            "systemstream", G_TYPE_BOOLEAN, FALSE, NULL);
747
        if (encode) {
748 749
          gst_caps_append (caps, gst_ff_vid_caps_new (context, codec_id,
                  "video/x-divx", "divxversion", G_TYPE_INT, 5, NULL));
750
        } else {
751 752 753 754 755 756 757
          gst_caps_append (caps, gst_ff_vid_caps_new (context, codec_id,
                  "video/x-divx", "divxversion", GST_TYPE_INT_RANGE, 4, 5,
                  NULL));
          gst_caps_append (caps, gst_ff_vid_caps_new (context, codec_id,
                  "video/x-xvid", NULL));
          gst_caps_append (caps, gst_ff_vid_caps_new (context, codec_id,
                  "video/x-3ivx", NULL));
758
        }
759
      }
760
      break;
761

762
    case CODEC_ID_RAWVIDEO:
763 764
      caps =
          gst_ffmpeg_codectype_to_caps (AVMEDIA_TYPE_VIDEO, context, codec_id,
765
          encode);
766
      break;
767

768
    case CODEC_ID_MSMPEG4V1:
769 770
    case CODEC_ID_MSMPEG4V2:
    case CODEC_ID_MSMPEG4V3:
771 772 773 774 775 776 777 778 779
    {
      gint version = 41 + codec_id - CODEC_ID_MSMPEG4V1;

      /* encode-FIXME: bitrate */
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-msmpeg",
          "msmpegversion", G_TYPE_INT, version, NULL);
      if (!encode && codec_id == CODEC_ID_MSMPEG4V3) {
        gst_caps_append (caps, gst_ff_vid_caps_new (context, codec_id,
                "video/x-divx", "divxversion", G_TYPE_INT, 3, NULL));
780
      }
781
    }
782
      break;
783

784
    case CODEC_ID_WMV1:
785
    case CODEC_ID_WMV2:
786 787
    {
      gint version = (codec_id == CODEC_ID_WMV1) ? 1 : 2;
788

789 790 791
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-wmv",
          "wmvversion", G_TYPE_INT, version, NULL);
    }
792
      break;
793

794
    case CODEC_ID_FLV1:
795 796
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-flash-video",
          "flvversion", G_TYPE_INT, 1, NULL);
797
      break;
798

799
    case CODEC_ID_SVQ1:
800
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-svq",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
801
          "svqversion", G_TYPE_INT, 1, NULL);
802
      break;
803 804

    case CODEC_ID_SVQ3:
805
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-svq",
806
          "svqversion", G_TYPE_INT, 3, NULL);
807
      break;
808

809
    case CODEC_ID_DVAUDIO:
810
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-dv", NULL);
811
      break;
812

813
    case CODEC_ID_DVVIDEO:
814 815 816 817 818
    {
      if (encode && context) {
        guint32 fourcc;

        switch (context->pix_fmt) {
819
          case PIX_FMT_YUYV422:
820 821 822 823 824
            fourcc = GST_MAKE_FOURCC ('Y', 'U', 'Y', '2');
            break;
          case PIX_FMT_YUV420P:
            fourcc = GST_MAKE_FOURCC ('I', '4', '2', '0');
            break;
825 826 827
          case PIX_FMT_YUVA420P:
            fourcc = GST_MAKE_FOURCC ('A', '4', '2', '0');
            break;
828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849
          case PIX_FMT_YUV411P:
            fourcc = GST_MAKE_FOURCC ('Y', '4', '1', 'B');
            break;
          case PIX_FMT_YUV422P:
            fourcc = GST_MAKE_FOURCC ('Y', '4', '2', 'B');
            break;
          case PIX_FMT_YUV410P:
            fourcc = GST_MAKE_FOURCC ('Y', 'U', 'V', '9');
            break;
          default:
            GST_WARNING
                ("Couldnt' find fourcc for pixfmt %d, defaulting to I420",
                context->pix_fmt);
            fourcc = GST_MAKE_FOURCC ('I', '4', '2', '0');
            break;
        }
        caps = gst_ff_vid_caps_new (context, codec_id, "video/x-dv",
            "systemstream", G_TYPE_BOOLEAN, FALSE,
            "format", GST_TYPE_FOURCC, fourcc, NULL);
      } else {
        caps = gst_ff_vid_caps_new (context, codec_id, "video/x-dv",
            "systemstream", G_TYPE_BOOLEAN, FALSE, NULL);
850
      }
851
    }
852
      break;
853

854 855
    case CODEC_ID_WMAV1:
    case CODEC_ID_WMAV2:
856 857
    {
      gint version = (codec_id == CODEC_ID_WMAV1) ? 1 : 2;
858

859 860 861 862 863 864 865 866 867 868
      if (context) {
        caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-wma",
            "wmaversion", G_TYPE_INT, version,
            "block_align", G_TYPE_INT, context->block_align,
            "bitrate", G_TYPE_INT, context->bit_rate, NULL);
      } else {
        caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-wma",
            "wmaversion", G_TYPE_INT, version,
            "block_align", GST_TYPE_INT_RANGE, 0, G_MAXINT,
            "bitrate", GST_TYPE_INT_RANGE, 0, G_MAXINT, NULL);
869
      }
870
    }
871
      break;
872 873 874 875 876 877
    case CODEC_ID_WMAPRO:
    {
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-wma",
          "wmaversion", G_TYPE_INT, 3, NULL);
      break;
    }
878

879 880 881 882 883 884
    case CODEC_ID_WMAVOICE:
    {
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-wms", NULL);
      break;
    }

885 886
    case CODEC_ID_MACE3:
    case CODEC_ID_MACE6:
887 888
    {
      gint version = (codec_id == CODEC_ID_MACE3) ? 3 : 6;
889

890 891 892
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-mace",
          "maceversion", G_TYPE_INT, version, NULL);
    }
893
      break;
894

    case CODEC_ID_HUFFYUV:
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-huffyuv", NULL);
      if (context) {
        gst_caps_set_simple (caps,
            "bpp", G_TYPE_INT, context->bits_per_coded_sample, NULL);
      }
      break;

    case CODEC_ID_CYUV:
904 905 906
      caps =
          gst_ff_vid_caps_new (context, codec_id, "video/x-compressed-yuv",
          NULL);
907 908 909
      break;

    case CODEC_ID_H264:
910
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-h264", NULL);
911 912
      break;

913 914 915 916 917
    case CODEC_ID_INDEO5:
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-indeo",
          "indeoversion", G_TYPE_INT, 5, NULL);
      break;

918
    case CODEC_ID_INDEO3:
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-indeo",
          "indeoversion", G_TYPE_INT, 3, NULL);
      break;

923
    case CODEC_ID_INDEO2:
924
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-indeo",
925 926 927
          "indeoversion", G_TYPE_INT, 2, NULL);
      break;

928
    case CODEC_ID_FLASHSV:
929 930
      caps =
          gst_ff_vid_caps_new (context, codec_id, "video/x-flash-screen", NULL);
931 932
      break;

933
    case CODEC_ID_VP3:
934
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-vp3", NULL);
935 936
      break;

937
    case CODEC_ID_VP5:
938
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-vp5", NULL);
939 940 941
      break;

    case CODEC_ID_VP6:
942
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-vp6", NULL);
943 944 945
      break;

    case CODEC_ID_VP6F:
946
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-vp6-flash", NULL);
947 948
      break;

949 950 951 952
    case CODEC_ID_VP6A:
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-vp6-alpha", NULL);
      break;

953 954 955 956
    case CODEC_ID_VP8:
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-vp8", NULL);
      break;

957
    case CODEC_ID_THEORA:
958
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-theora", NULL);
959 960
      break;

961
    case CODEC_ID_AAC:
962
    {
963
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/mpeg", NULL);
964 965 966 967 968

      if (!encode) {
        GValue arr = { 0, };
        GValue item = { 0, };

969 970 971 972 973 974 975 976 977 978 979
        g_value_init (&arr, GST_TYPE_LIST);
        g_value_init (&item, G_TYPE_INT);
        g_value_set_int (&item, 2);
        gst_value_list_append_value (&arr, &item);
        g_value_set_int (&item, 4);
        gst_value_list_append_value (&arr, &item);
        g_value_unset (&item);

        gst_caps_set_value (caps, "mpegversion", &arr);
        g_value_unset (&arr);

980 981 982 983 984 985 986 987 988 989 990 991 992
        g_value_init (&arr, GST_TYPE_LIST);
        g_value_init (&item, G_TYPE_STRING);
        g_value_set_string (&item, "raw");
        gst_value_list_append_value (&arr, &item);
        g_value_set_string (&item, "adts");
        gst_value_list_append_value (&arr, &item);
        g_value_set_string (&item, "adif");
        gst_value_list_append_value (&arr, &item);
        g_value_unset (&item);

        gst_caps_set_value (caps, "stream-format", &arr);
        g_value_unset (&arr);
      } else {
993 994
        gst_caps_set_simple (caps, "mpegversion", G_TYPE_INT, 4,
            "stream-format", G_TYPE_STRING, "raw",
995 996 997 998 999
            "base-profile", G_TYPE_STRING, "lc", NULL);

        if (context && context->extradata_size > 0)
          gst_codec_utils_aac_caps_set_level_and_profile (caps,
              context->extradata, context->extradata_size);
1000 1001 1002 1003 1004
      }

      break;
    }
    case CODEC_ID_AAC_LATM:    /* LATM/LOAS AAC syntax */
1005
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/mpeg",
1006 1007
          "mpegversion", G_TYPE_INT, 4, "stream-format", G_TYPE_STRING, "loas",
          NULL);
1008 1009 1010
      break;

    case CODEC_ID_ASV1:
1011 1012
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-asus",
          "asusversion", G_TYPE_INT, 1, NULL);
1013
      break;
1014
    case CODEC_ID_ASV2:
1015 1016
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-asus",
          "asusversion", G_TYPE_INT, 2, NULL);
1017 1018
      break;

1019
    case CODEC_ID_FFV1: