gstffmpegcodecmap.c 93.4 KB
Newer Older
1 2
/* GStreamer
 * Copyright (C) <1999> Erik Walthinsen <omega@cse.ogi.edu>
3
 * This file:
4
 * Copyright (c) 2002-2004 Ronald Bultje <rbultje@ronald.bitfreak.net>
5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Library General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Library General Public License for more details.
 *
 * You should have received a copy of the GNU Library General Public
 * License along with this library; if not, write to the
 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
 * Boston, MA 02111-1307, USA.
 */

22
#ifdef HAVE_CONFIG_H
23
#include "config.h"
24
#endif
25
#include <gst/gst.h>
26 27 28
#ifdef HAVE_FFMPEG_UNINSTALLED
#include <avcodec.h>
#else
29
#include <libavcodec/avcodec.h>
30
#endif
31
#include <string.h>
32

33
#include "gstffmpeg.h"
34 35
#include "gstffmpegcodecmap.h"

36 37 38 39 40
/*
 * Read a palette from a caps.
 */

static void
41
gst_ffmpeg_get_palette (const GstCaps * caps, AVCodecContext * context)
42 43 44 45 46 47
{
  GstStructure *str = gst_caps_get_structure (caps, 0);
  const GValue *palette_v;
  const GstBuffer *palette;

  /* do we have a palette? */
48
  if ((palette_v = gst_structure_get_value (str, "palette_data")) && context) {
49
    palette = gst_value_get_buffer (palette_v);
50
    if (GST_BUFFER_SIZE (palette) >= AVPALETTE_SIZE) {
51 52 53 54 55 56 57 58 59 60 61
      if (context->palctrl)
        av_free (context->palctrl);
      context->palctrl = av_malloc (sizeof (AVPaletteControl));
      context->palctrl->palette_changed = 1;
      memcpy (context->palctrl->palette, GST_BUFFER_DATA (palette),
          AVPALETTE_SIZE);
    }
  }
}

static void
62
gst_ffmpeg_set_palette (GstCaps * caps, AVCodecContext * context)
63 64
{
  if (context->palctrl) {
65
    GstBuffer *palette = gst_buffer_new_and_alloc (AVPALETTE_SIZE);
66 67 68

    memcpy (GST_BUFFER_DATA (palette), context->palctrl->palette,
        AVPALETTE_SIZE);
69
    gst_caps_set_simple (caps, "palette_data", GST_TYPE_BUFFER, palette, NULL);
70 71 72
  }
}

73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141
/* Lookup table pairing each ffmpeg channel mask with a GStreamer channel
 * position. The CH_TOP_* masks are paired with
 * GST_AUDIO_CHANNEL_POSITION_NONE.
 *
 * IMPORTANT: Keep this sorted by the ffmpeg channel masks */
static const struct
{
  guint64 ff;
  GstAudioChannelPosition gst;
} _ff_to_gst_layout[] = {
  {CH_FRONT_LEFT, GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT},
  {CH_FRONT_RIGHT, GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT},
  {CH_FRONT_CENTER, GST_AUDIO_CHANNEL_POSITION_FRONT_CENTER},
  {CH_LOW_FREQUENCY, GST_AUDIO_CHANNEL_POSITION_LFE},
  {CH_BACK_LEFT, GST_AUDIO_CHANNEL_POSITION_REAR_LEFT},
  {CH_BACK_RIGHT, GST_AUDIO_CHANNEL_POSITION_REAR_RIGHT},
  {CH_FRONT_LEFT_OF_CENTER, GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT_OF_CENTER},
  {CH_FRONT_RIGHT_OF_CENTER, GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT_OF_CENTER},
  {CH_BACK_CENTER, GST_AUDIO_CHANNEL_POSITION_REAR_CENTER},
  {CH_SIDE_LEFT, GST_AUDIO_CHANNEL_POSITION_SIDE_LEFT},
  {CH_SIDE_RIGHT, GST_AUDIO_CHANNEL_POSITION_SIDE_RIGHT},
  {CH_TOP_CENTER, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_TOP_FRONT_LEFT, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_TOP_FRONT_CENTER, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_TOP_FRONT_RIGHT, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_TOP_BACK_LEFT, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_TOP_BACK_CENTER, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_TOP_BACK_RIGHT, GST_AUDIO_CHANNEL_POSITION_NONE},
  {CH_STEREO_LEFT, GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT},
  {CH_STEREO_RIGHT, GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT}
};

/*
 * Translate an ffmpeg channel mask into an array of GStreamer channel
 * positions with one entry per channel.
 *
 * Returns NULL when the number of bits set in @channel_layout differs
 * from @channels, when no layout is given for more than two channels,
 * or when the result is plain front-center mono or front-left/right
 * stereo. Any other result is allocated with g_new() and must be
 * released with g_free().
 */
static GstAudioChannelPosition *
gst_ff_channel_layout_to_gst (guint64 channel_layout, guint channels)
{
  GstAudioChannelPosition *positions = NULL;
  gboolean use_none_layout = FALSE;
  gboolean is_common_case = FALSE;
  guint n_positions = 0, n_mapped = 0;
  guint bit, idx;

  /* count the channels announced by the mask */
  for (bit = 0; bit < 64; bit++) {
    if ((channel_layout & (G_GUINT64_CONSTANT (1) << bit)) != 0)
      n_positions++;
  }

  /* an empty mask means "no layout"; trust the channel count instead */
  if (channel_layout == 0) {
    n_positions = channels;
    use_none_layout = TRUE;
  }

  if (n_positions != channels) {
    GST_ERROR ("Number of channels is different (%u != %u)", channels,
        n_positions);
    return NULL;
  }

  positions = g_new (GstAudioChannelPosition, n_positions);

  /* walk the table in mask order and collect the matching positions */
  for (idx = 0; idx < G_N_ELEMENTS (_ff_to_gst_layout); idx++) {
    if ((channel_layout & _ff_to_gst_layout[idx].ff) == 0)
      continue;

    positions[n_mapped++] = _ff_to_gst_layout[idx].gst;
    if (_ff_to_gst_layout[idx].gst == GST_AUDIO_CHANNEL_POSITION_NONE)
      use_none_layout = TRUE;
  }

  if (n_mapped != n_positions) {
    GST_WARNING ("Unknown channels in channel layout - assuming NONE layout");
    use_none_layout = TRUE;
  }

  if (!use_none_layout
      && !gst_audio_check_channel_positions (positions, n_positions)) {
    GST_ERROR ("Invalid channel layout %" G_GUINT64_FORMAT
        " - assuming NONE layout", channel_layout);
    use_none_layout = TRUE;
  }

  if (use_none_layout) {
    switch (n_positions) {
      case 1:
        positions[0] = GST_AUDIO_CHANNEL_POSITION_FRONT_MONO;
        break;
      case 2:
        positions[0] = GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT;
        positions[1] = GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT;
        break;
      default:
        if (channel_layout == 0) {
          /* nothing known at all: report no positions */
          g_free (positions);
          positions = NULL;
        } else {
          for (idx = 0; idx < n_positions; idx++)
            positions[idx] = GST_AUDIO_CHANNEL_POSITION_NONE;
        }
        break;
    }
  }

  /* positions is only dereferenced for one or two channels, in which
   * case it was allocated above and never released */
  if (n_positions == 1
      && positions[0] == GST_AUDIO_CHANNEL_POSITION_FRONT_CENTER) {
    GST_DEBUG ("mono common case; won't set channel positions");
    is_common_case = TRUE;
  } else if (n_positions == 2
      && positions[0] == GST_AUDIO_CHANNEL_POSITION_FRONT_LEFT
      && positions[1] == GST_AUDIO_CHANNEL_POSITION_FRONT_RIGHT) {
    GST_DEBUG ("stereo common case; won't set channel positions");
    is_common_case = TRUE;
  }

  if (is_common_case) {
    g_free (positions);
    positions = NULL;
  }

  return positions;
}

177 178 179 180
/* This function creates caps with fixed or unfixed width/height
 * properties, depending on whether we've got a context.
 *
 * See below for why we use this.
 *
 * We should actually do this stuff at the end, like in riff-media.c,
 * but I'm too lazy today. Maybe later.
 */
static GstCaps *
186 187
gst_ff_vid_caps_new (AVCodecContext * context, enum CodecID codec_id,
    const char *mimetype, const char *fieldname, ...)
188 189 190 191
{
  GstStructure *structure = NULL;
  GstCaps *caps = NULL;
  va_list var_args;
192
  gint i;
193

194 195
  GST_LOG ("context:%p, codec_id:%d, mimetype:%s", context, codec_id, mimetype);

196 197
  /* fixed, non probing context */
  if (context != NULL && context->width != -1) {
198 199 200 201
    caps = gst_caps_new_simple (mimetype,
        "width", G_TYPE_INT, context->width,
        "height", G_TYPE_INT, context->height,
        "framerate", GST_TYPE_FRACTION,
202 203
        context->time_base.den / context->ticks_per_frame,
        context->time_base.num, NULL);
204
  } else {
205
    /* so we are after restricted caps in this case */
206
    switch (codec_id) {
207 208 209 210 211 212 213 214 215 216 217 218
      case CODEC_ID_H261:
      {
        caps = gst_caps_new_simple (mimetype,
            "width", G_TYPE_INT, 352,
            "height", G_TYPE_INT, 288,
            "framerate", GST_TYPE_FRACTION_RANGE, 0, 1, G_MAXINT, 1, NULL);
        gst_caps_append (caps, gst_caps_new_simple (mimetype,
                "width", G_TYPE_INT, 176,
                "height", G_TYPE_INT, 144,
                "framerate", GST_TYPE_FRACTION_RANGE, 0, 1, G_MAXINT, 1, NULL));
        break;
      }
219 220 221 222 223 224 225 226 227
      case CODEC_ID_H263:
      {
        /* 128x96, 176x144, 352x288, 704x576, and 1408x1152. slightly reordered
         * because we want automatic negotiation to go as close to 320x240 as
         * possible. */
        const static gint widths[] = { 352, 704, 176, 1408, 128 };
        const static gint heights[] = { 288, 576, 144, 1152, 96 };
        GstCaps *temp;
        gint n_sizes = G_N_ELEMENTS (widths);
228

229 230 231 232 233 234
        caps = gst_caps_new_empty ();
        for (i = 0; i < n_sizes; i++) {
          temp = gst_caps_new_simple (mimetype,
              "width", G_TYPE_INT, widths[i],
              "height", G_TYPE_INT, heights[i],
              "framerate", GST_TYPE_FRACTION_RANGE, 0, 1, G_MAXINT, 1, NULL);
235

236 237 238 239
          gst_caps_append (caps, temp);
        }
        break;
      }
240 241
      case CODEC_ID_DVVIDEO:
      {
242 243 244 245 246 247 248 249 250 251 252 253 254 255 256
        static struct
        {
          guint32 csp;
          gint width, height;
          gint par_n, par_d;
          gint framerate_n, framerate_d;
        } profiles[] = {
          {
          GST_MAKE_FOURCC ('Y', '4', '1', 'B'), 720, 480, 10, 11, 30000, 1001}, {
          GST_MAKE_FOURCC ('Y', '4', '1', 'B'), 720, 480, 40, 33, 30000, 1001}, {
          GST_MAKE_FOURCC ('I', '4', '2', '0'), 720, 576, 59, 54, 25, 1}, {
          GST_MAKE_FOURCC ('I', '4', '2', '0'), 720, 576, 118, 81, 25, 1}, {
          GST_MAKE_FOURCC ('Y', '4', '1', 'B'), 720, 576, 59, 54, 25, 1}, {
          GST_MAKE_FOURCC ('Y', '4', '1', 'B'), 720, 576, 118, 81, 25, 1}
        };
257
        GstCaps *temp;
258
        gint n_sizes = G_N_ELEMENTS (profiles);
259 260 261 262

        caps = gst_caps_new_empty ();
        for (i = 0; i < n_sizes; i++) {
          temp = gst_caps_new_simple (mimetype,
263 264 265 266 267
              "width", G_TYPE_INT, profiles[i].width,
              "height", G_TYPE_INT, profiles[i].height,
              "framerate", GST_TYPE_FRACTION, profiles[i].framerate_n,
              profiles[i].framerate_d, "pixel-aspect-ratio", GST_TYPE_FRACTION,
              profiles[i].par_n, profiles[i].par_d, NULL);
268 269

          gst_caps_append (caps, temp);
270
        }
271 272
        break;
      }
273 274
      case CODEC_ID_DNXHD:
      {
275
        caps = gst_caps_new_simple (mimetype,
276 277
            "width", G_TYPE_INT, 1920,
            "height", G_TYPE_INT, 1080,
278
            "framerate", GST_TYPE_FRACTION_RANGE, 0, 1, G_MAXINT, 1, NULL);
279 280 281 282 283 284 285
        gst_caps_append (caps, gst_caps_new_simple (mimetype,
                "width", G_TYPE_INT, 1280,
                "height", G_TYPE_INT, 720,
                "framerate", GST_TYPE_FRACTION_RANGE, 0, 1, G_MAXINT, 1, NULL));
        break;
      }
      default:
286 287 288 289
        break;
    }
  }

290 291
  /* no fixed caps or special restrictions applied;
   * default unfixed setting */
292 293
  if (!caps) {
    GST_DEBUG ("Creating default caps");
294 295 296 297
    caps = gst_caps_new_simple (mimetype,
        "width", GST_TYPE_INT_RANGE, 16, 4096,
        "height", GST_TYPE_INT_RANGE, 16, 4096,
        "framerate", GST_TYPE_FRACTION_RANGE, 0, 1, G_MAXINT, 1, NULL);
298
  }
299

300
  for (i = 0; i < gst_caps_get_size (caps); i++) {
301
    va_start (var_args, fieldname);
302
    structure = gst_caps_get_structure (caps, i);
303 304 305 306 307 308
    gst_structure_set_valist (structure, fieldname, var_args);
    va_end (var_args);
  }

  return caps;
}
309 310 311

/* same for audio - now with channels/sample rate
 */
312
static GstCaps *
313 314
gst_ff_aud_caps_new (AVCodecContext * context, enum CodecID codec_id,
    const char *mimetype, const char *fieldname, ...)
315 316 317
{
  GstCaps *caps = NULL;
  GstStructure *structure = NULL;
318
  gint i;
319 320
  va_list var_args;

321 322
  /* fixed, non-probing context */
  if (context != NULL && context->channels != -1) {
323 324
    GstAudioChannelPosition *pos;

325 326
    caps = gst_caps_new_simple (mimetype,
        "rate", G_TYPE_INT, context->sample_rate,
327
        "channels", G_TYPE_INT, context->channels, NULL);
328 329 330 331 332 333 334 335

    pos =
        gst_ff_channel_layout_to_gst (context->channel_layout,
        context->channels);
    if (pos != NULL) {
      gst_audio_set_channel_positions (gst_caps_get_structure (caps, 0), pos);
      g_free (pos);
    }
336
  } else {
337 338 339
    gint maxchannels = 2;
    const gint *rates = NULL;
    gint n_rates = 0;
340

341
    if (context) {
342 343 344 345 346 347 348 349 350 351
      /* so we must be after restricted caps in this particular case */
      switch (codec_id) {
        case CODEC_ID_MP2:
        {
          const static gint l_rates[] =
              { 48000, 44100, 32000, 24000, 22050, 16000 };
          n_rates = G_N_ELEMENTS (l_rates);
          rates = l_rates;
          break;
        }
352
        case CODEC_ID_EAC3:
353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 376
        case CODEC_ID_AC3:
        {
          const static gint l_rates[] = { 48000, 44100, 32000 };
          n_rates = G_N_ELEMENTS (l_rates);
          rates = l_rates;
          break;
        }
        case CODEC_ID_ADPCM_SWF:
        {
          const static gint l_rates[] = { 11025, 22050, 44100 };
          n_rates = G_N_ELEMENTS (l_rates);
          rates = l_rates;
          break;
        }
        case CODEC_ID_ROQ_DPCM:
        {
          const static gint l_rates[] = { 22050 };
          n_rates = G_N_ELEMENTS (l_rates);
          rates = l_rates;
          break;
        }
        case CODEC_ID_ADPCM_G726:
          maxchannels = 1;
          break;
377 378 379 380 381 382 383 384 385 386 387 388 389 390 391 392
        case CODEC_ID_AMR_NB:
        {
          const static gint l_rates[] = { 8000 };
          maxchannels = 1;
          n_rates = G_N_ELEMENTS (l_rates);
          rates = l_rates;
          break;
        }
        case CODEC_ID_AMR_WB:
        {
          const static gint l_rates[] = { 16000 };
          maxchannels = 1;
          n_rates = G_N_ELEMENTS (l_rates);
          rates = l_rates;
          break;
        }
393 394 395
        default:
          break;
      }
396 397 398 399 400

      /* TODO: handle context->channel_layouts here to set
       * the list of channel layouts supported by the encoder.
       * Unfortunately no encoder uses this yet....
       */
401 402 403 404 405 406 407
    }

    /* regardless of encode/decode, open up channels if applicable */
    /* Until decoders/encoders expose the maximum number of channels
     * they support, we whitelist them here. */
    switch (codec_id) {
      case CODEC_ID_AC3:
408
      case CODEC_ID_EAC3:
409 410 411 412 413 414 415
      case CODEC_ID_AAC:
      case CODEC_ID_DTS:
        maxchannels = 6;
        break;
      default:
        break;
    }
416

417 418 419 420 421 422 423 424 425 426 427 428 429 430 431 432 433 434 435 436 437 438 439
    if (maxchannels == 1)
      caps = gst_caps_new_simple (mimetype,
          "channels", G_TYPE_INT, maxchannels, NULL);
    else
      caps = gst_caps_new_simple (mimetype,
          "channels", GST_TYPE_INT_RANGE, 1, maxchannels, NULL);
    if (n_rates) {
      GValue list = { 0, };
      GstStructure *structure;

      g_value_init (&list, GST_TYPE_LIST);
      for (i = 0; i < n_rates; i++) {
        GValue v = { 0, };

        g_value_init (&v, G_TYPE_INT);
        g_value_set_int (&v, rates[i]);
        gst_value_list_append_value (&list, &v);
        g_value_unset (&v);
      }
      structure = gst_caps_get_structure (caps, 0);
      gst_structure_set_value (structure, "rate", &list);
      g_value_unset (&list);
    } else
440
      gst_caps_set_simple (caps, "rate", GST_TYPE_INT_RANGE, 4000, 96000, NULL);
441 442
  }

443
  for (i = 0; i < gst_caps_get_size (caps); i++) {
444
    va_start (var_args, fieldname);
445
    structure = gst_caps_get_structure (caps, i);
446 447 448 449 450 451
    gst_structure_set_valist (structure, fieldname, var_args);
    va_end (var_args);
  }

  return caps;
}
452 453 454 455 456 457

/* Convert a FFMPEG codec ID and optional AVCodecContext
 * to a GstCaps. If the context is omitted, no fixed values
 * for video/audio size will be included in the GstCaps.
 *
 * CodecID is primarily meant for compressed data GstCaps!
 *
 * encode is a special parameter. gstffmpegdec will say
 * FALSE, gstffmpegenc will say TRUE. The output caps
 * depend on this, in such a way that it will be very
 * specific, defined, fixed and correct caps for encoders,
 * yet very wide, "forgiving" caps for decoders. Example
 * for mp3: decode: audio/mpeg,mpegversion=1,layer=[1-3]
 * but encode: audio/mpeg,mpegversion=1,layer=3,bitrate=x,
 * rate=x,channels=x.
 */

469
GstCaps *
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
470 471
gst_ffmpeg_codecid_to_caps (enum CodecID codec_id,
    AVCodecContext * context, gboolean encode)
472
{
473
  GstCaps *caps = NULL;
474
  gboolean buildcaps = FALSE;
475

476 477
  GST_LOG ("codec_id:%d, context:%p, encode:%d", codec_id, context, encode);

478
  switch (codec_id) {
479
    case CODEC_ID_MPEG1VIDEO:
480 481 482 483
      /* FIXME: bitrate */
      caps = gst_ff_vid_caps_new (context, codec_id, "video/mpeg",
          "mpegversion", G_TYPE_INT, 1,
          "systemstream", G_TYPE_BOOLEAN, FALSE, NULL);
484 485 486 487 488
      break;

    case CODEC_ID_MPEG2VIDEO:
      if (encode) {
        /* FIXME: bitrate */
489
        caps = gst_ff_vid_caps_new (context, codec_id, "video/mpeg",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
490 491
            "mpegversion", G_TYPE_INT, 2,
            "systemstream", G_TYPE_BOOLEAN, FALSE, NULL);
492 493 494 495
      } else {
        /* decode both MPEG-1 and MPEG-2; width/height/fps are all in
         * the MPEG video stream headers, so may be omitted from caps. */
        caps = gst_caps_new_simple ("video/mpeg",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
496 497
            "mpegversion", GST_TYPE_INT_RANGE, 1, 2,
            "systemstream", G_TYPE_BOOLEAN, FALSE, NULL);
498
      }
499
      break;
500 501 502 503 504 505

    case CODEC_ID_MPEG2VIDEO_XVMC:
      /* this is a special ID - don't need it in GStreamer, I think */
      break;

    case CODEC_ID_H263:
506
      if (encode) {
507
        caps = gst_ff_vid_caps_new (context, codec_id, "video/x-h263",
508 509 510
            "variant", G_TYPE_STRING, "itu",
            "h263version", G_TYPE_STRING, "h263", NULL);
      } else {
511 512 513 514
        /* don't pass codec_id, we can decode other variants with the H263
         * decoder that don't have specific size requirements
         */
        caps = gst_ff_vid_caps_new (context, CODEC_ID_NONE, "video/x-h263",
515 516
            "variant", G_TYPE_STRING, "itu", NULL);
      }
517 518 519
      break;

    case CODEC_ID_H263P:
520
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-h263",
521 522
          "variant", G_TYPE_STRING, "itu",
          "h263version", G_TYPE_STRING, "h263p", NULL);
523
      break;
524

525
    case CODEC_ID_H263I:
526
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-intel-h263",
527
          "variant", G_TYPE_STRING, "intel", NULL);
528 529
      break;

530
    case CODEC_ID_H261:
531
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-h261", NULL);
532 533
      break;

534
    case CODEC_ID_RV10:
535
    case CODEC_ID_RV20:
536
    case CODEC_ID_RV30:
537
    case CODEC_ID_RV40:
538 539
    {
      gint version;
540

541 542 543 544
      switch (codec_id) {
        case CODEC_ID_RV40:
          version = 4;
          break;
545 546 547
        case CODEC_ID_RV30:
          version = 3;
          break;
548 549 550 551 552 553 554
        case CODEC_ID_RV20:
          version = 2;
          break;
        default:
          version = 1;
          break;
      }
555

556 557 558 559 560
      /* FIXME: context->sub_id must be filled in during decoding */
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-pn-realvideo",
          "systemstream", G_TYPE_BOOLEAN, FALSE,
          "rmversion", G_TYPE_INT, version, NULL);
      if (context) {
561
        gst_caps_set_simple (caps, "format", G_TYPE_INT, context->sub_id, NULL);
562 563
        if (context->extradata_size >= 8) {
          gst_caps_set_simple (caps,
564 565 566
              "subformat", G_TYPE_INT, GST_READ_UINT32_BE (context->extradata),
              NULL);
        }
567
      }
568
    }
569
      break;
570

571 572 573 574 575 576
    case CODEC_ID_MP1:
      /* FIXME: bitrate */
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/mpeg",
          "mpegversion", G_TYPE_INT, 1, "layer", G_TYPE_INT, 1, NULL);
      break;

577
    case CODEC_ID_MP2:
578 579 580
      /* FIXME: bitrate */
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/mpeg",
          "mpegversion", G_TYPE_INT, 1, "layer", G_TYPE_INT, 2, NULL);
581
      break;
582

583 584 585
    case CODEC_ID_MP3:
      if (encode) {
        /* FIXME: bitrate */
586
        caps = gst_ff_aud_caps_new (context, codec_id, "audio/mpeg",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
587
            "mpegversion", G_TYPE_INT, 1, "layer", G_TYPE_INT, 3, NULL);
588 589 590 591
      } else {
        /* Decodes MPEG-1 layer 1/2/3. Samplerate, channels et al are
         * in the MPEG audio header, so may be omitted from caps. */
        caps = gst_caps_new_simple ("audio/mpeg",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
592 593
            "mpegversion", G_TYPE_INT, 1,
            "layer", GST_TYPE_INT_RANGE, 1, 3, NULL);
594
      }
595
      break;
596

597 598 599 600 601 602 603
    case CODEC_ID_MUSEPACK7:
      caps =
          gst_ff_aud_caps_new (context, codec_id,
          "audio/x-ffmpeg-parsed-musepack", "streamversion", G_TYPE_INT, 7,
          NULL);
      break;

604 605 606 607 608 609 610
    case CODEC_ID_MUSEPACK8:
      caps =
          gst_ff_aud_caps_new (context, codec_id,
          "audio/x-ffmpeg-parsed-musepack", "streamversion", G_TYPE_INT, 8,
          NULL);
      break;

611 612 613
    case CODEC_ID_AC3:
      /* FIXME: bitrate */
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-ac3", NULL);
614
      break;
615

616 617 618 619 620
    case CODEC_ID_EAC3:
      /* FIXME: bitrate */
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-eac3", NULL);
      break;

621
    case CODEC_ID_ATRAC3:
622 623 624
      caps =
          gst_ff_aud_caps_new (context, codec_id, "audio/x-vnd.sony.atrac3",
          NULL);
625
      break;
626

627
    case CODEC_ID_DTS:
628
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-dts", NULL);
629
      break;
630

631 632 633 634 635 636
    case CODEC_ID_APE:
      caps =
          gst_ff_aud_caps_new (context, codec_id, "audio/x-ffmpeg-parsed-ape",
          NULL);
      if (context) {
        gst_caps_set_simple (caps,
637
            "depth", G_TYPE_INT, context->bits_per_coded_sample, NULL);
638 639 640
      }
      break;

641 642 643
    case CODEC_ID_MLP:
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-mlp", NULL);
      break;
644

645 646 647
    case CODEC_ID_IMC:
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-imc", NULL);
      break;
648

Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
649 650 651 652 653
      /* MJPEG is normal JPEG, Motion-JPEG and Quicktime MJPEG-A. MJPEGB
       * is Quicktime's MJPEG-B. LJPEG is lossless JPEG. I don't know what
       * sp5x is, but it's apparently something JPEG... We don't separate
       * between those in GStreamer. Should we (at least between MJPEG,
       * MJPEG-B and sp5x decoding...)? */
654
    case CODEC_ID_MJPEG:
655
    case CODEC_ID_LJPEG:
656
      caps = gst_ff_vid_caps_new (context, codec_id, "image/jpeg", NULL);
Wim Taymans's avatar
Wim Taymans committed
657
      break;
658

659
    case CODEC_ID_SP5X:
660
      caps = gst_ff_vid_caps_new (context, codec_id, "video/sp5x", NULL);
661 662
      break;

663
    case CODEC_ID_MJPEGB:
664
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-mjpeg-b", NULL);
665 666
      break;

667
    case CODEC_ID_MPEG4:
668
      if (encode && context != NULL) {
669 670
        /* I'm not exactly sure what ffmpeg outputs... ffmpeg itself uses
         * the AVI fourcc 'DIVX', but 'mp4v' for Quicktime... */
671
        switch (context->codec_tag) {
672
          case GST_MAKE_FOURCC ('D', 'I', 'V', 'X'):
673
            caps = gst_ff_vid_caps_new (context, codec_id, "video/x-divx",
Thomas Vander Stichele's avatar
Thomas Vander Stichele committed
674
                "divxversion", G_TYPE_INT, 5, NULL);
675 676 677 678
            break;
          case GST_MAKE_FOURCC ('m', 'p', '4', 'v'):
          default:
            /* FIXME: bitrate */
679
            caps = gst_ff_vid_caps_new (context, codec_id, "video/mpeg",
680 681 682 683
                "systemstream", G_TYPE_BOOLEAN, FALSE,
                "mpegversion", G_TYPE_INT, 4, NULL);
            break;
        }
684 685
      } else {
        /* The trick here is to separate xvid, divx, mpeg4, 3ivx et al */
686
        caps = gst_ff_vid_caps_new (context, codec_id, "video/mpeg",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
687 688
            "mpegversion", G_TYPE_INT, 4,
            "systemstream", G_TYPE_BOOLEAN, FALSE, NULL);
689
        if (encode) {
690 691
          gst_caps_append (caps, gst_ff_vid_caps_new (context, codec_id,
                  "video/x-divx", "divxversion", G_TYPE_INT, 5, NULL));
692
        } else {
693 694 695 696 697 698 699
          gst_caps_append (caps, gst_ff_vid_caps_new (context, codec_id,
                  "video/x-divx", "divxversion", GST_TYPE_INT_RANGE, 4, 5,
                  NULL));
          gst_caps_append (caps, gst_ff_vid_caps_new (context, codec_id,
                  "video/x-xvid", NULL));
          gst_caps_append (caps, gst_ff_vid_caps_new (context, codec_id,
                  "video/x-3ivx", NULL));
700
        }
701
      }
702
      break;
703

704
    case CODEC_ID_RAWVIDEO:
705 706
      caps = gst_ffmpeg_codectype_to_caps (CODEC_TYPE_VIDEO, context, codec_id,
          encode);
707
      break;
708

709
    case CODEC_ID_MSMPEG4V1:
710 711
    case CODEC_ID_MSMPEG4V2:
    case CODEC_ID_MSMPEG4V3:
712 713 714 715 716 717 718 719 720
    {
      gint version = 41 + codec_id - CODEC_ID_MSMPEG4V1;

      /* encode-FIXME: bitrate */
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-msmpeg",
          "msmpegversion", G_TYPE_INT, version, NULL);
      if (!encode && codec_id == CODEC_ID_MSMPEG4V3) {
        gst_caps_append (caps, gst_ff_vid_caps_new (context, codec_id,
                "video/x-divx", "divxversion", G_TYPE_INT, 3, NULL));
721
      }
722
    }
723
      break;
724

725
    case CODEC_ID_WMV1:
726
    case CODEC_ID_WMV2:
727 728
    {
      gint version = (codec_id == CODEC_ID_WMV1) ? 1 : 2;
729

730 731 732
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-wmv",
          "wmvversion", G_TYPE_INT, version, NULL);
    }
733
      break;
734

735
    case CODEC_ID_FLV1:
736 737
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-flash-video",
          "flvversion", G_TYPE_INT, 1, NULL);
738
      break;
739

740
    case CODEC_ID_SVQ1:
741
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-svq",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
742
          "svqversion", G_TYPE_INT, 1, NULL);
743
      break;
744 745

    case CODEC_ID_SVQ3:
746
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-svq",
747
          "svqversion", G_TYPE_INT, 3, NULL);
748
      break;
749

750
    case CODEC_ID_DVAUDIO:
751
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-dv", NULL);
752
      break;
753

754
    case CODEC_ID_DVVIDEO:
755 756 757 758 759
    {
      if (encode && context) {
        guint32 fourcc;

        switch (context->pix_fmt) {
760
          case PIX_FMT_YUYV422:
761 762 763 764 765 766 767 768 769 770 771 772 773 774 775 776 777 778 779 780 781 782 783 784 785 786 787
            fourcc = GST_MAKE_FOURCC ('Y', 'U', 'Y', '2');
            break;
          case PIX_FMT_YUV420P:
            fourcc = GST_MAKE_FOURCC ('I', '4', '2', '0');
            break;
          case PIX_FMT_YUV411P:
            fourcc = GST_MAKE_FOURCC ('Y', '4', '1', 'B');
            break;
          case PIX_FMT_YUV422P:
            fourcc = GST_MAKE_FOURCC ('Y', '4', '2', 'B');
            break;
          case PIX_FMT_YUV410P:
            fourcc = GST_MAKE_FOURCC ('Y', 'U', 'V', '9');
            break;
          default:
            GST_WARNING
                ("Couldnt' find fourcc for pixfmt %d, defaulting to I420",
                context->pix_fmt);
            fourcc = GST_MAKE_FOURCC ('I', '4', '2', '0');
            break;
        }
        caps = gst_ff_vid_caps_new (context, codec_id, "video/x-dv",
            "systemstream", G_TYPE_BOOLEAN, FALSE,
            "format", GST_TYPE_FOURCC, fourcc, NULL);
      } else {
        caps = gst_ff_vid_caps_new (context, codec_id, "video/x-dv",
            "systemstream", G_TYPE_BOOLEAN, FALSE, NULL);
788
      }
789
    }
790
      break;
791

792 793
    case CODEC_ID_WMAV1:
    case CODEC_ID_WMAV2:
794 795
    {
      gint version = (codec_id == CODEC_ID_WMAV1) ? 1 : 2;
796

797 798 799 800 801 802 803 804 805 806
      if (context) {
        caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-wma",
            "wmaversion", G_TYPE_INT, version,
            "block_align", G_TYPE_INT, context->block_align,
            "bitrate", G_TYPE_INT, context->bit_rate, NULL);
      } else {
        caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-wma",
            "wmaversion", G_TYPE_INT, version,
            "block_align", GST_TYPE_INT_RANGE, 0, G_MAXINT,
            "bitrate", GST_TYPE_INT_RANGE, 0, G_MAXINT, NULL);
807
      }
808
    }
809
      break;
810

811 812
    case CODEC_ID_MACE3:
    case CODEC_ID_MACE6:
813 814
    {
      gint version = (codec_id == CODEC_ID_MACE3) ? 3 : 6;
815

816 817 818
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-mace",
          "maceversion", G_TYPE_INT, version, NULL);
    }
819
      break;
820

Wim Taymans's avatar
Wim Taymans committed
821
    case CODEC_ID_HUFFYUV:
822
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-huffyuv", NULL);
823 824
      if (context) {
        gst_caps_set_simple (caps,
825
            "bpp", G_TYPE_INT, context->bits_per_coded_sample, NULL);
826
      }
827 828 829
      break;

    case CODEC_ID_CYUV:
830 831 832
      caps =
          gst_ff_vid_caps_new (context, codec_id, "video/x-compressed-yuv",
          NULL);
833 834 835
      break;

    case CODEC_ID_H264:
836
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-h264", NULL);
837 838 839
      break;

    case CODEC_ID_INDEO3:
840
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-indeo",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
841
          "indeoversion", G_TYPE_INT, 3, NULL);
842 843
      break;

844
    case CODEC_ID_INDEO2:
845
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-indeo",
846 847 848
          "indeoversion", G_TYPE_INT, 2, NULL);
      break;

849
    case CODEC_ID_FLASHSV:
850 851
      caps =
          gst_ff_vid_caps_new (context, codec_id, "video/x-flash-screen", NULL);
852 853
      break;

854
    case CODEC_ID_VP3:
855
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-vp3", NULL);
856 857
      break;

858
    case CODEC_ID_VP5:
859
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-vp5", NULL);
860 861 862
      break;

    case CODEC_ID_VP6:
863
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-vp6", NULL);
864 865 866
      break;

    case CODEC_ID_VP6F:
867
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-vp6-flash", NULL);
868 869
      break;

870 871 872 873
    case CODEC_ID_VP6A:
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-vp6-alpha", NULL);
      break;

874
    case CODEC_ID_THEORA:
875
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-theora", NULL);
876 877
      break;

878
    case CODEC_ID_AAC:
879
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/mpeg",
880
          "mpegversion", G_TYPE_INT, 4, NULL);
881 882 883
      break;

    case CODEC_ID_ASV1:
884 885
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-asus",
          "asusversion", G_TYPE_INT, 1, NULL);
886
      break;
887
    case CODEC_ID_ASV2:
888 889
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-asus",
          "asusversion", G_TYPE_INT, 2, NULL);
890 891
      break;

892
    case CODEC_ID_FFV1:
893
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-ffv",
Thomas Vander Stichele's avatar
indent  
Thomas Vander Stichele committed
894
          "ffvversion", G_TYPE_INT, 1, NULL);
895 896 897
      break;

    case CODEC_ID_4XM:
898
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-4xm", NULL);
899 900
      break;

901 902
    case CODEC_ID_XAN_WC3:
    case CODEC_ID_XAN_WC4:
903
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-xan",
904 905 906
          "wcversion", G_TYPE_INT, 3 - CODEC_ID_XAN_WC3 + codec_id, NULL);
      break;

907
    case CODEC_ID_CLJR:
908 909 910
      caps =
          gst_ff_vid_caps_new (context, codec_id,
          "video/x-cirrus-logic-accupak", NULL);
911 912 913
      break;

    case CODEC_ID_FRAPS:
914 915 916
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-fraps", NULL);
      break;

917 918 919 920 921 922
    case CODEC_ID_MDEC:
    case CODEC_ID_ROQ:
    case CODEC_ID_INTERPLAY_VIDEO:
      buildcaps = TRUE;
      break;

923
    case CODEC_ID_VCR1:
924 925
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-ati-vcr",
          "vcrversion", G_TYPE_INT, 1, NULL);
926 927
      break;

928
    case CODEC_ID_RPZA:
929 930
      caps =
          gst_ff_vid_caps_new (context, codec_id, "video/x-apple-video", NULL);
931 932
      break;

933
    case CODEC_ID_CINEPAK:
934
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-cinepak", NULL);
935 936
      break;

937
      /* WS_VQA belongs here (order) */
938 939

    case CODEC_ID_MSRLE:
940
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-rle",
Thomas Vander Stichele's avatar
Thomas Vander Stichele committed
941
          "layout", G_TYPE_STRING, "microsoft", NULL);
942 943
      if (context) {
        gst_caps_set_simple (caps,
944
            "depth", G_TYPE_INT, (gint) context->bits_per_coded_sample, NULL);
945 946 947 948 949
      } else {
        gst_caps_set_simple (caps, "depth", GST_TYPE_INT_RANGE, 1, 64, NULL);
      }
      break;

950
    case CODEC_ID_QTRLE:
951
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-rle",
952 953 954
          "layout", G_TYPE_STRING, "quicktime", NULL);
      if (context) {
        gst_caps_set_simple (caps,
955
            "depth", G_TYPE_INT, (gint) context->bits_per_coded_sample, NULL);
956 957 958 959 960
      } else {
        gst_caps_set_simple (caps, "depth", GST_TYPE_INT_RANGE, 1, 64, NULL);
      }
      break;

961
    case CODEC_ID_MSVIDEO1:
962
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-msvideocodec",
Thomas Vander Stichele's avatar
Thomas Vander Stichele committed
963
          "msvideoversion", G_TYPE_INT, 1, NULL);
964 965
      break;

966
    case CODEC_ID_WMV3:
967
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-wmv",
Jan Schmidt's avatar
Jan Schmidt committed
968 969
          "wmvversion", G_TYPE_INT, 3, "format", GST_TYPE_FOURCC,
          GST_MAKE_FOURCC ('W', 'M', 'V', '3'), NULL);
970
      break;
971 972
    case CODEC_ID_VC1:
      caps = gst_ff_vid_caps_new (context, codec_id, "video/x-wmv",
Jan Schmidt's avatar
Jan Schmidt committed
973
          "wmvversion", G_TYPE_INT, 3, "format", GST_TYPE_FOURCC,
974
          GST_MAKE_FOURCC ('W', 'V', 'C', '1'), NULL);
975
      break;
976
    case CODEC_ID_QDM2:
977 978
      caps = gst_ff_aud_caps_new (context, codec_id, "audio/x-qdm2", NULL);
      break;
979

980
    case CODEC_ID_MSZH: