Blame gst/avi/gstavisubtitle.c

Packit 1f69a5
/* GStreamer AVI GAB2 subtitle parser
 * Copyright (C) <2007> Thijs Vermeir <thijsvermeir@gmail.com>
 * Copyright (C) <2007> Tim-Philipp Müller <tim centricular net>
 *
 * This library is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Library General Public
 * License as published by the Free Software Foundation; either
 * version 2 of the License, or (at your option) any later version.
 *
 * This library is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Library General Public License for more details.
 *
 * You should have received a copy of the GNU Library General Public
 * License along with this library; if not, write to the
 * Free Software Foundation, Inc., 51 Franklin St, Fifth Floor,
 * Boston, MA 02110-1301, USA.
 */
Packit 1f69a5
Packit 1f69a5
/**
 * SECTION:element-avisubtitle
 *
 * <refsect2>
 * <para>
 * Parses the subtitle stream from an avi file.
 * </para>
 * <title>Example launch line</title>
 * <para>
 * <programlisting>
 * gst-launch-1.0 filesrc location=subtitle.avi ! avidemux name=demux ! queue ! avisubtitle ! subparse ! textoverlay name=overlay ! videoconvert ! autovideosink demux. ! queue ! decodebin ! overlay.
 * </programlisting>
 * This plays an avi file with a video and subtitle stream.
 * </para>
 * </refsect2>
 */
Packit 1f69a5
Packit 1f69a5
/* example of a subtitle chunk in an avi file
 * 00000000: 47 41 42 32 00 02 00 10 00 00 00 45 00 6e 00 67  GAB2.......E.n.g
 * 00000010: 00 6c 00 69 00 73 00 68 00 00 00 04 00 8e 00 00  .l.i.s.h........
 * 00000020: 00 ef bb bf 31 0d 0a 30 30 3a 30 30 3a 30 30 2c  ....1..00:00:00,
 * 00000030: 31 30 30 20 2d 2d 3e 20 30 30 3a 30 30 3a 30 32  100 --> 00:00:02
 * 00000040: 2c 30 30 30 0d 0a 3c 62 3e 41 6e 20 55 54 46 38  ,000..<b>An UTF8
 * 00000050: 20 53 75 62 74 69 74 6c 65 20 77 69 74 68 20 42   Subtitle with B
 * 00000060: 4f 4d 3c 2f 62 3e 0d 0a 0d 0a 32 0d 0a 30 30 3a  OM</b>....2..00:
 * 00000070: 30 30 3a 30 32 2c 31 30 30 20 2d 2d 3e 20 30 30  00:02,100 --> 00
 * 00000080: 3a 30 30 3a 30 34 2c 30 30 30 0d 0a 53 6f 6d 65  :00:04,000..Some
 * 00000090: 74 68 69 6e 67 20 6e 6f 6e 41 53 43 49 49 20 2d  thing nonASCII -
 * 000000a0: 20 c2 b5 c3 b6 c3 a4 c3 bc c3 9f 0d 0a 0d 0a      ..............
 */
Packit 1f69a5
Packit 1f69a5
#ifdef HAVE_CONFIG_H
Packit 1f69a5
#include "config.h"
Packit 1f69a5
#endif
Packit 1f69a5
Packit 1f69a5
#include <string.h>
Packit 1f69a5
Packit 1f69a5
#include "gstavisubtitle.h"
Packit 1f69a5
Packit 1f69a5
/* File-local debug category; GST_CAT_DEFAULT makes it the category used by
 * the GST_*_OBJECT logging macros throughout this file. */
GST_DEBUG_CATEGORY_STATIC (avisubtitle_debug);
#define GST_CAT_DEFAULT avisubtitle_debug
Packit 1f69a5
Packit 1f69a5
static GstStaticPadTemplate sink_template = GST_STATIC_PAD_TEMPLATE ("sink",
Packit 1f69a5
    GST_PAD_SINK,
Packit 1f69a5
    GST_PAD_ALWAYS,
Packit 1f69a5
    GST_STATIC_CAPS ("application/x-subtitle-avi")
Packit 1f69a5
    );
Packit 1f69a5
Packit 1f69a5
static GstStaticPadTemplate src_template = GST_STATIC_PAD_TEMPLATE ("src",
Packit 1f69a5
    GST_PAD_SRC,
Packit 1f69a5
    GST_PAD_ALWAYS,
Packit 1f69a5
    GST_STATIC_CAPS ("application/x-subtitle")
Packit 1f69a5
    );
Packit 1f69a5
Packit 1f69a5
static void gst_avi_subtitle_title_tag (GstAviSubtitle * sub, gchar * title);
Packit 1f69a5
static GstFlowReturn gst_avi_subtitle_chain (GstPad * pad, GstObject * parent,
Packit 1f69a5
    GstBuffer * buffer);
Packit 1f69a5
static GstStateChangeReturn gst_avi_subtitle_change_state (GstElement * element,
Packit 1f69a5
    GstStateChange transition);
Packit 1f69a5
static gboolean gst_avi_subtitle_send_event (GstElement * element,
Packit 1f69a5
    GstEvent * event);
Packit 1f69a5
Packit 1f69a5
/* Register the GstAviSubtitle type as a GstElement subclass.  The alias lets
 * the rest of the file refer to the generated parent-class pointer simply as
 * "parent_class". */
#define gst_avi_subtitle_parent_class parent_class
G_DEFINE_TYPE (GstAviSubtitle, gst_avi_subtitle, GST_TYPE_ELEMENT);
Packit 1f69a5
Packit 1f69a5
/* Byte-order-mark tests on the bytes at @data.
 *
 * IS_BOM_UTF8 reads a 32-bit big-endian value and discards its low byte, so
 * it compares the first three bytes against EF BB BF; the caller in this file
 * only uses it when at least four bytes are available.  The UTF-16 tests read
 * a 16-bit value and the UTF-32 tests a 32-bit value in the given byte
 * order, each compared against the code point U+FEFF. */
#define IS_BOM_UTF8(data)     ((GST_READ_UINT32_BE (data) >> 8) == 0xEFBBBF)
#define IS_BOM_UTF16_BE(data) (GST_READ_UINT16_BE (data) == 0xFEFF)
#define IS_BOM_UTF16_LE(data) (GST_READ_UINT16_LE (data) == 0xFEFF)
#define IS_BOM_UTF32_BE(data) (GST_READ_UINT32_BE (data) == 0xFEFF)
#define IS_BOM_UTF32_LE(data) (GST_READ_UINT32_LE (data) == 0xFEFF)
Packit 1f69a5
Packit 1f69a5
static GstBuffer *
Packit 1f69a5
gst_avi_subtitle_extract_file (GstAviSubtitle * sub, GstBuffer * buffer,
Packit 1f69a5
    guint offset, guint len)
Packit 1f69a5
{
Packit 1f69a5
  const gchar *input_enc = NULL;
Packit 1f69a5
  GstBuffer *ret = NULL;
Packit 1f69a5
  gchar *data;
Packit 1f69a5
  GstMapInfo map;
Packit 1f69a5
Packit 1f69a5
  gst_buffer_map (buffer, &map, GST_MAP_READ);
Packit 1f69a5
  data = (gchar *) (map.data + offset);
Packit 1f69a5
Packit 1f69a5
  if (len >= (3 + 1) && IS_BOM_UTF8 (data) &&
Packit 1f69a5
      g_utf8_validate (data + 3, len - 3, NULL)) {
Packit 1f69a5
    ret =
Packit 1f69a5
        gst_buffer_copy_region (buffer, GST_BUFFER_COPY_ALL, offset + 3,
Packit 1f69a5
        len - 3);
Packit 1f69a5
  } else if (len >= 2 && IS_BOM_UTF16_BE (data)) {
Packit 1f69a5
    input_enc = "UTF-16BE";
Packit 1f69a5
    data += 2;
Packit 1f69a5
    len -= 2;
Packit 1f69a5
  } else if (len >= 2 && IS_BOM_UTF16_LE (data)) {
Packit 1f69a5
    input_enc = "UTF-16LE";
Packit 1f69a5
    data += 2;
Packit 1f69a5
    len -= 2;
Packit 1f69a5
  } else if (len >= 4 && IS_BOM_UTF32_BE (data)) {
Packit 1f69a5
    input_enc = "UTF-32BE";
Packit 1f69a5
    data += 4;
Packit 1f69a5
    len -= 4;
Packit 1f69a5
  } else if (len >= 4 && IS_BOM_UTF32_LE (data)) {
Packit 1f69a5
    input_enc = "UTF-32LE";
Packit 1f69a5
    data += 4;
Packit 1f69a5
    len -= 4;
Packit 1f69a5
  } else if (g_utf8_validate (data, len, NULL)) {
Packit 1f69a5
    /* not specified, check if it's UTF-8 */
Packit 1f69a5
    ret = gst_buffer_copy_region (buffer, GST_BUFFER_COPY_ALL, offset, len);
Packit 1f69a5
  } else {
Packit 1f69a5
    /* we could fall back to gst_tag_freeform_to_utf8() here */
Packit 1f69a5
    GST_WARNING_OBJECT (sub, "unspecified encoding, and not UTF-8");
Packit 1f69a5
    ret = NULL;
Packit 1f69a5
    goto done;
Packit 1f69a5
  }
Packit 1f69a5
Packit 1f69a5
  g_return_val_if_fail (ret != NULL || input_enc != NULL, NULL);
Packit 1f69a5
Packit 1f69a5
  if (input_enc) {
Packit 1f69a5
    GError *err = NULL;
Packit 1f69a5
    gchar *utf8;
Packit 1f69a5
    gsize slen;
Packit 1f69a5
Packit 1f69a5
    GST_DEBUG_OBJECT (sub, "converting subtitles from %s to UTF-8", input_enc);
Packit 1f69a5
    utf8 = g_convert (data, len, "UTF-8", input_enc, NULL, NULL, &err;;
Packit 1f69a5
Packit 1f69a5
    if (err != NULL) {
Packit 1f69a5
      GST_WARNING_OBJECT (sub, "conversion to UTF-8 failed : %s", err->message);
Packit 1f69a5
      g_error_free (err);
Packit 1f69a5
      ret = NULL;
Packit 1f69a5
      goto done;
Packit 1f69a5
    }
Packit 1f69a5
Packit 1f69a5
    ret = gst_buffer_new ();
Packit 1f69a5
    slen = strlen (utf8);
Packit 1f69a5
    gst_buffer_append_memory (ret,
Packit 1f69a5
        gst_memory_new_wrapped (0, utf8, slen, 0, slen, utf8, g_free));
Packit 1f69a5
Packit 1f69a5
    GST_BUFFER_OFFSET (ret) = 0;
Packit 1f69a5
  }
Packit 1f69a5
Packit 1f69a5
done:
Packit 1f69a5
  gst_buffer_unmap (buffer, &map);
Packit 1f69a5
Packit 1f69a5
  return ret;
Packit 1f69a5
}
Packit 1f69a5
Packit 1f69a5
/**
Packit 1f69a5
 * gst_avi_subtitle_title_tag:
Packit 1f69a5
 * @sub: subtitle element
Packit 1f69a5
 * @title: the title of this subtitle stream
Packit 1f69a5
 *
Packit 1f69a5
 * Send an event to the srcpad of the @sub element with the title
Packit 1f69a5
 * of the subtitle stream as a GST_TAG_TITLE
Packit 1f69a5
 */
Packit 1f69a5
static void
Packit 1f69a5
gst_avi_subtitle_title_tag (GstAviSubtitle * sub, gchar * title)
Packit 1f69a5
{
Packit 1f69a5
  gst_pad_push_event (sub->src,
Packit 1f69a5
      gst_event_new_tag (gst_tag_list_new (GST_TAG_TITLE, title, NULL)));
Packit 1f69a5
}
Packit 1f69a5
Packit 1f69a5
static GstFlowReturn
Packit 1f69a5
gst_avi_subtitle_parse_gab2_chunk (GstAviSubtitle * sub, GstBuffer * buf)
Packit 1f69a5
{
Packit 1f69a5
  gchar *name_utf8;
Packit 1f69a5
  guint name_length;
Packit 1f69a5
  guint file_length;
Packit 1f69a5
  GstMapInfo map;
Packit 1f69a5
Packit 1f69a5
  gst_buffer_map (buf, &map, GST_MAP_READ);
Packit 1f69a5
Packit 1f69a5
  /* check the magic word "GAB2\0", and the next word must be 2 */
Packit 1f69a5
  if (map.size < 12 || memcmp (map.data, "GAB2\0\2\0", 5 + 2) != 0)
Packit 1f69a5
    goto wrong_magic_word;
Packit 1f69a5
Packit 1f69a5
  /* read 'name' of subtitle */
Packit 1f69a5
  name_length = GST_READ_UINT32_LE (map.data + 5 + 2);
Packit 1f69a5
  GST_LOG_OBJECT (sub, "length of name: %u", name_length);
Packit 1f69a5
  if (map.size <= 17 + name_length)
Packit 1f69a5
    goto wrong_name_length;
Packit 1f69a5
Packit 1f69a5
  name_utf8 =
Packit 1f69a5
      g_convert ((gchar *) map.data + 11, name_length, "UTF-8", "UTF-16LE",
Packit 1f69a5
      NULL, NULL, NULL);
Packit 1f69a5
Packit 1f69a5
  if (name_utf8) {
Packit 1f69a5
    GST_LOG_OBJECT (sub, "subtitle name: %s", name_utf8);
Packit 1f69a5
    gst_avi_subtitle_title_tag (sub, name_utf8);
Packit 1f69a5
    g_free (name_utf8);
Packit 1f69a5
  }
Packit 1f69a5
Packit 1f69a5
  /* next word must be 4 */
Packit 1f69a5
  if (GST_READ_UINT16_LE (map.data + 11 + name_length) != 0x4)
Packit 1f69a5
    goto wrong_fixed_word_2;
Packit 1f69a5
Packit 1f69a5
  file_length = GST_READ_UINT32_LE (map.data + 13 + name_length);
Packit 1f69a5
  GST_LOG_OBJECT (sub, "length srt/ssa file: %u", file_length);
Packit 1f69a5
Packit 1f69a5
  if (map.size < (17 + name_length + file_length))
Packit 1f69a5
    goto wrong_total_length;
Packit 1f69a5
Packit 1f69a5
  /* store this, so we can send it again after a seek; note that we shouldn't
Packit 1f69a5
   * assume all the remaining data in the chunk is subtitle data, there may
Packit 1f69a5
   * be padding at the end for some reason, so only parse file_length bytes */
Packit 1f69a5
  sub->subfile =
Packit 1f69a5
      gst_avi_subtitle_extract_file (sub, buf, 17 + name_length, file_length);
Packit 1f69a5
Packit 1f69a5
  if (sub->subfile == NULL)
Packit 1f69a5
    goto extract_failed;
Packit 1f69a5
Packit 1f69a5
  gst_buffer_unmap (buf, &map);
Packit 1f69a5
Packit 1f69a5
  return GST_FLOW_OK;
Packit 1f69a5
Packit 1f69a5
  /* ERRORS */
Packit 1f69a5
wrong_magic_word:
Packit 1f69a5
  {
Packit 1f69a5
    GST_ELEMENT_ERROR (sub, STREAM, DECODE, (NULL), ("Wrong magic word"));
Packit 1f69a5
    gst_buffer_unmap (buf, &map);
Packit 1f69a5
    return GST_FLOW_ERROR;
Packit 1f69a5
  }
Packit 1f69a5
wrong_name_length:
Packit 1f69a5
  {
Packit 1f69a5
    GST_ELEMENT_ERROR (sub, STREAM, DECODE, (NULL),
Packit 1f69a5
        ("name doesn't fit in buffer (%" G_GSIZE_FORMAT " < %d)", map.size,
Packit 1f69a5
            17 + name_length));
Packit 1f69a5
    gst_buffer_unmap (buf, &map);
Packit 1f69a5
    return GST_FLOW_ERROR;
Packit 1f69a5
  }
Packit 1f69a5
wrong_fixed_word_2:
Packit 1f69a5
  {
Packit 1f69a5
    GST_ELEMENT_ERROR (sub, STREAM, DECODE, (NULL),
Packit 1f69a5
        ("wrong fixed word: expected %u, got %u", 4,
Packit 1f69a5
            GST_READ_UINT16_LE (map.data + 11 + name_length)));
Packit 1f69a5
    gst_buffer_unmap (buf, &map);
Packit 1f69a5
    return GST_FLOW_ERROR;
Packit 1f69a5
  }
Packit 1f69a5
wrong_total_length:
Packit 1f69a5
  {
Packit 1f69a5
    GST_ELEMENT_ERROR (sub, STREAM, DECODE, (NULL),
Packit 1f69a5
        ("buffer size is wrong: need %d bytes, have %" G_GSIZE_FORMAT " bytes",
Packit 1f69a5
            17 + name_length + file_length, map.size));
Packit 1f69a5
    gst_buffer_unmap (buf, &map);
Packit 1f69a5
    return GST_FLOW_ERROR;
Packit 1f69a5
  }
Packit 1f69a5
extract_failed:
Packit 1f69a5
  {
Packit 1f69a5
    GST_ELEMENT_ERROR (sub, STREAM, DECODE, (NULL),
Packit 1f69a5
        ("could not extract subtitles"));
Packit 1f69a5
    gst_buffer_unmap (buf, &map);
Packit 1f69a5
    return GST_FLOW_ERROR;
Packit 1f69a5
  }
Packit 1f69a5
}
Packit 1f69a5
Packit 1f69a5
static GstFlowReturn
Packit 1f69a5
gst_avi_subtitle_chain (GstPad * pad, GstObject * parent, GstBuffer * buffer)
Packit 1f69a5
{
Packit 1f69a5
  GstAviSubtitle *sub = GST_AVI_SUBTITLE (parent);
Packit 1f69a5
  GstFlowReturn ret;
Packit 1f69a5
Packit 1f69a5
  if (sub->subfile != NULL) {
Packit 1f69a5
    GST_WARNING_OBJECT (sub, "Got more buffers than expected, dropping");
Packit 1f69a5
    ret = GST_FLOW_EOS;
Packit 1f69a5
    goto done;
Packit 1f69a5
  }
Packit 1f69a5
Packit 1f69a5
  /* we expect exactly one buffer with the whole srt/ssa file in it */
Packit 1f69a5
  ret = gst_avi_subtitle_parse_gab2_chunk (sub, buffer);
Packit 1f69a5
  if (ret != GST_FLOW_OK)
Packit 1f69a5
    goto done;
Packit 1f69a5
Packit 1f69a5
  /* now push the subtitle data downstream */
Packit 1f69a5
  ret = gst_pad_push (sub->src, gst_buffer_ref (sub->subfile));
Packit 1f69a5
Packit 1f69a5
done:
Packit 1f69a5
Packit 1f69a5
  gst_buffer_unref (buffer);
Packit 1f69a5
  return ret;
Packit 1f69a5
}
Packit 1f69a5
Packit 1f69a5
static gboolean
Packit 1f69a5
gst_avi_subtitle_send_event (GstElement * element, GstEvent * event)
Packit 1f69a5
{
Packit 1f69a5
  GstAviSubtitle *avisubtitle = GST_AVI_SUBTITLE (element);
Packit 1f69a5
  gboolean ret = FALSE;
Packit 1f69a5
Packit 1f69a5
  if (GST_EVENT_TYPE (event) == GST_EVENT_SEEK) {
Packit 1f69a5
    if (avisubtitle->subfile) {
Packit 1f69a5
      if (gst_pad_push (avisubtitle->src,
Packit 1f69a5
              gst_buffer_ref (avisubtitle->subfile)) == GST_FLOW_OK)
Packit 1f69a5
        ret = TRUE;
Packit 1f69a5
    }
Packit 1f69a5
  }
Packit 1f69a5
  gst_event_unref (event);
Packit 1f69a5
  return ret;
Packit 1f69a5
}
Packit 1f69a5
Packit 1f69a5
static void
Packit 1f69a5
gst_avi_subtitle_class_init (GstAviSubtitleClass * klass)
Packit 1f69a5
{
Packit 1f69a5
  GstElementClass *gstelement_class = (GstElementClass *) klass;
Packit 1f69a5
Packit 1f69a5
  GST_DEBUG_CATEGORY_INIT (avisubtitle_debug, "avisubtitle", 0,
Packit 1f69a5
      "parse avi subtitle stream");
Packit 1f69a5
Packit 1f69a5
  gstelement_class->change_state =
Packit 1f69a5
      GST_DEBUG_FUNCPTR (gst_avi_subtitle_change_state);
Packit 1f69a5
  gstelement_class->send_event =
Packit 1f69a5
      GST_DEBUG_FUNCPTR (gst_avi_subtitle_send_event);
Packit 1f69a5
Packit 1f69a5
  gst_element_class_add_static_pad_template (gstelement_class, &sink_template);
Packit 1f69a5
  gst_element_class_add_static_pad_template (gstelement_class, &src_template);
Packit 1f69a5
Packit 1f69a5
  gst_element_class_set_static_metadata (gstelement_class,
Packit 1f69a5
      "Avi subtitle parser", "Codec/Parser/Subtitle",
Packit 1f69a5
      "Parse avi subtitle stream", "Thijs Vermeir <thijsvermeir@gmail.com>");
Packit 1f69a5
}
Packit 1f69a5
Packit 1f69a5
static void
Packit 1f69a5
gst_avi_subtitle_init (GstAviSubtitle * self)
Packit 1f69a5
{
Packit 1f69a5
  GstCaps *caps;
Packit 1f69a5
Packit 1f69a5
  self->src = gst_pad_new_from_static_template (&src_template, "src");
Packit 1f69a5
  gst_element_add_pad (GST_ELEMENT (self), self->src);
Packit 1f69a5
Packit 1f69a5
  self->sink = gst_pad_new_from_static_template (&sink_template, "sink");
Packit 1f69a5
  gst_pad_set_chain_function (self->sink,
Packit 1f69a5
      GST_DEBUG_FUNCPTR (gst_avi_subtitle_chain));
Packit 1f69a5
Packit 1f69a5
  caps = gst_static_pad_template_get_caps (&src_template);
Packit 1f69a5
  gst_pad_set_caps (self->src, caps);
Packit 1f69a5
  gst_caps_unref (caps);
Packit 1f69a5
Packit 1f69a5
  gst_pad_use_fixed_caps (self->src);
Packit 1f69a5
  gst_element_add_pad (GST_ELEMENT (self), self->sink);
Packit 1f69a5
Packit 1f69a5
  self->subfile = NULL;
Packit 1f69a5
}
Packit 1f69a5
Packit 1f69a5
static GstStateChangeReturn
Packit 1f69a5
gst_avi_subtitle_change_state (GstElement * element, GstStateChange transition)
Packit 1f69a5
{
Packit 1f69a5
  GstStateChangeReturn ret;
Packit 1f69a5
  GstAviSubtitle *sub = GST_AVI_SUBTITLE (element);
Packit 1f69a5
Packit 1f69a5
  switch (transition) {
Packit 1f69a5
    case GST_STATE_CHANGE_NULL_TO_READY:
Packit 1f69a5
    case GST_STATE_CHANGE_READY_TO_PAUSED:
Packit 1f69a5
    default:
Packit 1f69a5
      break;
Packit 1f69a5
  }
Packit 1f69a5
Packit 1f69a5
  ret = GST_ELEMENT_CLASS (parent_class)->change_state (element, transition);
Packit 1f69a5
  if (ret == GST_STATE_CHANGE_FAILURE)
Packit 1f69a5
    return ret;
Packit 1f69a5
Packit 1f69a5
  switch (transition) {
Packit 1f69a5
    case GST_STATE_CHANGE_PAUSED_TO_READY:
Packit 1f69a5
      if (sub->subfile) {
Packit 1f69a5
        gst_buffer_unref (sub->subfile);
Packit 1f69a5
        sub->subfile = NULL;
Packit 1f69a5
      }
Packit 1f69a5
      break;
Packit 1f69a5
    default:
Packit 1f69a5
      break;
Packit 1f69a5
  }
Packit 1f69a5
Packit 1f69a5
  return ret;
Packit 1f69a5
}