id3vx

author: Christian Grothoff <christian@grothoff.org> 2009-12-20 00:06:45 +0000
committer: Christian Grothoff <christian@grothoff.org> 2009-12-20 00:06:45 +0000
commit: 949dae1583254b789e3dafe569e030140a621846 (patch)
tree: a6e356030fcb030bd88d96b74d7aa62e1dd5aeb7
parent: 73b50507dba0570f2182f21f8b1c27a95886e4e7 (diff)
download: libextractor-949dae1583254b789e3dafe569e030140a621846.tar.gz
libextractor-949dae1583254b789e3dafe569e030140a621846.zip
10 files changed, 609 insertions, 209 deletions
diff --git a/TODO b/TODO
index cc8c6eb..12b473b 100644
--- a/TODO
+++ b/TODO
@@ -17,12 +17,12 @@ Core:
 Incomplete code (missing features):
 * RIFF (idx1 attribute)
-* IDv2{3,4} (some attributes, make testcases in test/id3v2/ work)
 * StarOffice sdw (some attributes, see doc/)
 * man pages (interpret sections for authors, brief description)
 * pdf: full-text extraction!
 * EXIV2
 * ELF: 64-bit support, lists of architectures, OSes, etc. are incomplete
+* ID3v2x: unsynchronization support, (de)compression support, footer support (v2.4 only)
 Desirable missing formats:
 * mbox / various e-mail formats
diff --git a/src/include/extractor.h b/src/include/extractor.h
index 9c4ae60..ffebd5c 100644
--- a/src/include/extractor.h
+++ b/src/include/extractor.h
@@ -280,8 +280,8 @@ enum EXTRACTOR_MetaType
    EXTRACTOR_METATYPE_PRODUCT_VERSION = 148,
    EXTRACTOR_METATYPE_CONTRIBUTOR_NAME = 149,
    EXTRACTOR_METATYPE_MOVIE_DIRECTOR = 150,
-    EXTRACTOR_METATYPE_TV_NETWORK_NAME = 151,
+    EXTRACTOR_METATYPE_NETWORK_NAME = 151,
-    EXTRACTOR_METATYPE_TV_SHOW_NAME = 152,
+    EXTRACTOR_METATYPE_SHOW_NAME = 152,
    EXTRACTOR_METATYPE_CHAPTER_NAME = 153,
    EXTRACTOR_METATYPE_SONG_COUNT = 154,
    EXTRACTOR_METATYPE_STARTING_SONG = 155,
@@ -295,13 +295,17 @@ enum EXTRACTOR_MetaType
    EXTRACTOR_METATYPE_ORIGINAL_ARTIST = 163,
    EXTRACTOR_METATYPE_ORIGINAL_WRITER = 164,
    EXTRACTOR_METATYPE_ORIGINAL_RELEASE_YEAR = 165,
-    EXTRACTOR_METATYPE_LYRICS = 166,
+    EXTRACTOR_METATYPE_ORIGINAL_PERFORMER = 166,
-    EXTRACTOR_METATYPE_POPULARITY_METER = 167,
+    EXTRACTOR_METATYPE_LYRICS = 167,
+    EXTRACTOR_METATYPE_POPULARITY_METER = 168,
+    EXTRACTOR_METATYPE_LICENSEE = 169,
+    EXTRACTOR_METATYPE_MUSICIAN_CREDITS_LIST = 170,
+    EXTRACTOR_METATYPE_MOOD = 171, 
+    EXTRACTOR_METATYPE_SUBTITLE = 172, 
    /* fixme: used up to here! */
    EXTRACTOR_METATYPE_MUSIC_CD_IDENTIFIER = 117,
-    EXTRACTOR_METATYPE_MUSICIAN_CREDITS_LIST = 123,
    
    EXTRACTOR_METATYPE_SCALE = 108,
@@ -342,7 +346,6 @@ enum EXTRACTOR_MetaType
    EXTRACTOR_METATYPE_FULL_NAME = 113,
    EXTRACTOR_METATYPE_LINK = 116,
    EXTRACTOR_METATYPE_TIME = 122,
-    EXTRACTOR_METATYPE_MOOD = 124, 
    EXTRACTOR_METATYPE_TELEVISION_SYSTEM = 126,
    EXTRACTOR_METATYPE_HARDWARE_DEPENDENCY = 129,
    EXTRACTOR_METATYPE_RIPPER = 130,
diff --git a/src/main/extractor_metatypes.c b/src/main/extractor_metatypes.c
index b98a395..c97fc3e 100644
--- a/src/main/extractor_metatypes.c
+++ b/src/main/extractor_metatypes.c
@@ -369,10 +369,10 @@ static const struct MetaTypeDescription meta_type_descriptions[] = {
  /* 150 */
  { gettext_noop ("movie director"),
    gettext_noop ("name of the director") }, 
-  { gettext_noop ("TV network"),
+  { gettext_noop ("network"),
-    gettext_noop ("name of the broadcasting TV network") }, 
+    gettext_noop ("name of the broadcasting network or station") }, 
-  { gettext_noop ("TV show"),
+  { gettext_noop ("show"),
-    gettext_noop ("name of the TV show") }, 
+    gettext_noop ("name of the show") }, 
  { gettext_noop ("chapter name"),
    gettext_noop ("name of the chapter") }, 
  { gettext_noop ("song count"),
@@ -402,10 +402,23 @@ static const struct MetaTypeDescription meta_type_descriptions[] = {
  /* 165 */
  { gettext_noop ("original release year"),
    gettext_noop ("year of the original release") }, 
+  { gettext_noop ("original performer"),
+    gettext_noop ("name of the original performer") }, 
  { gettext_noop ("lyrics"),
    gettext_noop ("lyrics of the song or text description of vocal activities") }, 
  { gettext_noop ("popularity"),
    gettext_noop ("information about the file's popularity") }, 
+  { gettext_noop ("licensee"),
+    gettext_noop ("name of the owner or licensee of the file") }, 
+  /* 170 */
+  { gettext_noop ("musician credit list"),
+    gettext_noop ("names of contributing musicians") }, 
+  { gettext_noop ("mood"),
+    gettext_noop ("keywords reflecting the mood of the piece") }, 
+  { gettext_noop ("subtitle"),
+    gettext_noop ("subtitle of this part") }, 
+  { gettext_noop (""),
+    gettext_noop ("") }, 
  { gettext_noop (""),
    gettext_noop ("") }, 
 #if 0
diff --git a/src/plugins/id3v23_extractor.c b/src/plugins/id3v23_extractor.c
index 71553c2..4ab8116 100644
--- a/src/plugins/id3v23_extractor.c
+++ b/src/plugins/id3v23_extractor.c
@@ -1,6 +1,6 @@
 /*
     This file is part of libextractor.
-     (C) 2002, 2003, 2004, 2006, 2007 Vidyut Samanta and Christian Grothoff
+     (C) 2002, 2003, 2004, 2006, 2007, 2009 Vidyut Samanta and Christian Grothoff
     libextractor is free software; you can redistribute it and/or modify
     it under the terms of the GNU General Public License as published
@@ -35,54 +35,83 @@
 #include "convert.h"
+enum Id3v23Fmt /* payload layout of a frame; selects the decoder in the switch on tmap[i].fmt */
+  {
+    T, /* text: one encoding byte (0x00 ISO-8859-1, 0x01 UCS-2, anything else treated as ISO-8859-1), then the string */
+    U, /* string with no encoding byte; converted as ISO-8859-1 */
+    UL, /* unsync'ed lyrics: encoding byte, 3 further header bytes (presumably the language code), description, then the text */
+    SL, /* sync'ed lyrics: encoding byte plus 5 further header bytes, then the text */
+    L, /* string with language prefix: encoding byte, 3 prefix bytes, then the string */
+    I /* image: one skipped byte, 0-terminated MIME type, picture-type byte, description, then the binary data */
+  };
 typedef struct /* one row of the frame lookup table */
 {
  const char *text; /* frame ID such as "TALB"; NULL marks the terminating row */
  enum EXTRACTOR_MetaType type; /* meta type reported for a frame with this ID */
+  enum Id3v23Fmt fmt; /* payload layout used to decode the frame */
 } Matches;
 static Matches tmap[] = { /* ID3v2.3 frame IDs, the meta type to report and the payload format; terminated by a NULL text entry */
-  {"COMM", EXTRACTOR_METATYPE_COMMENT},
+  {"TALB", EXTRACTOR_METATYPE_ALBUM, T},
-  {"IPLS", EXTRACTOR_METATYPE_CONTRIBUTOR},
+  {"TBPM", EXTRACTOR_METATYPE_BEATS_PER_MINUTE, T},
-  {"LINK", EXTRACTOR_METATYPE_LINK},
+  {"TCOM", EXTRACTOR_METATYPE_COMPOSER, T},
-  {"MCDI", EXTRACTOR_METATYPE_MUSIC_CD_IDENTIFIER},
+  {"TCON", EXTRACTOR_METATYPE_SONG_VERSION, T}, /* NOTE(review): TCON is "content type" (genre) in ID3v2.3 and SONG_VERSION is also used for TIT3 -- confirm this mapping is intended */
-  {"PCNT", EXTRACTOR_METATYPE_PLAY_COUNTER},
+  {"TCOP", EXTRACTOR_METATYPE_COPYRIGHT, T},
-  {"POPM", EXTRACTOR_METATYPE_POPULARITY_METER},
+  /* {"TDAT", EXTRACTOR_METATYPE_CREATION_DATE, T}, */
-  {"TCOP", EXTRACTOR_METATYPE_COPYRIGHT},
+  /* TDLY */
-  {"TDAT", EXTRACTOR_METATYPE_DATE},
+  {"TENC", EXTRACTOR_METATYPE_ENCODED_BY, T},
-  {"TCON", EXTRACTOR_METATYPE_CONTENT_TYPE},
+  {"TEXT", EXTRACTOR_METATYPE_WRITER, T},  
-  {"TIT1", EXTRACTOR_METATYPE_GENRE},
+  {"TFLT", EXTRACTOR_METATYPE_FORMAT_VERSION, T},
-  {"TENC", EXTRACTOR_METATYPE_ENCODED_BY},
+  /* TIME */
-  {"TEXT", EXTRACTOR_METATYPE_LYRICS},
+  {"TIT1", EXTRACTOR_METATYPE_SECTION, T},
-  {"TOLY", EXTRACTOR_METATYPE_CONTRIBUTOR},
+  {"TIT2", EXTRACTOR_METATYPE_TITLE, T},
-  {"TOPE", EXTRACTOR_METATYPE_CONTRIBUTOR},
+  {"TIT3", EXTRACTOR_METATYPE_SONG_VERSION, T},
-  {"TOWN", EXTRACTOR_METATYPE_OWNER},
+  /* TKEY */
-  {"TPE1", EXTRACTOR_METATYPE_ARTIST},
+  {"TLAN", EXTRACTOR_METATYPE_LANGUAGE, T},
-  {"TPE2", EXTRACTOR_METATYPE_ARTIST},
+  {"TLEN", EXTRACTOR_METATYPE_DURATION, T}, /* FIXME: should append 'ms' as unit */
-  {"TPE3", EXTRACTOR_METATYPE_CONDUCTOR},
+  {"TMED", EXTRACTOR_METATYPE_SOURCE, T}, 
-  {"TPE4", EXTRACTOR_METATYPE_INTERPRET},
+  {"TOAL", EXTRACTOR_METATYPE_ORIGINAL_TITLE, T},
-  {"TMED", EXTRACTOR_METATYPE_MEDIA_TYPE},
+  {"TOFN", EXTRACTOR_METATYPE_ORIGINAL_ARTIST, T}, /* NOTE(review): TOFN is "original filename" in ID3v2.3; ORIGINAL_ARTIST looks unintended -- confirm */
-  {"TCOM", EXTRACTOR_METATYPE_CREATOR},
+  {"TOLY", EXTRACTOR_METATYPE_ORIGINAL_WRITER, T},
-  {"TIME", EXTRACTOR_METATYPE_TIME},
+  {"TOPE", EXTRACTOR_METATYPE_ORIGINAL_PERFORMER, T},
-  {"TOFN", EXTRACTOR_METATYPE_FILENAME},
+  {"TORY", EXTRACTOR_METATYPE_ORIGINAL_RELEASE_YEAR, T},
-  {"TOPE", EXTRACTOR_METATYPE_ARTIST},
+  {"TOWN", EXTRACTOR_METATYPE_LICENSEE, T},
-  {"TPUB", EXTRACTOR_METATYPE_PUBLISHER},
+  {"TPE1", EXTRACTOR_METATYPE_ARTIST, T},
-  {"TRCK", EXTRACTOR_METATYPE_TRACK_NUMBER},
+  {"TPE2", EXTRACTOR_METATYPE_PERFORMER, T},
-  {"TRSC", EXTRACTOR_METATYPE_ISRC},
+  {"TPE3", EXTRACTOR_METATYPE_CONDUCTOR, T},
-  {"TRSN", EXTRACTOR_METATYPE_SOURCE},
+  {"TPE4", EXTRACTOR_METATYPE_INTERPRETATION, T}, 
-  {"TRSO", EXTRACTOR_METATYPE_CREATED_FOR},
+  {"TPOS", EXTRACTOR_METATYPE_DISC_NUMBER, T},
-  {"TSRC", EXTRACTOR_METATYPE_RESOURCE_IDENTIFIER},
+  {"TPUB", EXTRACTOR_METATYPE_PUBLISHER, T},
-  {"TOAL", EXTRACTOR_METATYPE_ALBUM},
+  {"TRCK", EXTRACTOR_METATYPE_TRACK_NUMBER, T},
-  {"TALB", EXTRACTOR_METATYPE_ALBUM},
+  /* TRDA */
-  {"TLAN", EXTRACTOR_METATYPE_LANGUAGE},
+  {"TRSN", EXTRACTOR_METATYPE_NETWORK_NAME, T},
-  {"TYER", EXTRACTOR_METATYPE_YEAR},
+  /* TRSO */
-  {"TLEN", EXTRACTOR_METATYPE_DURATION},
+  {"TSIZ", EXTRACTOR_METATYPE_EMBEDDED_FILE_SIZE, T},
-  {"TIT2", EXTRACTOR_METATYPE_TITLE},
+  {"TSRC", EXTRACTOR_METATYPE_ISRC, T},
-  {"TIT3", EXTRACTOR_METATYPE_DESCRIPTION},
+  /* TSSE */
-  {"WCOM", EXTRACTOR_METATYPE_RELEASE},
+  {"TYER", EXTRACTOR_METATYPE_PUBLICATION_YEAR, T},
-  {"WCOP", EXTRACTOR_METATYPE_DISCLAIMER},
+  {"WCOM", EXTRACTOR_METATYPE_URL, U},
-  {"", EXTRACTOR_METATYPE_KEYWORDS},
+  {"WCOP", EXTRACTOR_METATYPE_URL, U},
-  {NULL, 0}
+  {"WOAF", EXTRACTOR_METATYPE_URL, U},
+  {"WOAS", EXTRACTOR_METATYPE_URL, U},
+  {"WORS", EXTRACTOR_METATYPE_URL, U},
+  {"WPAY", EXTRACTOR_METATYPE_URL, U},
+  {"WPUB", EXTRACTOR_METATYPE_URL, U},
+  {"WXXX", EXTRACTOR_METATYPE_URL, T}, /* NOTE(review): WXXX carries encoding + description + NUL + URL; fmt T starts decoding at the description -- confirm the URL is what gets reported */
+  {"IPLS", EXTRACTOR_METATYPE_CONTRIBUTOR_NAME, T},
+  /* ... */
+  {"USLT", EXTRACTOR_METATYPE_LYRICS, UL },
+  {"SYLT", EXTRACTOR_METATYPE_LYRICS, SL },
+  {"COMM", EXTRACTOR_METATYPE_COMMENT, L},
+  /* ... */
+  {"APIC", EXTRACTOR_METATYPE_PICTURE, I},
+  /* ... */
+  {"LINK", EXTRACTOR_METATYPE_URL, U},
+  /* ... */
+  {"USER", EXTRACTOR_METATYPE_LICENSE, T}, /* NOTE(review): USER has a 3-byte language code after the encoding byte; fmt T would decode it as part of the text -- confirm */
+  /* ... */
+  {NULL, 0, T} /* terminator: text == NULL */
 };
@@ -104,6 +133,9 @@ EXTRACTOR_id3v23_extract (const unsigned char *data,
  uint32_t csize;
  int i;
  uint16_t flags;
+  char *mime;
+  enum EXTRACTOR_MetaType type;
+  size_t off;
  if ((size < 16) ||
      (data[0] != 0x49) ||
@@ -111,12 +143,16 @@ EXTRACTOR_id3v23_extract (const unsigned char *data,
      (data[2] != 0x33) || (data[3] != 0x03) || (data[4] != 0x00))
    return 0;
  unsync = (data[5] & 0x80) > 0;
+  if (unsync)
+    return 0; /* not supported */
  extendedHdr = (data[5] & 0x40) > 0;
  experimental = (data[5] & 0x20) > 0;
+  if (experimental)
+    return 0;
  tsize = (((data[6] & 0x7F) << 21) |
           ((data[7] & 0x7F) << 14) |
           ((data[8] & 0x7F) << 7) | ((data[9] & 0x7F) << 0));
-  if ((tsize + 10 > size) || (experimental))
+  if (tsize + 10 > size)
    return 0;
  pos = 10;
  padding = 0;
@@ -142,7 +178,8 @@ EXTRACTOR_id3v23_extract (const unsigned char *data,
      csize =
        (data[pos + 4] << 24) + (data[pos + 5] << 16) + (data[pos + 6] << 8) +
        data[pos + 7];
-      if ((pos + 10 + csize > tsize) || (csize > tsize) || (csize == 0))
+      if ((pos + 10 + csize > tsize) || (csize > tsize) || (csize == 0) ||
+          (pos + 10 + csize <= pos + 10) || (pos + 10 <= pos))
        break;
      flags = (data[pos + 8] << 8) + data[pos + 9];
      if (((flags & 0x80) > 0) /* compressed, not yet supported */  ||
@@ -163,32 +200,191 @@ EXTRACTOR_id3v23_extract (const unsigned char *data,
                  pos++;
                  csize--;
                }
-              csize--;
+              switch (tmap[i].fmt)
-              /* this byte describes the encoding
+                {
-                 try to convert strings to UTF-8
+                case T:
-                 if it fails, then forget it */
+                  /* this byte describes the encoding
-              switch (data[pos + 10])
+                     try to convert strings to UTF-8
-                {
+                     if it fails, then forget it */
-                case 0x00:
+                  switch (data[pos + 10])
-                  word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 11],
+                    {
-                                        csize, "ISO-8859-1");
+                    case 0x00:
-                  break;
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 11],
-                case 0x01:
+                                                               csize - 1, "ISO-8859-1");
-                  word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 11],
+                      break;
-                                        csize, "UCS-2");
+                    case 0x01:
-                  break;
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 11],
-                default:
+                                                               csize - 1, "UCS-2");
-                  /* bad encoding byte,
+                      break;
-                     try to convert from iso-8859-1 */
+                    default:
-                  word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 11],
+                      /* bad encoding byte,
-                                        csize, "ISO-8859-1");
+                         try to convert from iso-8859-1 */
-                  break;
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 11],
-                }
+                                                               csize - 1, "ISO-8859-1");
-              pos++;
+                      break;
+                    }
+                  break;
+                case U:
+                  word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 10],
+                                                           csize, "ISO-8859-1");
+                  break;
+                case UL:
+                  if (csize < 6)
+                    return 0; /* malformed */
+                  /* find end of description */
+                  off = 14;
+                  while ( (off < size) &&
+                          (off - pos < csize) &&
+                          (data[pos + off] == '\0') )
+                    off++;
+                  if ( (off >= csize) ||
+                       (data[pos+off] != '\0') )
+                    return 0; /* malformed */
+                  off++;
+                  switch (data[pos + 10])
+                    {
+                    case 0x00:
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + off],
+                                                               csize - off, "ISO-8859-1");
+                      break;
+                    case 0x01:
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + off],
+                                                               csize - off, "UCS-2");
+                      break;
+                    default:
+                      /* bad encoding byte,
+                         try to convert from iso-8859-1 */
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + off],
+                                                               csize - off, "ISO-8859-1");
+                      break;
+                    }
+                  break;
+                case SL:
+                  if (csize < 7)
+                    return 0; /* malformed */
+                  /* find end of description */
+                  switch (data[pos + 10])
+                    {
+                    case 0x00:
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 16],
+                                                               csize - 6, "ISO-8859-1");
+                      break;
+                    case 0x01:
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 16],
+                                                               csize - 6, "UCS-2");
+                      break;
+                    default:
+                      /* bad encoding byte,
+                         try to convert from iso-8859-1 */
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 16],
+                                                               csize - 6, "ISO-8859-1");
+                      break;
+                    }
+                  break;
+                case L:
+                  if (csize < 5)
+                    return 0; /* malformed */
+                  /* find end of description */
+                  switch (data[pos + 10])
+                    {
+                    case 0x00:
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 14],
+                                                               csize - 4, "ISO-8859-1");
+                      break;
+                    case 0x01:
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 14],
+                                                               csize - 4, "UCS-2");
+                      break;
+                    default:
+                      /* bad encoding byte,
+                         try to convert from iso-8859-1 */
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 14],
+                                                               csize - 4, "ISO-8859-1");
+                      break;
+                    }
+                  break;
+                case I:
+                  if (csize < 2)
+                    return 0; /* malformed */
+                  /* find end of mime type */
+                  off = 11;
+                  while ( (off < size) &&
+                          (off - pos < csize) &&
+                          (data[pos + off] == '\0') )
+                    off++;
+                  if ( (off >= csize) ||
+                       (data[pos+off] != '\0') )
+                    return 0; /* malformed */
+                  off++;
+                  mime = strdup ((const char*) &data[pos + 11]);
+                  
+                  switch (data[pos+off])
+                    {
+                    case 0x03:
+                    case 0x04:
+                      type = EXTRACTOR_METATYPE_COVER_PICTURE;
+                      break;
+                    case 0x07:
+                    case 0x08:
+                    case 0x09:
+                    case 0x0A:
+                    case 0x0B:
+                    case 0x0C:
+                      type = EXTRACTOR_METATYPE_CONTRIBUTOR_PICTURE;
+                      break;
+                    case 0x0D:
+                    case 0x0E:
+                    case 0x0F:
+                      type = EXTRACTOR_METATYPE_EVENT_PICTURE;
+                      break;
+                    case 0x14:
+                      type = EXTRACTOR_METATYPE_LOGO;
+                      type = EXTRACTOR_METATYPE_LOGO;
+                      break;
+                    default:
+                      type = EXTRACTOR_METATYPE_PICTURE;
+                      break;
+                    }
+                  off++;
+                  /* find end of description */
+                  while ( (off < size) &&
+                          (off - pos < csize) &&
+                          (data[pos + off] == '\0') )
+                    off++;
+                  if ( (off >= csize) ||
+                       (data[pos+off] != '\0') )
+                    return 0; /* malformed */
+                  off++;
+                  if (0 == strcasecmp ("-->",
+                                       mime))
+                    {
+                      /* not supported */
+                    }
+                  else
+                    {
+                      if (0 != proc (proc_cls,
+                                     "id3v23",
+                                     type,
+                                     EXTRACTOR_METAFORMAT_BINARY,
+                                     mime,
+                                     (const char*) &data[pos + off],
+                                     csize + 6 - off))                  
+                        {
+                          free (mime);
+                          return 1;
+                        }
+                    }
+                  free (mime);
+                  word = NULL;
+                  break;
+                default:
+                  return 0;
+                }             
              if ((word != NULL) && (strlen (word) > 0))
                {
                  if (0 != proc (proc_cls,
-                                 "id3v2",
+                                 "id3v23",
                                 tmap[i].type,
                                 EXTRACTOR_METAFORMAT_UTF8,
                                 "text/plain",
diff --git a/src/plugins/id3v24_extractor.c b/src/plugins/id3v24_extractor.c
index ec11e4a..acc76af 100644
--- a/src/plugins/id3v24_extractor.c
+++ b/src/plugins/id3v24_extractor.c
@@ -1,6 +1,6 @@
 /*
     This file is part of libextractor.
-     (C) 2002, 2003, 2004, 2006, 2009 Vidyut Samanta and Christian Grothoff
+     (C) 2002, 2003, 2004, 2006, 2007, 2009 Vidyut Samanta and Christian Grothoff
     libextractor is free software; you can redistribute it and/or modify
     it under the terms of the GNU General Public License as published
@@ -18,7 +18,6 @@
     Boston, MA 02111-1307, USA.
 */
 #define DEBUG_EXTRACT_ID3v24 0
 #include "platform.h"
@@ -33,72 +32,98 @@
 #ifndef MINGW
 #include <sys/mman.h>
 #endif
 #include "convert.h"
+enum Id3v24Fmt /* payload layout of a frame; selects the decoder in the switch on tmap[i].fmt */
-static struct EXTRACTOR_Keywords *
+  {
-addKeyword (EXTRACTOR_KeywordList * oldhead,
+    T, /* simple, 0-terminated string, prefixed by one encoding byte that picks the source charset */
-            char *phrase, EXTRACTOR_KeywordType type)
+    U, /* 0-terminated ASCII string, no encoding */
-{
+    UL, /* unsync'ed lyrics */
-  EXTRACTOR_KeywordList *keyword;
+    SL, /* sync'ed lyrics */
+    L, /* string with language prefix */
-  keyword = malloc (sizeof (EXTRACTOR_KeywordList));
+    I /* image */
-  keyword->next = oldhead;
+  };
-  keyword->keyword = phrase;
-  keyword->keywordType = type;
-  return keyword;
-}
 typedef struct /* one row of the frame lookup table */
 {
-  char *text;
+  const char *text; /* frame ID such as "TALB", compared against the 4 bytes at the frame start; NULL marks the terminating row */
  enum EXTRACTOR_MetaType type; /* meta type associated with this frame ID */
+  enum Id3v24Fmt fmt; /* payload layout used to decode the frame */
 } Matches;
 static Matches tmap[] = { /* ID3v2.4 frame IDs, the meta type to report and the payload format; terminated by a NULL text entry */
-  {"COMM", EXTRACTOR_METATYPE_COMMENT},
+  {"TALB", EXTRACTOR_METATYPE_ALBUM, T},
-  {"IPLS", EXTRACTOR_METATYPE_CONTRIBUTOR},
+  {"TBPM", EXTRACTOR_METATYPE_BEATS_PER_MINUTE, T},
-  {"TIPL", EXTRACTOR_METATYPE_CONTRIBUTOR},
+  {"TCOM", EXTRACTOR_METATYPE_COMPOSER, T},
-  {"TMOO", EXTRACTOR_METATYPE_MOOD},
+  {"TCON", EXTRACTOR_METATYPE_SONG_VERSION, T}, /* NOTE(review): TCON is "content type" (genre) in ID3v2 and SONG_VERSION is also used for TIT3 -- confirm this mapping is intended */
-  {"TMCL", EXTRACTOR_METATYPE_MUSICIAN_CREDITS_LIST},
+  {"TCOP", EXTRACTOR_METATYPE_COPYRIGHT, T},
-  {"LINK", EXTRACTOR_METATYPE_LINK},
+  /* {"TDAT", EXTRACTOR_METATYPE_CREATION_DATE, T}, deprecated in 24 */
-  {"MCDI", EXTRACTOR_METATYPE_MUSIC_CD_IDENTIFIER},
+  /* TDLY */
-  {"PCNT", EXTRACTOR_METATYPE_PLAY_COUNTER},
+  {"TENC", EXTRACTOR_METATYPE_ENCODED_BY, T},
-  {"POPM", EXTRACTOR_METATYPE_POPULARITY_METER},
+  {"TEXT", EXTRACTOR_METATYPE_WRITER, T},  
-  {"TCOP", EXTRACTOR_METATYPE_COPYRIGHT},
+  {"TFLT", EXTRACTOR_METATYPE_FORMAT_VERSION, T},
-  {"TDRC", EXTRACTOR_METATYPE_DATE},
+  /* TIME, deprecated in 24 */
-  {"TCON", EXTRACTOR_METATYPE_GENRE},
+  {"TIT1", EXTRACTOR_METATYPE_SECTION, T},
-  {"TIT1", EXTRACTOR_METATYPE_GENRE},
+  {"TIT2", EXTRACTOR_METATYPE_TITLE, T},
-  {"TENC", EXTRACTOR_METATYPE_ENCODED_BY},
+  {"TIT3", EXTRACTOR_METATYPE_SONG_VERSION, T},
-  {"TEXT", EXTRACTOR_METATYPE_LYRICS},
+  /* TKEY */
-  {"TOLY", EXTRACTOR_METATYPE_CONTRIBUTOR},
+  {"TLAN", EXTRACTOR_METATYPE_LANGUAGE, T},
-  {"TOPE", EXTRACTOR_METATYPE_CONTRIBUTOR},
+  {"TLEN", EXTRACTOR_METATYPE_DURATION, T}, /* FIXME: should append 'ms' as unit */
-  {"TOWN", EXTRACTOR_METATYPE_OWNER},
+  {"TMED", EXTRACTOR_METATYPE_SOURCE, T}, 
-  {"TPE1", EXTRACTOR_METATYPE_ARTIST},
+  {"TOAL", EXTRACTOR_METATYPE_ORIGINAL_TITLE, T},
-  {"TPE2", EXTRACTOR_METATYPE_ARTIST},
+  {"TOFN", EXTRACTOR_METATYPE_ORIGINAL_ARTIST, T}, /* NOTE(review): TOFN is "original filename" in ID3v2; ORIGINAL_ARTIST looks unintended -- confirm */
-  {"TPE3", EXTRACTOR_METATYPE_CONDUCTOR},
+  {"TOLY", EXTRACTOR_METATYPE_ORIGINAL_WRITER, T},
-  {"TPE4", EXTRACTOR_METATYPE_INTERPRET},
+  {"TOPE", EXTRACTOR_METATYPE_ORIGINAL_PERFORMER, T},
-  {"TIME", EXTRACTOR_METATYPE_TIME},
+  /* {"TORY", EXTRACTOR_METATYPE_ORIGINAL_RELEASE_YEAR, T}, deprecated in 24 */
-  {"TMED", EXTRACTOR_METATYPE_MEDIA_TYPE},
+  {"TOWN", EXTRACTOR_METATYPE_LICENSEE, T},
-  {"TCOM", EXTRACTOR_METATYPE_CREATOR},
+  {"TPE1", EXTRACTOR_METATYPE_ARTIST, T},
-  {"TOFN", EXTRACTOR_METATYPE_FILENAME},
+  {"TPE2", EXTRACTOR_METATYPE_PERFORMER, T},
-  {"TOPE", EXTRACTOR_METATYPE_ARTIST},
+  {"TPE3", EXTRACTOR_METATYPE_CONDUCTOR, T},
-  {"TPUB", EXTRACTOR_METATYPE_PUBLISHER},
+  {"TPE4", EXTRACTOR_METATYPE_INTERPRETATION, T}, 
-  {"TRCK", EXTRACTOR_METATYPE_TRACK_NUMBER},
+  {"TPOS", EXTRACTOR_METATYPE_DISC_NUMBER, T},
-  {"TRSC", EXTRACTOR_METATYPE_ISRC},
+  {"TPUB", EXTRACTOR_METATYPE_PUBLISHER, T},
-  {"TRSN", EXTRACTOR_METATYPE_SOURCE},
+  {"TRCK", EXTRACTOR_METATYPE_TRACK_NUMBER, T},
-  {"TRSO", EXTRACTOR_METATYPE_CREATED_FOR},
+  /* TRDA, deprecated in 24 */
-  {"TSRC", EXTRACTOR_METATYPE_RESOURCE_IDENTIFIER},
+  {"TRSN", EXTRACTOR_METATYPE_NETWORK_NAME, T},
-  {"TYER", EXTRACTOR_METATYPE_YEAR},
+  /* TRSO */
-  {"TOAL", EXTRACTOR_METATYPE_ALBUM},
+  /* {"TSIZ", EXTRACTOR_METATYPE_EMBEDDED_FILE_SIZE, T}, deprecated in 24 */
-  {"TALB", EXTRACTOR_METATYPE_ALBUM},
+  {"TSRC", EXTRACTOR_METATYPE_ISRC, T},
-  {"TLAN", EXTRACTOR_METATYPE_LANGUAGE},
+  /* TSSE */
-  {"TIT2", EXTRACTOR_METATYPE_TITLE},
+  /* {"TYER", EXTRACTOR_METATYPE_PUBLICATION_YEAR, T}, deprecated in 24 */
-  {"TIT3", EXTRACTOR_METATYPE_DESCRIPTION},
+  {"WCOM", EXTRACTOR_METATYPE_URL, U},
-  {"WCOM", EXTRACTOR_METATYPE_RELEASE},
+  {"WCOP", EXTRACTOR_METATYPE_URL, U},
-  {"WCOP", EXTRACTOR_METATYPE_DISCLAIMER},
+  {"WOAF", EXTRACTOR_METATYPE_URL, U},
-  {"", EXTRACTOR_METATYPE_KEYWORDS},
+  {"WOAS", EXTRACTOR_METATYPE_URL, U},
-  {NULL, 0}
+  {"WORS", EXTRACTOR_METATYPE_URL, U},
+  {"WPAY", EXTRACTOR_METATYPE_URL, U},
+  {"WPUB", EXTRACTOR_METATYPE_URL, U},
+  {"WXXX", EXTRACTOR_METATYPE_URL, T}, /* NOTE(review): WXXX carries encoding + description + NUL + URL per the ID3v2 spec -- confirm fmt T reports the URL and not the description */
+  /* {"IPLS", EXTRACTOR_METATYPE_CONTRIBUTOR_NAME, T}, deprecated in 24 */
+  /* ... */
+  {"USLT", EXTRACTOR_METATYPE_LYRICS, UL },
+  {"SYLT", EXTRACTOR_METATYPE_LYRICS, SL },
+  {"COMM", EXTRACTOR_METATYPE_COMMENT, L},
+  /* ... */
+  {"APIC", EXTRACTOR_METATYPE_PICTURE, I},
+  /* ... */
+  {"LINK", EXTRACTOR_METATYPE_URL, U},
+  /* ... */
+  {"USER", EXTRACTOR_METATYPE_LICENSE, T}, /* NOTE(review): USER has a 3-byte language code after the encoding byte per the ID3v2 spec -- confirm fmt T does not report it as part of the text */
+  /* ... */
+  /* new frames in 24 */
+  /* ASPI, EQU2, RVA2, SEEK, SIGN, TDEN */
+  {"TDOR", EXTRACTOR_METATYPE_PUBLICATION_DATE, T},
+  /* TDRC, TDRL, TDTG */
+  {"TIPL", EXTRACTOR_METATYPE_CONTRIBUTOR_NAME, T},
+  {"TMCL", EXTRACTOR_METATYPE_MUSICIAN_CREDITS_LIST, T},
+  {"TMOO", EXTRACTOR_METATYPE_MOOD, T},
+  {"TPRO", EXTRACTOR_METATYPE_COPYRIGHT, T},
+  {"TSOA", EXTRACTOR_METATYPE_ALBUM, T},
+  {"TSOP", EXTRACTOR_METATYPE_PERFORMER, T},
+  {"TSOT", EXTRACTOR_METATYPE_TITLE, T},
+  {"TSST", EXTRACTOR_METATYPE_SUBTITLE, T},
+  {NULL, 0, T} /* terminator: text == NULL */
 };
@@ -114,54 +139,60 @@ EXTRACTOR_id3v24_extract (const unsigned char *data,
  int extendedHdr;
  int experimental;
  int footer;
-  unsigned int tsize;
+  uint32_t tsize;
-  unsigned int pos;
+  uint32_t pos;
-  unsigned int ehdrSize;
+  uint32_t ehdrSize;
-  unsigned int padding;
+  uint32_t padding;
+  uint32_t csize;
+  int i;
+  uint16_t flags;
+  char *mime;
+  enum EXTRACTOR_MetaType type;
+  size_t off;
  if ((size < 16) ||
      (data[0] != 0x49) ||
      (data[1] != 0x44) ||
      (data[2] != 0x33) || (data[3] != 0x04) || (data[4] != 0x00))
-    return prev;
+    return 0;
  unsync = (data[5] & 0x80) > 0;
+  if (unsync)
+    return 0; /* not supported */
  extendedHdr = (data[5] & 0x40) > 0;
  experimental = (data[5] & 0x20) > 0;
+  if (experimental)
+    return 0;
  footer = (data[5] & 0x10) > 0;
  tsize = (((data[6] & 0x7F) << 21) |
           ((data[7] & 0x7F) << 14) |
           ((data[8] & 0x7F) << 7) | ((data[9] & 0x7F) << 0));
-  if ((tsize + 10 > size) || (experimental))
+  if (tsize + 10 > size)
-    return prev;
+    return 0;
  pos = 10;
  padding = 0;
  if (extendedHdr)
    {
      ehdrSize = (((data[10] & 0x7F) << 21) |
-                  ((data[11] & 0x7F) << 14) |
+                  ((data[11] & 0x7F) << 14) |
-                  ((data[12] & 0x7F) << 7) | ((data[13] & 0x7F) << 0));
+                  ((data[12] & 0x7F) << 7) | ((data[13] & 0x7F) << 0));
-      pos += ehdrSize;
+      pos += 4 + ehdrSize;
+      if (ehdrSize > tsize)
+        return 0;
    }
  while (pos < tsize)
    {
-      size_t csize;
-      int i;
-      unsigned short flags;
      if (pos + 10 > tsize)
-        return prev;
+        return 0;
+      csize =
-      csize = (((data[pos + 4] & 0x7F) << 21) |
+        (data[pos + 4] << 24) + (data[pos + 5] << 16) + (data[pos + 6] << 8) +
-               ((data[pos + 5] & 0x7F) << 14) |
+        data[pos + 7];
-               ((data[pos + 6] & 0x7F) << 7) | ((data[pos + 7] & 0x7F) << 0));
+      if ((pos + 10 + csize > tsize) || (csize > tsize) || (csize == 0) ||
+          (pos + 10 + csize <= pos + 10) || (pos + 10 <= pos))
-      if ((pos + 10 + csize > tsize) || (csize > tsize) || (csize == 0))
        break;
      flags = (data[pos + 8] << 8) + data[pos + 9];
-      if (((flags & 0x80) > 0) /* compressed, not yet supported */  ||
+      if (((flags & 0x08) > 0) /* compressed, not yet supported */  ||
-          ((flags & 0x40) > 0) /* encrypted, not supported */ )
+          ((flags & 0x04) > 0) /* encrypted, not supported */ ||
+          ((flags & 0x02) > 0) /* unsynchronized, not supported */ )
        {
          pos += 10 + csize;
          continue;
@@ -172,59 +203,216 @@ EXTRACTOR_id3v24_extract (const unsigned char *data,
          if (0 == strncmp (tmap[i].text, (const char *) &data[pos], 4))
            {
              char *word;
-              if ((flags & 0x20) > 0)
+              if ((flags & 0x40) > 0)
                {
                  /* "group" identifier, skip a byte */
                  pos++;
                  csize--;
                }
-              /* this byte describes the encoding
+              switch (tmap[i].fmt)
-                 try to convert strings to UTF-8
+                {
-                 if it fails, then forget it */
+                case T:
-              csize--;
+                  /* this byte describes the encoding
-              switch (data[pos + 10])
+                     try to convert strings to UTF-8
-                {
+                     if it fails, then forget it */
-                case 0x00:
+                  switch (data[pos + 10])
-                  word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 11],
+                    {
-                                        csize, "ISO-8859-1");
+                    case 0x00:
-                  break;
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 11],
-                case 0x01:
+                                                               csize - 1, "ISO-8859-1");
-                  word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 11],
+                      break;
-                                        csize, "UTF-16");
+                    case 0x01:
-                  break;
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 11],
-                case 0x02:
+                                                               csize - 1, "UCS-2");
-                  word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 11],
+                      break;
-                                        csize, "UTF-16BE");
+                    default:
-                  break;
+                      /* bad encoding byte,
-                case 0x03:
+                         try to convert from iso-8859-1 */
-                  word = malloc (csize + 1);
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 11],
-                  memcpy (word, &data[pos + 11], csize);
+                                                               csize - 1, "ISO-8859-1");
-                  word[csize] = '\0';
+                      break;
-                  break;
+                    }
-                default:
+                  break;
-                  /* bad encoding byte,
+                case U:
-                     try to convert from iso-8859-1 */
+                  word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 10],
-                  word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 11],
+                                                           csize, "ISO-8859-1");
-                                        csize, "ISO-8859-1");
+                  break;
-                  break;
+                case UL:
-                }
+                  if (csize < 6)
-              pos++;
+                    return 0; /* malformed */
+                  /* find end of description */
+                  off = 14;
+                  while ( (off < size) &&
+                          (off - pos < csize) &&
+                          (data[pos + off] == '\0') )
+                    off++;
+                  if ( (off >= csize) ||
+                       (data[pos+off] != '\0') )
+                    return 0; /* malformed */
+                  off++;
+                  switch (data[pos + 10])
+                    {
+                    case 0x00:
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + off],
+                                                               csize - off, "ISO-8859-1");
+                      break;
+                    case 0x01:
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + off],
+                                                               csize - off, "UCS-2");
+                      break;
+                    default:
+                      /* bad encoding byte,
+                         try to convert from iso-8859-1 */
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + off],
+                                                               csize - off, "ISO-8859-1");
+                      break;
+                    }
+                  break;
+                case SL:
+                  if (csize < 7)
+                    return 0; /* malformed */
+                  /* find end of description */
+                  switch (data[pos + 10])
+                    {
+                    case 0x00:
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 16],
+                                                               csize - 6, "ISO-8859-1");
+                      break;
+                    case 0x01:
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 16],
+                                                               csize - 6, "UCS-2");
+                      break;
+                    default:
+                      /* bad encoding byte,
+                         try to convert from iso-8859-1 */
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 16],
+                                                               csize - 6, "ISO-8859-1");
+                      break;
+                    }
+                  break;
+                case L:
+                  if (csize < 5)
+                    return 0; /* malformed */
+                  /* find end of description */
+                  switch (data[pos + 10])
+                    {
+                    case 0x00:
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 14],
+                                                               csize - 4, "ISO-8859-1");
+                      break;
+                    case 0x01:
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 14],
+                                                               csize - 4, "UCS-2");
+                      break;
+                    default:
+                      /* bad encoding byte,
+                         try to convert from iso-8859-1 */
+                      word = EXTRACTOR_common_convert_to_utf8 ((const char *) &data[pos + 14],
+                                                               csize - 4, "ISO-8859-1");
+                      break;
+                    }
+                  break;
+                case I:
+                  if (csize < 2)
+                    return 0; /* malformed */
+                  /* find end of mime type */
+                  off = 11;
+                  while ( (off < size) &&
+                          (off - pos < csize) &&
+                          (data[pos + off] == '\0') )
+                    off++;
+                  if ( (off >= csize) ||
+                       (data[pos+off] != '\0') )
+                    return 0; /* malformed */
+                  off++;
+                  mime = strdup ((const char*) &data[pos + 11]);
+                  
+                  switch (data[pos+off])
+                    {
+                    case 0x03:
+                    case 0x04:
+                      type = EXTRACTOR_METATYPE_COVER_PICTURE;
+                      break;
+                    case 0x07:
+                    case 0x08:
+                    case 0x09:
+                    case 0x0A:
+                    case 0x0B:
+                    case 0x0C:
+                      type = EXTRACTOR_METATYPE_CONTRIBUTOR_PICTURE;
+                      break;
+                    case 0x0D:
+                    case 0x0E:
+                    case 0x0F:
+                      type = EXTRACTOR_METATYPE_EVENT_PICTURE;
+                      break;
+                    case 0x14:
+                      type = EXTRACTOR_METATYPE_LOGO;
+                      type = EXTRACTOR_METATYPE_LOGO;
+                      break;
+                    default:
+                      type = EXTRACTOR_METATYPE_PICTURE;
+                      break;
+                    }
+                  off++;
+                  /* find end of description */
+                  while ( (off < size) &&
+                          (off - pos < csize) &&
+                          (data[pos + off] == '\0') )
+                    off++;
+                  if ( (off >= csize) ||
+                       (data[pos+off] != '\0') )
+                    return 0; /* malformed */
+                  off++;
+                  if (0 == strcasecmp ("-->",
+                                       mime))
+                    {
+                      /* not supported */
+                    }
+                  else
+                    {
+                      if (0 != proc (proc_cls,
+                                     "id3v24",
+                                     type,
+                                     EXTRACTOR_METAFORMAT_BINARY,
+                                     mime,
+                                     (const char*) &data[pos + off],
+                                     csize + 6 - off))                  
+                        {
+                          free (mime);
+                          return 1;
+                        }
+                    }
+                  free (mime);
+                  word = NULL;
+                  break;
+                default:
+                  return 0;
+                }             
              if ((word != NULL) && (strlen (word) > 0))
                {
-                  prev = addKeyword (prev, word, tmap[i].type);
+                  if (0 != proc (proc_cls,
-                }
+                                 "id3v24",
-              else
+                                 tmap[i].type,
-                {
+                                 EXTRACTOR_METAFORMAT_UTF8,
-                  free (word);
+                                 "text/plain",
+                                 word,
+                                 strlen(word)+1))
+                    {
+                      free (word);
+                      return 1;
+                    }
                }
+              free (word);
              break;
            }
          i++;
        }
      pos += 10 + csize;
    }
-  return prev;
+  return 0;
 }
 /* end of id3v24_extractor.c */
diff --git a/src/plugins/id3v2_extractor.c b/src/plugins/id3v2_extractor.c
index da5c6d9..f0227f1 100644
--- a/src/plugins/id3v2_extractor.c
+++ b/src/plugins/id3v2_extractor.c
@@ -113,7 +113,7 @@ static Matches tmap[] = {
  /* skipping CRM */
  /* skipping CRA */
  /* {"LNK", EXTRACTOR_METATYPE_URL, XXX}, */
-  {NULL, 0},
+  {NULL, 0, T},
 };
diff --git a/src/plugins/odf_extractor.c b/src/plugins/odf_extractor.c
index 479f5ca..9a8c827 100644
--- a/src/plugins/odf_extractor.c
+++ b/src/plugins/odf_extractor.c
@@ -44,7 +44,7 @@ static Matches tmap[] = {
  { "meta:creation-date", EXTRACTOR_METATYPE_CREATION_DATE },
  { "dc:date",            EXTRACTOR_METATYPE_UNKNOWN_DATE },
  { "dc:creator",         EXTRACTOR_METATYPE_CREATOR },
-  { "dc:language",        EXTRACTOR_METATYPE_DOCUMENT_LANGUAGE },
+  { "dc:language",        EXTRACTOR_METATYPE_LANGUAGE },
  { "dc:title",           EXTRACTOR_METATYPE_TITLE },
  { "dc:description",     EXTRACTOR_METATYPE_DESCRIPTION },
  { "dc:subject",         EXTRACTOR_METATYPE_SUBJECT },
diff --git a/src/plugins/ole2_extractor.c b/src/plugins/ole2_extractor.c
index 1b8d5cf..5f6cd01 100644
--- a/src/plugins/ole2_extractor.c
+++ b/src/plugins/ole2_extractor.c
@@ -107,7 +107,7 @@ static Matches tmap[] = {
  { "meta:generator", EXTRACTOR_METATYPE_CREATED_BY_SOFTWARE },
  { "meta:template", EXTRACTOR_METATYPE_TEMPLATE },
  { "meta:editing-cycles", EXTRACTOR_METATYPE_EDITING_CYCLES }, 
-  /* { "Dictionary", EXTRACTOR_METATYPE_DOCUMENT_LANGUAGE },  */
+  /* { "Dictionary", EXTRACTOR_METATYPE_LANGUAGE },  */
  /* { "gsf:security", EXTRACTOR_SECURITY }, */
  /* { "gsf:scale", EXTRACTOR_SCALE }, // always "false"? */
  /* { "meta:editing-duration", EXTRACTOR_METATYPE_TOTAL_EDITING_TIME }, // encoding? */
@@ -544,7 +544,7 @@ EXTRACTOR_ole2_extract (const char *data,
  if ( (lang != NULL) && (ret == 0) )
    ret = addKeyword(proc, proc_cls,
                     lang,
-                     EXTRACTOR_METATYPE_DOCUMENT_LANGUAGE);  
+                     EXTRACTOR_METATYPE_LANGUAGE);  
  if (lcb >= 6) {
    for (i=0;i<gsf_infile_num_children(infile);i++) {
      if (ret != 0)
diff --git a/src/plugins/png_extractor.c b/src/plugins/png_extractor.c
index 5fb2b9d..bdba922 100644
--- a/src/plugins/png_extractor.c
+++ b/src/plugins/png_extractor.c
@@ -141,7 +141,7 @@ processiTXt (const char *data,
  language = &data[pos];
  ret = 0;
  if (stnlen (language, length - pos) > 0)
-    ADDF (EXTRACTOR_METATYPE_DOCUMENT_LANGUAGE,
+    ADDF (EXTRACTOR_METATYPE_LANGUAGE,
          stndup (language, length - pos));
  pos += stnlen (language, length - pos) + 1;
  if (pos + 1 >= length)
diff --git a/src/plugins/qt_extractor.c b/src/plugins/qt_extractor.c
index 3abd543..123e0f5 100644
--- a/src/plugins/qt_extractor.c
+++ b/src/plugins/qt_extractor.c
@@ -395,9 +395,9 @@ static ITTagConversionEntry it_to_extr_table[] = {
  {"catg", EXTRACTOR_METATYPE_SECTION},
  {"keyw", EXTRACTOR_METATYPE_KEYWORDS},
  {"desc", EXTRACTOR_METATYPE_DESCRIPTION},
-  {"tvnn", EXTRACTOR_METATYPE_TV_NETWORK_NAME},
+  {"tvnn", EXTRACTOR_METATYPE_NETWORK_NAME},
-  {"tvsh", EXTRACTOR_METATYPE_TV_SHOW_NAME}, 
+  {"tvsh", EXTRACTOR_METATYPE_SHOW_NAME}, 
-  {"tven", EXTRACTOR_METATYPE_TV_NETWORK_NAME},
+  {"tven", EXTRACTOR_METATYPE_NETWORK_NAME},
  {NULL, EXTRACTOR_METATYPE_RESERVED}
 };
@@ -850,7 +850,7 @@ processTextTag (const char *input,
  lang = ntohs (txt->language);
  if (lang >= sizeof (languages) / sizeof (char *))
    return 0;                   /* invalid */
-  addKeyword (EXTRACTOR_METATYPE_DOCUMENT_LANGUAGE, languages[lang], ec);
+  addKeyword (EXTRACTOR_METATYPE_LANGUAGE, languages[lang], ec);
  meta = malloc (len + 1);
  memcpy (meta, &txt[1], len);
author	Christian Grothoff <christian@grothoff.org>	2009-12-20 00:06:45 +0000
committer	Christian Grothoff <christian@grothoff.org>	2009-12-20 00:06:45 +0000
commit	949dae1583254b789e3dafe569e030140a621846 (patch)
tree	a6e356030fcb030bd88d96b74d7aa62e1dd5aeb7
parent	73b50507dba0570f2182f21f8b1c27a95886e4e7 (diff)
download	libextractor-949dae1583254b789e3dafe569e030140a621846.tar.gz libextractor-949dae1583254b789e3dafe569e030140a621846.zip