aboutsummaryrefslogtreecommitdiff
path: root/src/plugins/zip_extractor.c
blob: ca60b64e0cb5835991cb0ec685395144fad7074f (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
/*
 * This file is part of libextractor.
 * Copyright (C) 2012 Vidyut Samanta and Christian Grothoff
 *
 * libextractor is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published
 * by the Free Software Foundation; either version 3, or (at your
 * option) any later version.
 * 
 * libextractor is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with libextractor; see the file COPYING.  If not, write to the
 * Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
 * Boston, MA 02110-1301, USA.
 */ 
/**
 * @file plugins/zip_extractor.c
 * @brief plugin to support ZIP files
 * @author Christian Grothoff
 */
#include "platform.h"
#include <ctype.h>
#include "extractor.h"
#include "unzip.h"

  
/**
 * Main entry method for the 'application/zip' extraction plugin.  
 *
 * @param ec extraction context provided to the plugin
 */
void
EXTRACTOR_zip_extract_method (struct EXTRACTOR_ExtractContext *ec)
{
  struct EXTRACTOR_UnzipFile *uf;
  struct EXTRACTOR_UnzipFileInfo fi;
  char fname[256];
  char fcomment[256];

  if (NULL == (uf = EXTRACTOR_common_unzip_open (ec)))
    return;
  if ( (EXTRACTOR_UNZIP_OK ==
	EXTRACTOR_common_unzip_go_find_local_file (uf,
						   "meta.xml",
						   2)) ||
       (EXTRACTOR_UNZIP_OK ==
	EXTRACTOR_common_unzip_go_find_local_file (uf,
						   "META-INF/MANIFEST.MF",
						   2)) )
    {
      /* not a normal zip, might be odf, jar, etc. */
      goto CLEANUP;
    }
  if (EXTRACTOR_UNZIP_OK !=
      EXTRACTOR_common_unzip_go_to_first_file (uf))
    { 
      /* zip malformed? */
      goto CLEANUP;
   }
  if (0 !=
      ec->proc (ec->cls, 
		"zip",
		EXTRACTOR_METATYPE_MIMETYPE,
		EXTRACTOR_METAFORMAT_UTF8,
		"text/plain",
		"application/zip",
		strlen ("application/zip") + 1))
    goto CLEANUP;
  if (EXTRACTOR_UNZIP_OK ==
      EXTRACTOR_common_unzip_get_global_comment (uf,
						 fcomment,
						 sizeof (fcomment)))
    {
      if ( (0 != strlen (fcomment)) &&
	   (0 !=
	    ec->proc (ec->cls, 
		      "zip",
		      EXTRACTOR_METATYPE_COMMENT,
		      EXTRACTOR_METAFORMAT_C_STRING,
		      "text/plain",
		      fcomment,
		      strlen (fcomment) + 1)))
	goto CLEANUP;
    }
  do
    {
      if (EXTRACTOR_UNZIP_OK ==
	  EXTRACTOR_common_unzip_get_current_file_info (uf,
							&fi,
							fname,
							sizeof (fname),
							NULL, 0,
							fcomment,
							sizeof (fcomment)))
	{
	  if ( (0 != strlen (fname)) &&
	       (0 !=
		ec->proc (ec->cls, 
			  "zip",
			  EXTRACTOR_METATYPE_FILENAME,
			  EXTRACTOR_METAFORMAT_C_STRING,
			  "text/plain",
			  fname,
			  strlen (fname) + 1)))
	    goto CLEANUP;
	  if ( (0 != strlen (fcomment)) &&
	       (0 !=
		ec->proc (ec->cls, 
			  "zip",
			  EXTRACTOR_METATYPE_COMMENT,
			  EXTRACTOR_METAFORMAT_C_STRING,
			  "text/plain",
			  fcomment,
			  strlen (fcomment) + 1)))
	    goto CLEANUP;
	}						    
    }
  while (EXTRACTOR_UNZIP_OK ==
	 EXTRACTOR_common_unzip_go_to_next_file (uf));
  
CLEANUP:
  (void) EXTRACTOR_common_unzip_close (uf);
}

/* end of zip_extractor.c */