aboutsummaryrefslogtreecommitdiff
path: root/src/plugins/archive_extractor.c
blob: ef4e7c75163923d45aa2210d547fb194da081c35 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
/*
     This file is part of libextractor.
     (C) 2012 Christian Grothoff

     libextractor is free software; you can redistribute it and/or modify
     it under the terms of the GNU General Public License as published
     by the Free Software Foundation; either version 3, or (at your
     option) any later version.

     libextractor is distributed in the hope that it will be useful, but
     WITHOUT ANY WARRANTY; without even the implied warranty of
     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
     General Public License for more details.

     You should have received a copy of the GNU General Public License
     along with libextractor; see the file COPYING.  If not, write to the
     Free Software Foundation, Inc., 59 Temple Place - Suite 330,
     Boston, MA 02111-1307, USA.
 */
/**
 * @file plugins/archive_extractor.c
 * @brief plugin to support archives (such as TAR)
 * @author Christian Grothoff
 */
#include "platform.h"
#include "extractor.h"
#include <archive.h>
#include <archive_entry.h>

/**
 * Read callback registered with libarchive; pulls the next chunk of
 * input through the extraction context's 'read' function.
 *
 * @param a archive handle (not used by this callback)
 * @param client_data our 'struct EXTRACTOR_ExtractContext'
 * @param buff set to NULL first, then handed to the context's 'read'
 *        function so it can store a pointer to the data there
 * @return value returned by the context's 'read' function (requested
 *         with a 16 KiB limit), or ARCHIVE_FATAL if that function
 *         returned -1
 */
static ssize_t
read_cb (struct archive *a,
         void *client_data,
         const void **buff)
{
  struct EXTRACTOR_ExtractContext *ctx = client_data;
  ssize_t got;

  *buff = NULL;
  got = ctx->read (ctx->cls, (void **) buff, 16 * 1024);
  return (-1 == got) ? ARCHIVE_FATAL : got;
}


/**
 * Skip callback registered with libarchive; implemented as a relative
 * seek (SEEK_CUR) through the extraction context's 'seek' function.
 *
 * @param a archive handle (not used by this callback)
 * @param client_data our 'struct EXTRACTOR_ExtractContext'
 * @param request number of bytes to skip
 * @return 'request' if the seek did not return -1, 0 otherwise
 */
static __LA_INT64_T
skip_cb (struct archive *a,
         void *client_data,
         __LA_INT64_T request)
{
  struct EXTRACTOR_ExtractContext *ctx = client_data;
  __LA_INT64_T skipped = request;

  if (-1 == ctx->seek (ctx->cls, request, SEEK_CUR))
    skipped = 0; /* seek failed: report that nothing was skipped */
  return skipped;
}


/**
 * Main entry method for the ARCHIVE extraction plugin.
 *
 * Opens the input through libarchive (all formats and all
 * compression filters enabled) using 'read_cb' and 'skip_cb',
 * passes the path name of every archive entry to 'ec->proc' as
 * EXTRACTOR_METATYPE_FILENAME and, once iteration is done, passes
 * the archive format name as EXTRACTOR_METATYPE_FORMAT.
 *
 * Iteration stops as soon as 'ec->proc' returns non-zero; in that
 * case 'ec->proc' is not called again (the format is not reported).
 * Entries for which libarchive has no path name are skipped.
 *
 * @param ec extraction context provided to the plugin
 */
void
EXTRACTOR_archive_extract_method (struct EXTRACTOR_ExtractContext *ec)
{
  struct archive *a;
  struct archive_entry *entry;
  const char *fname;
  const char *s;
  char *format;
  int aborted;

  if (NULL == (a = archive_read_new ()))
    return; /* out of memory, nothing to clean up */
  format = NULL;
  aborted = 0;
  /* libarchive 3.x renamed "compression" to "filter" and deprecated
     the old entry points; use whichever this libarchive provides */
#if ARCHIVE_VERSION_NUMBER >= 3000000
  archive_read_support_filter_all (a);
#else
  archive_read_support_compression_all (a);
#endif
  archive_read_support_format_all (a);
  if (ARCHIVE_OK ==
      archive_read_open2 (a, ec, NULL, &read_cb, &skip_cb, NULL))
    {
      while (ARCHIVE_OK == archive_read_next_header (a, &entry))
        {
          /* remember the format name once; it is reported after the
             archive handle has been released, hence the copy */
          if ( (NULL == format) &&
               (NULL != (fname = archive_format_name (a))) )
            format = strdup (fname);
          s = archive_entry_pathname (entry);
          if (NULL == s)
            continue; /* no path name available; strlen (NULL) is undefined */
          if (0 != ec->proc (ec->cls,
                             "tar",
                             EXTRACTOR_METATYPE_FILENAME,
                             EXTRACTOR_METAFORMAT_UTF8,
                             "text/plain",
                             s, strlen (s) + 1))
            {
              aborted = 1;
              break;
            }
        }
    }
#if ARCHIVE_VERSION_NUMBER >= 3000000
  archive_read_free (a);
#else
  archive_read_finish (a);
#endif
  /* do not call 'proc' again once it has asked us to stop */
  if ( (NULL != format) &&
       (0 == aborted) )
    (void) ec->proc (ec->cls,
                     "tar",
                     EXTRACTOR_METATYPE_FORMAT,
                     EXTRACTOR_METAFORMAT_UTF8,
                     "text/plain", format, strlen (format) + 1);
  free (format);
}


/* end of archive_extractor.c */