commit 96582d0cc647699770666651f928d0ced29bf155
parent 10764c9eb4ab4e0674c7142f66419a6539f92c1e
Author: Christian Grothoff <christian@grothoff.org>
Date: Mon, 19 Sep 2005 02:44:45 +0000
fix: test for NUL before advancing in the scan helpers; copy charset before freeing tmp
Diffstat:
1 file changed, 8 insertions(+), 11 deletions(-)
diff --git a/src/plugins/htmlextractor.c b/src/plugins/htmlextractor.c
@@ -137,11 +137,10 @@ static int lookFor(char c,
size_t size) {
size_t p = *pos;
- if (data[p] == '\0') return 0;
while ( (p < size) &&
(data[p] != c) ) {
- p++;
if (data[p] == '\0') return 0;
+ p++;
}
*pos = p;
return p < size;
@@ -152,11 +151,10 @@ static int skipWhitespace(size_t * pos,
size_t size) {
size_t p = *pos;
- if (data[p] == '\0') return 0;
while ( (p < size) &&
(isspace(data[p])) ) {
- p++;
if (data[p] == '\0') return 0;
+ p++;
}
*pos = p;
return p < size;
@@ -167,11 +165,10 @@ static int skipLetters(size_t * pos,
size_t size) {
size_t p = *pos;
- if (data[p] == '\0') return 0;
while ( (p < size) &&
(isalpha(data[p])) ) {
- p++;
if (data[p] == '\0') return 0;
+ p++;
}
*pos = p;
return p < size;
@@ -183,11 +180,10 @@ static int lookForMultiple(const char * c,
size_t size) {
size_t p = *pos;
- if (data[p] == '\0') return 0;
while ( (p < size) &&
(strchr(c, data[p]) == NULL) ) {
- p++;
if (data[p] == '\0') return 0;
+ p++;
}
*pos = p;
return p < size;
@@ -389,11 +385,12 @@ libextractor_html_extract(const char * filename,
prev);
charset = strstr(tmp, "charset=");
+
+ if (charset != NULL)
+ charset = strdup(&charset[strlen("charset=")]);
free(tmp);
}
- if (charset != NULL)
- charset = strdup(&charset[strlen("charset=")]);
- else
+ if (charset == NULL)
charset = strdup("ISO-8859-1"); /* try a sensible default */