libextractor

GNU libextractor
Log | Files | Refs | Submodules | README | LICENSE

commit 96582d0cc647699770666651f928d0ced29bf155
parent 10764c9eb4ab4e0674c7142f66419a6539f92c1e
Author: Christian Grothoff <christian@grothoff.org>
Date:   Mon, 19 Sep 2005 02:44:45 +0000

fx

Diffstat:
M src/plugins/htmlextractor.c | 19 ++++++++-----------
1 file changed, 8 insertions(+), 11 deletions(-)

diff --git a/src/plugins/htmlextractor.c b/src/plugins/htmlextractor.c @@ -137,11 +137,10 @@ static int lookFor(char c, size_t size) { size_t p = *pos; - if (data[p] == '\0') return 0; while ( (p < size) && (data[p] != c) ) { - p++; if (data[p] == '\0') return 0; + p++; } *pos = p; return p < size; @@ -152,11 +151,10 @@ static int skipWhitespace(size_t * pos, size_t size) { size_t p = *pos; - if (data[p] == '\0') return 0; while ( (p < size) && (isspace(data[p])) ) { - p++; if (data[p] == '\0') return 0; + p++; } *pos = p; return p < size; @@ -167,11 +165,10 @@ static int skipLetters(size_t * pos, size_t size) { size_t p = *pos; - if (data[p] == '\0') return 0; while ( (p < size) && (isalpha(data[p])) ) { - p++; if (data[p] == '\0') return 0; + p++; } *pos = p; return p < size; @@ -183,11 +180,10 @@ static int lookForMultiple(const char * c, size_t size) { size_t p = *pos; - if (data[p] == '\0') return 0; while ( (p < size) && (strchr(c, data[p]) == NULL) ) { - p++; if (data[p] == '\0') return 0; + p++; } *pos = p; return p < size; @@ -389,11 +385,12 @@ libextractor_html_extract(const char * filename, prev); charset = strstr(tmp, "charset="); + + if (charset != NULL) + charset = strdup(&charset[strlen("charset=")]); free(tmp); } - if (charset != NULL) - charset = strdup(&charset[strlen("charset=")]); - else + if (charset == NULL) charset = strdup("ISO-8859-1"); /* try a sensible default */