While in crawler mode, wget exits with "bad buffer" when it encounters the
following page:
<html>
<font style=i></font>
This can be fixed with the following patch:
--- html-url.c 2009-09-22 07:00:12.000000000 +0400
+++ html-url.c2 2010-10-07 10:13:11.000000000 +0400
@@ -350,12 +350,23 @@
check_style_attr (struct taginfo *tag, struct map_context *ctx)
{
int attrind;
+ int raw_start;
+ int raw_len;
char *style = find_attr (tag, "style", &attrind);
if (!style)
return;
/* raw pos and raw size include the quotes, hence the +1 -2 */
- get_urls_css (ctx, ATTR_POS(tag,attrind,ctx)+1,
ATTR_SIZE(tag,attrind)-2);
+ raw_start = ATTR_POS(tag,attrind,ctx);
+ raw_len = ATTR_SIZE(tag,attrind);
+ if( *(char *)(ctx->text + raw_start) == '\'' ||
+ *(char *)(ctx->text + raw_start) == '"'){
+ raw_start += 1;
+ raw_len -= 2;
+ }
+ if(raw_len <= 0)
+ return;
+ get_urls_css (ctx, raw_start, raw_len);
}
/* All the tag_* functions are called from collect_tags_mapper, as