Author: siren
Date: Tue Oct 24 07:23:38 2006
New Revision: 467343

URL: http://svn.apache.org/viewvc?view=rev&rev=467343
Log:
fix for NUTCH-391

Modified:
    lucene/nutch/branches/branch-0.8/CHANGES.txt
    lucene/nutch/branches/branch-0.8/src/java/org/apache/nutch/parse/ParseUtil.java

Modified: lucene/nutch/branches/branch-0.8/CHANGES.txt
URL: http://svn.apache.org/viewvc/lucene/nutch/branches/branch-0.8/CHANGES.txt?view=diff&rev=467343&r1=467342&r2=467343
==============================================================================
--- lucene/nutch/branches/branch-0.8/CHANGES.txt (original)
+++ lucene/nutch/branches/branch-0.8/CHANGES.txt Tue Oct 24 07:23:38 2006
@@ -2,7 +2,8 @@
 
 Unreleased changes (0.8.2)
 
- 1.
+ 1. NUTCH-391 ParseUtil logs file contents to log file when it
+    cannot find parser (siren)
 
 Release 0.8.1 - 2006-09-24
 

Modified: lucene/nutch/branches/branch-0.8/src/java/org/apache/nutch/parse/ParseUtil.java
URL: http://svn.apache.org/viewvc/lucene/nutch/branches/branch-0.8/src/java/org/apache/nutch/parse/ParseUtil.java?view=diff&rev=467343&r1=467342&r2=467343
==============================================================================
--- lucene/nutch/branches/branch-0.8/src/java/org/apache/nutch/parse/ParseUtil.java (original)
+++ lucene/nutch/branches/branch-0.8/src/java/org/apache/nutch/parse/ParseUtil.java Tue Oct 24 07:23:38 2006
@@ -68,8 +68,8 @@
       parsers = this.parserFactory.getParsers(content.getContentType(), "");
     } catch (ParserNotFound e) {
       if (LOG.isWarnEnabled()) {
-        LOG.warn("No suitable parser found when trying to parse content " +
-                 content);
+        LOG.warn("No suitable parser found when trying to parse content " + content.getUrl() +
+               " of type " + content.getContentType());
       }
       throw new ParseException(e.getMessage());
     }
@@ -123,8 +123,8 @@
       p = this.parserFactory.getParserById(extId);
     } catch (ParserNotFound e) {
       if (LOG.isWarnEnabled()) {
-        LOG.warn("No suitable parser found when trying to parse content " +
-                 content);
+        LOG.warn("No suitable parser found when trying to parse content " + content.getUrl() +
+               " of type " + content.getContentType());
       }
       throw new ParseException(e.getMessage());
     }