Dear Wiki user, You have subscribed to a wiki page or wiki category on "Nutch Wiki" for change notification.
The "NutchFileFormats" page has been changed by LewisJohnMcgibbney: https://wiki.apache.org/nutch/NutchFileFormats?action=diff&rev1=9&rev2=10 ||file||key datatype||value datatype||codec|| - ||data||org.apache.hadoop.io.Text||org.apache.nutch.crawl.CrawlDatum||org.apache.hadoop.io.compress.DefaultCodec|| - ||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||org.apache.hadoop.io.compress.DefaultCodec|| + ||data||org.apache.hadoop.io.Text||org.apache.nutch.crawl.CrawlDatum||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| + ||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| = LinkDB = @@ -111, +111 @@ == File Formats == ||file||key datatype||value datatype||codec|| - ||data||org.apache.hadoop.io.Text||org.apache.nutch.crawl.Inlinks||org.apache.hadoop.io.compress.DefaultCodec|| - ||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||org.apache.hadoop.io.compress.DefaultCodec|| + ||data||org.apache.hadoop.io.Text||org.apache.nutch.crawl.Inlinks||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| + ||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| = Segments = @@ -153, +153 @@ == Description == - ||content||data||org.apache.hadoop.io.Text||org.apache.nutch.protocol.Content||org.apache.hadoop.io.compress.DefaultCodec|| - ||content||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||org.apache.hadoop.io.compress.DefaultCodec|| - ||crawl_fetch||data||org.apache.hadoop.io.Text||org.apache.nutch.crawl.CrawlDatum||org.apache.hadoop.io.compress.DefaultCodec|| - ||crawl_fetch||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||org.apache.hadoop.io.compress.DefaultCodec|| - ||crawl_generate||part-0000||org.apache.hadoop.io.Text||org.apache.nutch.crawl.CrawlDatum||org.apache.hadoop.io.compress.DefaultCodec|| - ||crawl_parse||data||org.apache.hadoop.io.Text||org.apache.nutch.crawl.CrawlDatum||org.apache.hadoop.io.compress.DefaultCodec|| - ||crawl_parse||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||org.apache.hadoop.io.compress.DefaultCodec|| - ||parse_data||data||org.apache.hadoop.io.Text||org.apache.nutch.parse.ParseData||org.apache.hadoop.io.compress.DefaultCodec|| - ||parse_data||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||org.apache.hadoop.io.compress.DefaultCodec|| - ||parse_text||data||org.apache.hadoop.io.Text||org.apache.nutch.parse.ParseText||org.apache.hadoop.io.compress.DefaultCodec|| - ||parse_text||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||org.apache.hadoop.io.compress.DefaultCodec|| + ||content||data||org.apache.hadoop.io.Text||org.apache.nutch.protocol.Content||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| + ||content||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| + ||crawl_fetch||data||org.apache.hadoop.io.Text||org.apache.nutch.crawl.CrawlDatum||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| + ||crawl_fetch||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| + ||crawl_generate||part-0000||org.apache.hadoop.io.Text||org.apache.nutch.crawl.CrawlDatum||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| + ||crawl_parse||data||org.apache.hadoop.io.Text||org.apache.nutch.crawl.CrawlDatum||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| + ||crawl_parse||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| + ||parse_data||data||org.apache.hadoop.io.Text||org.apache.nutch.parse.ParseData||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| + ||parse_data||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| + ||parse_text||data||org.apache.hadoop.io.Text||org.apache.nutch.parse.ParseText||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| + ||parse_text||index||org.apache.hadoop.io.Text||org.apache.hadoop.io.LongWritable||[[http://hadoop.apache.org/docs/current/api/index.html?org/apache/hadoop/io/compress/DefaultCodec.html|org.apache.hadoop.io.compress.DefaultCodec]]|| = Old File Format Documentation =