Author: nick
Date: Fri Jun 5 10:12:07 2015
New Revision: 1683702
URL: http://svn.apache.org/r1683702
Log:
Mark the TeX formats (BibTeX and TeX) as subtypes of text/plain, so that if
there isn't a dedicated parser for them, they still get some basic text
extracted via the text parser. Improves govdocs1 coverage.
Modified:
tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
Modified:
tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
URL:
http://svn.apache.org/viewvc/tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml?rev=1683702&r1=1683701&r2=1683702&view=diff
==============================================================================
---
tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
(original)
+++
tika/trunk/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
Fri Jun 5 10:12:07 2015
@@ -2824,6 +2824,7 @@
</magic>
<glob pattern="*.bib"/>
<glob pattern="*.bibtex"/>
+ <sub-class-of type="text/plain"/>
</mime-type>
<mime-type type="application/x-bittorrent">
@@ -3760,6 +3761,7 @@
<match value="\\contentsline" type="string" offset="0"/>
</magic>
<glob pattern="*.tex"/>
+ <sub-class-of type="text/plain"/>
</mime-type>
<mime-type type="application/x-tex-tfm">