This is an automated email from the ASF dual-hosted git repository.
tallison pushed a commit to branch 2.x
in repository https://gitbox.apache.org/repos/asf/tika.git
The following commit(s) were added to refs/heads/2.x by this push:
new d0ebfda fix tika-eval bug - include child file extension instead of parent
d0ebfda is described below
commit d0ebfda73c40af151ad4487f2fba2edf89a0ec73
Author: tballison <[email protected]>
AuthorDate: Tue Feb 28 15:55:10 2017 -0500
fix tika-eval bug - include child file extension instead of parent
---
.../src/main/java/org/apache/tika/eval/AbstractProfiler.java | 8 ++++++--
1 file changed, 6 insertions(+), 2 deletions(-)
diff --git a/tika-eval/src/main/java/org/apache/tika/eval/AbstractProfiler.java b/tika-eval/src/main/java/org/apache/tika/eval/AbstractProfiler.java
index 0e89849..f81d25e 100644
--- a/tika-eval/src/main/java/org/apache/tika/eval/AbstractProfiler.java
+++ b/tika-eval/src/main/java/org/apache/tika/eval/AbstractProfiler.java
@@ -30,6 +30,7 @@ import java.util.Collections;
import java.util.Comparator;
import java.util.HashMap;
import java.util.List;
+import java.util.Locale;
import java.util.Map;
import java.util.concurrent.ArrayBlockingQueue;
import java.util.concurrent.atomic.AtomicInteger;
@@ -217,8 +218,11 @@ public abstract class AbstractProfiler extends FileResourceConsumer {
data.put(Cols.IS_EMBEDDED, TRUE);
data.put(Cols.FILE_NAME, getFileName(m.get(RecursiveParserWrapper.EMBEDDED_RESOURCE_PATH)));
}
- data.put(Cols.FILE_EXTENSION,
- FilenameUtils.getExtension(fps.getRelativeSourceFilePath().getFileName().toString()));
+
+ String ext = FilenameUtils.getExtension(data.get(Cols.FILE_NAME));
+ ext = (ext == null) ? "" : ext.toLowerCase(Locale.US);
+ data.put(Cols.FILE_EXTENSION, ext);
+
long srcFileLen = getSourceFileLength(m);
if (srcFileLen > NON_EXISTENT_FILE_LENGTH) {
data.put(Cols.LENGTH, Long.toString(srcFileLen));
--
To stop receiving notification emails like this one, please contact
['"[email protected]" <[email protected]>'].