diff --git a/KeywordSearch/src/org/sleuthkit/autopsy/keywordsearch/AbstractFileStringExtract.java b/KeywordSearch/src/org/sleuthkit/autopsy/keywordsearch/AbstractFileStringExtract.java index f2f7318a32976e15c09295f0920d05d18a7d9498..72a9d7dadd2fd93a19d57af57a2ee33eaf405727 100644 --- a/KeywordSearch/src/org/sleuthkit/autopsy/keywordsearch/AbstractFileStringExtract.java +++ b/KeywordSearch/src/org/sleuthkit/autopsy/keywordsearch/AbstractFileStringExtract.java @@ -56,7 +56,8 @@ class AbstractFileStringExtract implements AbstractFileExtract { static final String[] UNSUPPORTED_EXTENSIONS = { //Archives //Note: archive unpacker module will process these instead - "tar", "jar", "zip", "7z", "gzip", "bzip", "bzip2", "gz", "tgz", "cab", "rar", "arj", "dmg", "iso"}; + //"tar", "jar", "zip", "7z", "gzip", "bzip", "bzip2", "gz", "tgz", "cab", "rar", "arj", "dmg", "iso" + }; //disabled prepending of BOM //static { diff --git a/KeywordSearch/src/org/sleuthkit/autopsy/keywordsearch/AbstractFileTikaTextExtract.java b/KeywordSearch/src/org/sleuthkit/autopsy/keywordsearch/AbstractFileTikaTextExtract.java index ed7d85eb96bf9af3133c19f329ba4c4c16c38aa0..e8f6f0ba42d77236ea1844cb5f71c747fedadf0d 100644 --- a/KeywordSearch/src/org/sleuthkit/autopsy/keywordsearch/AbstractFileTikaTextExtract.java +++ b/KeywordSearch/src/org/sleuthkit/autopsy/keywordsearch/AbstractFileTikaTextExtract.java @@ -69,6 +69,8 @@ public class AbstractFileTikaTextExtract implements AbstractFileExtract { // TODO: use type detection mechanism instead, and maintain supported MimeTypes, not extensions // supported extensions list from http://www.lucidimagination.com/devzone/technical-articles/content-extraction-tika static final String[] SUPPORTED_EXTENSIONS = { + //Archives (to be removed when we have an archive module) + "tar", "jar", "zip", "gzip", "bzip2", "gz", "tgz", "ar", "cpio", //MS Office "doc", "dot", "docx", "docm", "dotx", "dotm", "xls", "xlw", "xlt", "xlsx", "xlsm", "xltx", "xltm",