Author: kwright
Date: Thu Mar 30 12:25:33 2017
New Revision: 1789511

URL: http://svn.apache.org/viewvc?rev=1789511&view=rev
Log:
Strip anything after the semicolon off of the mime type for MS Exchange

Modified:
    
manifoldcf/trunk/connectors/email/connector/src/main/java/org/apache/manifoldcf/crawler/connectors/email/EmailConnector.java

Modified: 
manifoldcf/trunk/connectors/email/connector/src/main/java/org/apache/manifoldcf/crawler/connectors/email/EmailConnector.java
URL: 
http://svn.apache.org/viewvc/manifoldcf/trunk/connectors/email/connector/src/main/java/org/apache/manifoldcf/crawler/connectors/email/EmailConnector.java?rev=1789511&r1=1789510&r2=1789511&view=diff
==============================================================================
--- manifoldcf/trunk/connectors/email/connector/src/main/java/org/apache/manifoldcf/crawler/connectors/email/EmailConnector.java (original)
+++ manifoldcf/trunk/connectors/email/connector/src/main/java/org/apache/manifoldcf/crawler/connectors/email/EmailConnector.java Thu Mar 30 12:25:33 2017
@@ -803,10 +803,12 @@ public class EmailConnector extends org.
                 
               final String origMimeType = part.getContentType();
               final String mimeType;
-              if (origMimeType == null || origMimeType.indexOf("\n") == -1) {
+              //MSExchange puts crap after the mime type so it has to be munged.
+              // Example: "application/msword; name=SampleDOCFile_100kb.doc"
+              if (origMimeType == null || origMimeType.indexOf(";") == -1) {
                 mimeType = origMimeType;
               } else {
-                mimeType = origMimeType.substring(0, origMimeType.indexOf("\n")).trim();
+                mimeType = origMimeType.substring(0, origMimeType.indexOf(";"));
               }
               if (!activities.checkMimeTypeIndexable(mimeType)) {
                 errorCode = activities.EXCLUDED_MIMETYPE;


Reply via email to