http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testPagesHeadersFootersFootnotes.pages
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testPagesHeadersFootersFootnotes.pages
 
b/tika-test-resources/src/test/resources/test-documents/testPagesHeadersFootersFootnotes.pages
deleted file mode 100644
index cfecc8c..0000000
Binary files 
a/tika-test-resources/src/test/resources/test-documents/testPagesHeadersFootersFootnotes.pages
 and /dev/null differ

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testPagesHeadersFootersRomanLower.pages
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testPagesHeadersFootersRomanLower.pages
 
b/tika-test-resources/src/test/resources/test-documents/testPagesHeadersFootersRomanLower.pages
deleted file mode 100644
index 9cc0edf..0000000
Binary files 
a/tika-test-resources/src/test/resources/test-documents/testPagesHeadersFootersRomanLower.pages
 and /dev/null differ

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testPagesHeadersFootersRomanUpper.pages
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testPagesHeadersFootersRomanUpper.pages
 
b/tika-test-resources/src/test/resources/test-documents/testPagesHeadersFootersRomanUpper.pages
deleted file mode 100644
index de97673..0000000
Binary files 
a/tika-test-resources/src/test/resources/test-documents/testPagesHeadersFootersRomanUpper.pages
 and /dev/null differ

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testPagesLayout.pages
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testPagesLayout.pages 
b/tika-test-resources/src/test/resources/test-documents/testPagesLayout.pages
deleted file mode 100644
index 46d8a40..0000000
Binary files 
a/tika-test-resources/src/test/resources/test-documents/testPagesLayout.pages 
and /dev/null differ

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testPagesPwdProtected.pages
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testPagesPwdProtected.pages
 
b/tika-test-resources/src/test/resources/test-documents/testPagesPwdProtected.pages
deleted file mode 100644
index 788b516..0000000
Binary files 
a/tika-test-resources/src/test/resources/test-documents/testPagesPwdProtected.pages
 and /dev/null differ

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testPhoneNumberExtractor.odt
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testPhoneNumberExtractor.odt
 
b/tika-test-resources/src/test/resources/test-documents/testPhoneNumberExtractor.odt
deleted file mode 100644
index d32e834..0000000
Binary files 
a/tika-test-resources/src/test/resources/test-documents/testPhoneNumberExtractor.odt
 and /dev/null differ

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testPopupAnnotation.pdf
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testPopupAnnotation.pdf 
b/tika-test-resources/src/test/resources/test-documents/testPopupAnnotation.pdf
deleted file mode 100644
index c82107d..0000000
Binary files 
a/tika-test-resources/src/test/resources/test-documents/testPopupAnnotation.pdf 
and /dev/null differ

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testQUATTRO.qpw
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testQUATTRO.qpw 
b/tika-test-resources/src/test/resources/test-documents/testQUATTRO.qpw
deleted file mode 100644
index ec34f47..0000000
Binary files 
a/tika-test-resources/src/test/resources/test-documents/testQUATTRO.qpw and 
/dev/null differ

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testQUATTRO.wb3
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testQUATTRO.wb3 
b/tika-test-resources/src/test/resources/test-documents/testQUATTRO.wb3
deleted file mode 100644
index 8fc7022..0000000
Binary files 
a/tika-test-resources/src/test/resources/test-documents/testQUATTRO.wb3 and 
/dev/null differ

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testRDF.rdf
----------------------------------------------------------------------
diff --git a/tika-test-resources/src/test/resources/test-documents/testRDF.rdf 
b/tika-test-resources/src/test/resources/test-documents/testRDF.rdf
deleted file mode 100644
index 04b3da7..0000000
--- a/tika-test-resources/src/test/resources/test-documents/testRDF.rdf
+++ /dev/null
@@ -1,23 +0,0 @@
-<?xml version="1.0" encoding="UTF-8"?>
-<!--
- Licensed to the Apache Software Foundation (ASF) under one or more
- contributor license agreements.  See the NOTICE file distributed with
- this work for additional information regarding copyright ownership.
- The ASF licenses this file to You under the Apache License, Version 2.0
- (the "License"); you may not use this file except in compliance with
- the License.  You may obtain a copy of the License at
-
-     http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
--->
-<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
-         xmlns:dc="http://purl.org/dc/elements/1.1/">
-  <rdf:Description
-      rdf:about="http://lucene.apache.org/tika/"
-      dc:title="Apache Tika"/>
-</rdf:RDF>

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testRFC822
----------------------------------------------------------------------
diff --git a/tika-test-resources/src/test/resources/test-documents/testRFC822 
b/tika-test-resources/src/test/resources/test-documents/testRFC822
deleted file mode 100644
index 22fbf15..0000000
--- a/tika-test-resources/src/test/resources/test-documents/testRFC822
+++ /dev/null
@@ -1,41 +0,0 @@
-From: "Julien Nioche (JIRA)" <[email protected]>
-To: [email protected]
-Subject: [jira] Commented: (TIKA-461) RFC822 messages not parsed
-Reply-To: [email protected]
-Delivered-To: mailing list [email protected]
-Date: Mon, 6 Sep 2010 05:25:34 -0400 (EDT)
-In-Reply-To: <6089099.260231278600349994.JavaMail.jira@thor>
-MIME-Version: 1.0
-Content-Type: text/plain; charset=utf-8
-Content-Transfer-Encoding: 7bit
-X-JIRA-FingerPrint: 30527f35849b9dde25b450d4833f0394
-X-Virus-Checked: Checked by ClamAV on apache.org
-
-
-    [ 
https://issues.apache.org/jira/browse/TIKA-461?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=12906468#action_12906468
 ] 
-
-Julien Nioche commented on TIKA-461:
-------------------------------------
-
-I'll have a look at mime4j and try to use it in Tika
-
-> RFC822 messages not parsed
-> --------------------------
->
->                 Key: TIKA-461
->                 URL: https://issues.apache.org/jira/browse/TIKA-461
->             Project: Tika
->          Issue Type: Bug
->          Components: parser
->    Affects Versions: 0.7
->            Reporter: Joshua Turner
->            Assignee: Julien Nioche
->
-> Presented with an RFC822 message exported from Thunderbird, AutodetectParser 
produces an empty body, and a Metadata containing only one key-value pair: 
"Content-Type=message/rfc822". Directly calling MboxParser likewise gives an 
empty body, but with two metadata pairs: "Content-Encoding=us-ascii 
Content-Type=application/mbox".
-> A quick peek at the source of MboxParser shows that the implementation is 
pretty naive. If the wiring can be sorted out, something like Apache James' 
mime4j might be a better bet.
-
--- 
-This message is automatically generated by JIRA.
--
-You can reply to this email to add a comment to the issue online.
-

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testRFC822-CC-BCC
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testRFC822-CC-BCC 
b/tika-test-resources/src/test/resources/test-documents/testRFC822-CC-BCC
deleted file mode 100644
index 6fe7c2e..0000000
--- a/tika-test-resources/src/test/resources/test-documents/testRFC822-CC-BCC
+++ /dev/null
@@ -1,44 +0,0 @@
-Message-ID: <4890112.1075845067403.JavaMail.evans@thyme>
-Date: Tue, 10 Apr 2001 11:52:00 -0700 (PDT)
-From: [email protected]
-To: [email protected], [email protected], [email protected],
-       [email protected], [email protected], [email protected],
-       [email protected],
-       [email protected], [email protected],
-       [email protected]
-Subject: Confidential Folder to safely pass information to  Arthur Andersen
-Cc: [email protected], [email protected],
-       [email protected], [email protected],
-       [email protected], [email protected], [email protected]
-Mime-Version: 1.0
-Content-Type: text/plain; charset=us-ascii
-Content-Transfer-Encoding: 7bit
-Bcc: [email protected], [email protected],
-       [email protected], [email protected],
-       [email protected], [email protected], [email protected]
-X-From: Beth Apollo <Beth Apollo/ENRON@enronXgate@ENRON>
-X-To: Shona Wilson <Shona Wilson/NA/Enron@Enron>, Jeffrey C Gossett <Jeffrey C 
Gossett/HOU/ECT@ECT>, Stacey W White <Stacey W White/HOU/ECT@ECT>, D Todd Hall 
<D Todd Hall/ENRON@enronXgate>, Sheri Thomas <Sheri Thomas/HOU/ECT@ECT>, Brenda 
F Herod <Brenda F Herod/ENRON@enronXgate>, 
[email protected]@SMTP 
<[email protected]@SMTP@enronXgate>, 
[email protected]@SMTP 
<[email protected]@SMTP@enronXgate>, 
[email protected]@SMTP 
<[email protected]@SMTP@enronXgate>, 
[email protected]@SMTP 
<[email protected]@SMTP@enronXgate>
-X-cc: Sally Beck <Sally Beck/HOU/ECT@ECT>, 
[email protected]@SMTP 
<[email protected]@SMTP@enronXgate>, Georgeanne Hodges 
<Georgeanne Hodges/ENRON@enronXgate>, Vanessa Schulte <Vanessa 
Schulte/ENRON@enronXgate>, Bob M Hall <Bob M Hall/NA/Enron@Enron>, Leslie 
Reeves <Leslie Reeves/HOU/ECT@ECT>, Brent A Price <Brent A 
Price/ENRON@enronXgate>
-X-bcc:
-X-Folder: \Beck, Sally\Beck, Sally\Apollo, Beth
-X-Origin: BECK-S
-X-FileName: Beck, Sally.pst
-
-
-We have become increasingly concerned about confidential information 
(dpr/position info, curves, validations/stress tests, etc) being passed to 
Arthur Andersen for audit purposes over the Web to their Arthur Andersen email 
addresses. (necessary now they no longer have access to Enron's internal email 
system)
-
-Please use the folder described below when passing any info (that you would 
have concerns about if it was picked up by a third party) via the shared drive 
that has been set up for this specific purpose.
-
-Note:  AA should also use the shared drive to pass info back if there are 
questions, or the data needs updating.  We should also consider the sensitivity 
of audit findings and special presentations if they are being distributed 
electronically.
-
-
-Please pass this note to others in your groups who have the need to pass info 
back and forth.
-
-
-Details on how to access for those who will use this method to pass info:
-
-A secured folder has been set up on the "o" drive under Corporate called 
Arthur_Andersen (O:\Corporate\Arthur_Anderson).  Please post all confidential 
files in this folder rather than emailing the files to their company email 
address.  If you need access to this folder, submit an eRequest through the IT 
Central site: http://itcentral.enron.com/Data/Services/SecurityRequests/.  
Arthur Andersen will be able to retrieve these files for review with their 
terminal server access at the Three Allen Center location.
-
-Please contact Vanessa Schulte if you have any problems or questions
-
-Beth Apollo
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testRFC822-big
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testRFC822-big 
b/tika-test-resources/src/test/resources/test-documents/testRFC822-big
deleted file mode 100644
index 6875959..0000000
--- a/tika-test-resources/src/test/resources/test-documents/testRFC822-big
+++ /dev/null
@@ -1,199 +0,0 @@
-Date: Thu, 7 Jun 2001 02:15:00 -0700 (PDT)
-Message-ID: <00000000EBC47FCC994BED47A6D939DDC8E5C58AC44E2000@PMZL01>
-MIME-Version: 1.0
-Content-Type: text/plain; charset=us-ascii
-Content-Transfer-Encoding: 7bit
-From:  Janette Elbertson
-To:  Alan Aronowitz, Sandi M Braband, Robert Bruce, Teresa G Bushman, Michelle 
Cash,
-        Dominic Carolan, Barton Clark, Harry M Collins, Mary Cook, Nancy 
Corbet, Ned
-        E Crady, Eddy Daniels, Angela Davis, Peter del Vecchio, Stacy E 
Dickson, Andrew
-        Edison, Roseann Engeldorf, Shawna Flynn, Robert H George, Barbara N 
Gray, Mark
-        Greenberg, Wayne Gresham, Leslie Hansen, Jeffrey T Hodge, Brent 
Hendry, Dan
-        J Hyvl, Anne C Koehler, Cheryl Lindeman, Dan Lyons, Kay Mann, Travis 
McCullough,
-        Lisa Mellencamp, Janet H Moore, Harlan Murphy, Julia Murray, Cheryl 
Nelson,
-        Gerald Nemec, Marcus Nettelton, Francisco Pinto Leite, David Portz, 
Coralina
-        Rivera, Michael A Robison, Daniel R Rogers, Elizabeth Sager, Richard B 
Sanders,
-        Frank Sayre, Lance Schuler-Legal, Sara Shackleton, Carlos Sole, Carol 
St Clair,
-        Lou Stoler, Mark Taylor, Sheila Tweed, Steve Van Hooser, John 
Viverito, Ann
-        Elizabeth White, Randy Young, Susan Bailey, Kimberlee A Bennick, 
Martha Braddy,
-        Sarah Bruck, Genia FitzGerald, Nony Flores, Diane Goode, Linda R 
Guinn, Marie
-        Heard, Ed B Hearn III, Mary J Heinitz, Tana Jones, Kathleen Carnahan, 
Deb Korkmas,
-        Laurie Mayer, Matt Maxwell, Mary Ogden, Stephanie Panus, Debra 
Perlingiere,
-        Robert Walker, Kay Young, Merrill W Haas, Samantha Ferguson, Majed 
Nachawati,
-        Suzanne Adams, Connie Castillo, Margaret Doucette, Keegan Farrell, 
Nita Garcia,
-        Carolyn George, Holly Keiser, MaryHelen Martinez, Taffy Milligan, 
Linda J Simmons,
-        Becky Spencer, Twanda Sweet, Alice Wright, Theresa Zucha, Reginald 
Shanks,
-        Elizabeth Lauterbach, Claudia Meraz
-Cc:  Gary Bode, Vanessa Griffin, Esmeralda Gonzalez, Martha Keesler, Rae 
Meadows,
-        Stephanie Truss
-Subject:  Outlook Migration - EWS Legal
-X-Filename:  sbailey2.nsf
-X-Folder:  \All documents
-X-SDOC:  421977
-X-ZLID:  zl-edrm-enron-v2-bailey-s-1216.eml
-
-Our department will be migrated to Outlook in two groups.  The first group
-will be migrated on Monday, June 11,  and the second group will be migrated
-on Tuesday, June 12.   You will receive four e-mails from the Outlook
-migration team.  Please do not delete them.  You will need to open the four
-e-mails and follow the instructions to migrate to Outlook.
-
-Assistants, you will be responsible for scheduling training for yourself and
-your assignments.  It is recommended everyone attend a one hour training
-class.  Training can be scheduled by contacting Maggie Cruz at extension
-3-1816.  (Assistants, please coordinate training with your backup so both of
-you are not in training at the same time.)  Outlook migration specialists
-will be on the 38th floor to answer questions Tuesday and Wednesday, June 12
-and 13.
-
-Listed below is useful information provided to us by the Outlook Migration
-team.
-
-E-mail Policies
-
-Users will be restricted to a Mailbox size of 100 MB.
-
-Further mailbox size restrictions are detailed as follows:
-
-Issue Warning at 75 MB - users are automatically sent a warning from the
-System Administrator explaining they are near their Mailbox limit.
-
-Prohibit Send at 100 MB - users are prevented from sending e-mail, yet they
-can still receive internal and external messages.  Users must reduce the size
-of their mailbox by deleting old mail, saving attachments to a local drive,
-etc. before they can send e-mail again.
-
-Inbound/Outbound Mail Size Limits - inbound and outbound e-mail messages will
-be limited to a size of 10MB.
-
-Deleted Item Retention - users will be able to recover deleted items from
-their mailbox as old as 8 days.  Deleted items include e-mail messages,
-folders, contacts, calendar entries, tasks, notes, journal entries and
-meeting notices.
-
-Archiving - archiving will not be a supported feature of Outlook 2000.
-
-Migration Preparation
-
-Clean Your Mailbox - due to new space limitations on your mailbox, you are
-advised to clean your Notes mailbox of old, unneeded messages BEFORE
-migration.  If you are at the 100MB limit on the day of migration, you will
-not be able to send messages once you are in Outlook.
-
-Limits on Items Migrated  - from the day of your migration, only 30 days of
-old mail will be migrated from your mailbox.  This includes mail in your
-inbox and other folders.  Calendar items dating back one year from the day of
-migration will be migrated (with the exception of repeating appointments).
-
-The following people will be migrated Monday evening, June 11.
-
-Adams, Suzanne
-Bushman, Teresa
-Cash, Michelle
-Clark, Bart
-Corbet, Nancy
-Daniels, Eddy
-Davis, Angela
-Dickson, Stacy
-Edison, Andy
-Elbertson, Janette
-FitzGerald, Genia
-Flores, Nony
-George, Robert H.
-Goode, Diane
-Guinn, Linda
-Haedicke, Mark
-Hansen, Leslie
-Hearn, Ed
-Heinitz, Mary
-Hodge, Jeff
-Legal Temp 1
-Legal Temp 2
-Legal Temp 3
-Legal Temp 4
-Mann, Kay
-Maxwell, Matt
-McCullough, Travis
-Meraz, Claudia
-Mellencamp, Lisa
-Milligan, Taffy
-Moore, Janet H.
-Nemec, Gerald
-Nettelton, Marcus
-Ogden, Mary
-Perlingiere, Debra
-Portz, David
-Sager, Elizabeth
-Sanders, Richard
-Simmons, Linda
-Sol,, Carlos
-St. Clair, Carol
-Sweet, Twanda
-Tweed, Sheila
-Van Hooser, Steve
-White, Ann Elizabeth
-Zucha, Theresa
-
-The following people will be migrated Tuesday evening, June 12.
-
-Aronowitz, Alan
-Bailey, Susan
-Boyd, Samantha
-Braddy, Martha
-Bruce, Robert
-Bruck, Sarah
-Carolan, Dominic
-Castillo, Connie
-Collins, Harry
-Cook, Mary
-Crady, Ned
-del Vecchio, Peter
-Doucette, Margaret
-Farrell, Keegan
-Ferguson, Samantha
-Garcia, Nita
-George, Carolyn
-Gray, Barbara
-Greenberg, Mark
-Gresham, Wayne
-Haas, Merrill
-Heard, Marie
-Hendry, Brent
-Jones, Tana
-Keiser, Holly
-Koehler, Anne
-Korkmas, Deb
-Lauterbach, Elizabeth
-Legal Temp 5
-Legal Temp 6
-Legal Temp 7
-Lindeman, Cheryl
-Lovelady, Steven
-Lyons, Dan
-Martinez, Mary Helen
-Mayer, Laurie
-Murray, Julia Heintz
-Nachawati, Majed
-Nelson,  Cheryl
-Panus, Stephanie
-Pinto Leite, Francisco
-Rivera, Coralina
-Robison, Michael
-Rogers, Daniel
-Sayre, Frank
-Shackleton, Sara
-Shanks, Reginald
-Spencer, Becky
-Stoler, Lou
-Taylor, Mark
-Viverito, John
-Young, Randy
-
-
-Many thanks for your help in making this a smooth migration to Outlook.
-
-Nony Flores and Janette Elbertson
-
-***********
-EDRM Enron Email Data Set has been produced in EML, PST and NSF format by ZL 
Technologies, Inc. This Data Set is licensed under a Creative Commons 
Attribution 3.0 United States License 
<http://creativecommons.org/licenses/by/3.0/us/> . To provide attribution, 
please cite to "ZL Technologies, Inc. (http://www.zlti.com)."
-***********
\ No newline at end of file

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testRFC822-limitedheaders
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testRFC822-limitedheaders
 
b/tika-test-resources/src/test/resources/test-documents/testRFC822-limitedheaders
deleted file mode 100644
index 8e3b765..0000000
--- 
a/tika-test-resources/src/test/resources/test-documents/testRFC822-limitedheaders
+++ /dev/null
@@ -1,9 +0,0 @@
-From: xyz, abc
-Sent: Monday, May 03, 2010 4:21 PM
-To: abc, def
-Subject: abcd
-
-foo:
-
-bar biz bat
-

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testRFC822-multipart
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testRFC822-multipart 
b/tika-test-resources/src/test/resources/test-documents/testRFC822-multipart
deleted file mode 100644
index 7c0a8c9..0000000
--- a/tika-test-resources/src/test/resources/test-documents/testRFC822-multipart
+++ /dev/null
@@ -1,111 +0,0 @@
-MIME-Version: 1.0
-Sender: [email protected]
-Received: by 10.231.31.200 with HTTP; Mon, 27 Sep 2010 06:29:16 -0700 (PDT)
-Date: Mon, 27 Sep 2010 14:29:16 +0100
-Delivered-To: [email protected]
-X-Google-Sender-Auth: it4o8JYLKcQ5bHJbTpqDhZv46vk
-Message-ID: <[email protected]>
-Subject: Test Multi Part Message
-From: DigitalPebble <[email protected]>
-To: [email protected]
-Content-Type: multipart/mixed; boundary=0016e64606800312ee04913db790
-
---0016e64606800312ee04913db790
-Content-Type: multipart/alternative; boundary=0016e64606800312ea04913db78e
-
---0016e64606800312ea04913db78e
-Content-Type: text/plain; charset=UTF-8
-
-This is a test for parsing multi-part mails. With some funky HTML code an a
-picture attached.
-
-Text specific to body 1.
-
--- 
-**
-*
-Open Source Solutions for Text Engineering
-
-http://digitalpebble.blogspot.com
-http://www.digitalpebble.com*
-
---0016e64606800312ea04913db78e
-Content-Type: text/html; charset=UTF-8
-Content-Transfer-Encoding: quoted-printable
-
-This is a test for parsing multi-part mails. With<span style=3D"color: rgb(=
-204, 0, 0);"> some funky HTML code</span> an a picture attached.<br clear=
-=3D"all"><br>-- <br><font face=3D"arial, helvetica, sans-serif"><b><span st=
-yle=3D"font-family: arial; font-weight: normal;"><b style=3D"color: rgb(0, =
-0, 0); font-family: arial,helvetica,sans-serif;"><img src=3D"http://digital=
-pebble.com/img/logo.gif" height=3D"38" width=3D"200"></b></span></b></font>=
-<div>
-<font face=3D"arial, helvetica, sans-serif"><b><span style=3D"font-family: =
-arial; font-weight: normal;"><b style=3D"color: rgb(0, 0, 0); font-family: =
-arial,helvetica,sans-serif;"><span style=3D"font-size: x-small;">=C2=A0</sp=
-an><br style=3D"font-family: arial,helvetica,sans-serif;">
-</b><span style=3D"color: rgb(102, 102, 102); font-family: arial,helvetica,=
-sans-serif;"><span style=3D"color: rgb(51, 51, 51);">Open Source Solutions =
-for Text Engineering</span><br>
-<span style=3D"font-size: x-small;">=C2=A0</span><br>
-</span></span><span style=3D"color: rgb(102, 102, 102);"><span style=3D"fon=
-t-weight: normal;"><a href=3D"http://digitalpebble.blogspot.com" target=3D"=
-_blank">http://digitalpebble.blogspot.com</a></span></span><span style=3D"f=
-ont-weight: normal;"><br style=3D"color: rgb(102, 102, 102);">
-</span>Text specific to body 2.
-<span style=3D"color: rgb(102, 102, 102);"><span style=3D"font-weight: norm=
-al;"><a href=3D"http://www.digitalpebble.com" target=3D"_blank">http://www.=
-digitalpebble.com</a></span></span></b></font></div><br>
-
---0016e64606800312ea04913db78e--
---0016e64606800312ee04913db790
-Content-Type: image/gif; name="logo.gif"
-Content-Disposition: attachment; filename="logo.gif"
-Content-Transfer-Encoding: base64
-X-Attachment-Id: f_geldjvqq0
-
-R0lGODlhNgE8AMQAALxlVPv19JmZmaysrNnZ2cR4acXFxaWlpd2yqeXl5dWelObFv82Lfu7Y1Ozs
-7L+/v////8BuXtGVibKysszMzPLi39/f3/fs6tmonsiBdOrPyeK7tP4BAgAAAAAAAAAAACH5BAUU
-ABwALAAAAAA2ATwAAAX/ICSOZGmeaKqubOu+cCzPdG3feK7vfO//wKBwSCwaj8ikcslsOp/QqHRK
-rVqv2KwW2mj0KprfZbEtm7eBBoIBACByjY0kAmDsKgtFoY0lTP4TDiYOgBMERISAh1IGhScLCJES
-DJSVEpEaFUxtnG44bJ12OQidfFcUAqkCCSYJqgIURK6qsSoGrEUTryegpb6cEgsBSL5vN71tojik
-pVioqrgks6m1QtOwKQSp0UO6qry/4ZwRGMNFxZ+lyjfMnc6v3CLX1UHzJ4TQRt6p4OL+EZqIoDum
-Tkc7Tu/ylbA3hGGJZ9v07TKBzF84L0MG2qi4zsZBU1YgrjIRgIJJCvF+/5Q8mRKCyJY/9gnoZ1Fc
-hAsZSxnbWHCUr4QRy7yU+I2iry5dNCCYI05Bzk47a3A0+PMUPDNDc00sUREAigV7fpkDolFqz2VV
-Q14VupaITJoIUQSQ8ItMkLI0pvpsZlXhlqxut5LoqiJA2E4YhOCdoRct3yUWKAAyQGAsYGkJMo9V
-QaDRH8qbM2s+ITpB6MwPXqEUXTjyg0IGULZ4a/QxCgy+OpoYg6ESAwTCWqC7sEFBJQwbArKYGmBB
-b0oKEGB08dHriwrFLSEIE0PkK1jDLstTXTj1d1rDrqV0COG8exQEBrj/TmGzCdpc06JokDtFg66d
-SDAdCr4ooIA4BSBgX/9tnGSAAB2/RKAATixU5wJYNk3YggXzvTJASW2NwF4JHHaYygAOqNcKeSOY
-WBQJDhzg4isHCIICfoPpdwJ/Z5FwAYC/SLDgCDVFyB0KQFoUFQoWrtDAYUquoM2MAhxgQIjj0QIf
-ldRgCQF7VJbgAJffDQkBjiMQpgKPoZhQAYRFAgAQgXH6khiSdapjpghNprBAngBkYOY1qUywGgHm
-ubceiwud98BqFCR63qJajnCSTI+eREIA5w1AgQWiRerojYKlqaMJ1S3ZAJx1zmkCoKXcySCsGajQ
-5wkbwBrokDKqckBKAcjkl4iMktBrKr+2cqyXI4og3giSjnSPfK8Miab/CGqmAGUbdonwZjgZULJt
-gwsiSEkG/hyZY4SV+CMrqqeO8Gc4lbDaiVMP0bhntNJKU6yzHu5JLbP/AjzsCJx6WcJ3LV0LQba4
-/kKhCOiWEoGCPlbnSQm/aEiCBnT5EsGCXTEwIAQV4PbLySPc6qO9ABTQrbchl3LysjamMHBQ/lZK
-wnc5n5AwwT6T8KxLr0zAwpVFj+AwxJtqXGvLIitXwredjMxxrCloADO+6zaYQgUVd1IAk/E+7Iug
-X/U3QompPMACoZRSQ+IrBrDgXd3YmHC0SBawAHffJTzty8Qoa4ABzNySALPVJszbyQZbQ6WC5OPY
-19gJWHfCMgQue+tL/wF7QnBgKcoxnUrQKSzLNz0QSFp6i0Tb7bfCIgSQAOwoNHtmqdjqysk6mLcB
-trY9QrBYfqXMrHabthZ4Quim++L8bhrt7ILq/RLb9LEHuCDT6yccLYPvhgt/Ewk1cwL59Dou/7H0
-YSezQgCjw2/bCPZG0EJjSXPB4Mj3M1XIrQXP8p35XOAARNHnBOmDVQEgt62zsUADvrCa/EjgNlNB
-TwVQ49OpLkC/FahsHLl7xQFZMKaDfalYvitf7QhnNNz1jgCRElbBfvei+tVJSK8S3lE4qBMWjIt5
-w2PB6TwHr/1BgE1CjEsMTzBDekyxUS5UoA1H4EAy8Y6H/JhVkRTwOf8oRhEAA9qgB93hQ900kYkl
-CJ3GhJcl27Wgij2z4wpUhEU9WmqL3uHSFyPYIHX8Rl0mMGMUNVjEFUBtc2iz2RvjQoI5wsp/L2ya
-CvDoPT+mgI95pOEfXTiCnc3HUCnaISFBEgNFCrFynFgSXFj5vCSuoDosk+MZbXnFhWURhjuU4S81
-iTRSQsCUhXqUaUI5SODVkpKt3GUbpkakRqqgbG3A5BrtZ8IMTpKWoJMmAGSlQhcMrXt1pOE5V7iC
-BO7wb995AEzS2cwebhOcLiChNW2gRhF0MHgfTEEIw+nE4qHxBh5yASg7KcqEtkBSBMwXKb+zCM6o
-0pkDdcE/a9DPCtj/CYncVIG9qFnJUylSljGQyewMxjOGwk6ld+SkRFuaTnamQCT1DCNI8ekCbMpp
-pSzoZ3WcB8lElrCkTsRf8mQgkoqqYGcRZakAnIqCwaEzk54sJk21KoDAsWBnOZ2JGK0zgxPGEgdq
-NIwvNLfUErSvDYgUoRMh4NOD1uCc4dsjw1akSX2tQFhRHeVWFziCFhJzlWSVgUct9j6SqECNS+TE
-8QBqy7aVwoLfTOwIclUKtt0vBZLK21P32kdRxq6cKeDeVrXoQpx+9YH3wWjaXNCVCMS1kpg9gS8k
-IJfIcoJlFSEdCji7T6R24n0BgFkGGps7CUwWRhQF7aT4mtV4Dkm1/6t9Z8GukVfpxhOCsp3rC1xZ
-hwUo5wINWFzj6NRZDZjjAopj3HOfmc0FUCgNCBhXzFJQHcpl1ngamBgYloi4Eqj2AfZJADKv6rsp
-+YoCNgoAAZYlUxJYNSXWJQ2FCwVee1IWmmXVVW5hKcEhJalIzCWo2VBQ1zGO9juGooABdgZV6ppW
-BPzqUI1L+0XDnsccgTQAqBLQmWXtTGmx9TB9NTsD38bpev5UH3NPbBEojwCDR0VYi2tS4BIsuFMD
-tPEXcUwlHFbYWPOJhg47hGDtJVmnPmRyk2nFXkAtV6C6su396LWgAGzZXe100QR0d2YSbdhXrBAJ
-67B6YwhYtWg5Pv/PIgD3ZrHuVM4z0IB+6dXlKGfzreEoBwjvVSQGdNoETgbAfPnEuFCvNAA5PsAi
-FkpPwT1gYAd4gFe5SppgfmnDNo3PfDy1mQAWLrxs1MEC/hwzDKRYeZygXANA3YYCYODUYePtBRTA
-OAl9Ti4+fZfQ8uuPDGwA2707CQEWjQSHxcABJ0HJkHQX72WeYVMNgEQkgNMAoO7bv7lTw74bgO4S
-6BtjI4jDvjNBA6UAB6giQO8G9r2db99bBPvo7sU3zvGO14ACA3hUZWLKYY+b/OQoF2Yqdp2CwY05
-5TCP+RYGZ9MT7IzdMs+5zqkQXe+WfOdAD3oUovWARU8YaEJPutI9l3DKPxyaqkuPutR94OMyT/3q
-WO9BpGGM86x7/evmnLF7BmCAroP97GhXQYoyY/a0u/3tcI+73OdOd46HAAA7
---0016e64606800312ee04913db790--

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testRFC822_base64
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testRFC822_base64 
b/tika-test-resources/src/test/resources/test-documents/testRFC822_base64
deleted file mode 100644
index 6060095..0000000
--- a/tika-test-resources/src/test/resources/test-documents/testRFC822_base64
+++ /dev/null
@@ -1,8 +0,0 @@
-To: Nobody <[email protected]>
-From: Nowhere <[email protected]>
-Subject: This tests a base64 encoded body
-MIME-Version: 1.0
-Content-Type: text/plain; charset=ISO-8859-1
-Content-Transfer-Encoding: base64
-
-SGVyZSBpcyBzb21lIHRleHQsIHdpdGggaW50ZXJuYXRpb25hbCBjaGFyYWN0ZXJzLCB2b2ls4CE=

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testRFC822_encrypted_zip
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testRFC822_encrypted_zip
 
b/tika-test-resources/src/test/resources/test-documents/testRFC822_encrypted_zip
deleted file mode 100644
index 5f0780f..0000000
--- 
a/tika-test-resources/src/test/resources/test-documents/testRFC822_encrypted_zip
+++ /dev/null
@@ -1,61 +0,0 @@
-Return-Path: <[email protected]>
-X-Spam-Checker-Version: SpamAssassin 3.3.1 (2010-03-16) on
-       virt0003.codenomicon.com
-X-Spam-Level: 
-X-Spam-Status: No, score=-2.7 required=5.0 tests=BAYES_00,DKIM_SIGNED,
-       DKIM_VALID,DKIM_VALID_AU,FREEMAIL_FROM,HTML_MESSAGE,RCVD_IN_DNSWL_LOW,
-       SPF_PASS autolearn=ham version=3.3.1
-Received: from mail-wg0-f48.google.com (mail-wg0-f48.google.com [74.125.82.48])
-       by codenomicon.com (8.14.4/8.14.4) with ESMTP id t0G7ZmGs002981
-       (version=TLSv1/SSLv3 cipher=DHE-RSA-AES256-SHA bits=256 verify=OK)
-       for <[email protected]>; Fri, 16 Jan 2015 07:35:54 GMT
-Received: by mail-wg0-f48.google.com with SMTP id l2so19028230wgh.7
-        for <[email protected]>; Thu, 15 Jan 2015 23:35:48 -0800 (PST)
-DKIM-Signature: v=1; a=rsa-sha256; c=relaxed/relaxed;
-        d=gmail.com; s=20120113;
-        h=mime-version:from:date:message-id:subject:to:content-type;
-        bh=wjcer9ESeBUN8rAEahqeDiOHf3wqBHgaeAboZtkw8qM=;
-        b=S3ezJU84qISP1OzMoH+wLMxn7y1JkcJwlUs4Uvfy+QlaSFcDcG66oxqsxniQ4kWmCC
-         QdQ94iztFvcvTAHuJys+jAH1UeVQKgs6T5lINj73nww3CKGh1B78LpnCRkFS93o19Zvt
-         QDSDtB23y9FlLF/dH6okvTIq7jQXNPuaDDqY8yJtp+DcYfW+QiNIGI83QievgQlWMRiV
-         fHuCbeEofTRP/82vHxUDVoZo/hwx8OAjWqPitrCmxU7Mly8lG5No1CHsKWmWd2Q+yxN3
-         tC3Ptbrig720BdBZKYwWSI6xBS4AY+46+utaloq9Hr0qpaDf5e9eXqq0ef0efDgd2kJT
-         gmyw==
-X-Received: by 10.180.39.204 with SMTP id r12mr3350467wik.11.1421393748083;
- Thu, 15 Jan 2015 23:35:48 -0800 (PST)
-MIME-Version: 1.0
-From: Juha Haaga <[email protected]>
-Date: Fri, 16 Jan 2015 07:35:46 +0000
-Message-ID: 
<cao2pydsg81q7pb4sb+2gt02-8pefgmq7qvw5zqfe5xage6w...@mail.gmail.com>
-Subject: Test mail for Tika
-To: Juha Haaga <[email protected]>
-Content-Type: multipart/mixed; boundary=001a11c3649c712d2a050cc0050f
-
---001a11c3649c712d2a050cc0050f
-Content-Type: multipart/alternative; boundary=001a11c3649c712d27050cc0050d
-
---001a11c3649c712d27050cc0050d
-Content-Type: text/plain; charset=UTF-8
-
-Includes encrypted zip file as attachment. password is "test".
-This is the Plain Text part
-
---001a11c3649c712d27050cc0050d
-Content-Type: text/html; charset=UTF-8
-
-Includes encrypted zip file as attachment. password is &quot;test&quot;.<br/>
-This is the HTML part
-
---001a11c3649c712d27050cc0050d--
---001a11c3649c712d2a050cc0050f
-Content-Type: application/zip; name="test.zip"
-Content-Disposition: attachment; filename="test.zip"
-Content-Transfer-Encoding: base64
-X-Attachment-Id: 14af1ab4e8dbb946bc5
-
-UEsDBBQACQAIAP1LMEZzIEVkVQAAAE4AAAAIABwAdGV4dC50eHRVVAkAA26+uFSNvrhUdXgLAAEE
-9gEAAAQUAAAAypmn5/WV8PAdMdAB7WIFh/oQZw9KUG57D9/+Sl/mWzAaa2mMH3uENWiIVoypnqB2
-2GFSwihoRH4krgegW8EXEN3YbDQGBTvfEa6p3d/0V0EfZO4F31BLBwhzIEVkVQAAAE4AAABQSwEC
-HgMUAAkACAD9SzBGcyBFZFUAAABOAAAACAAYAAAAAAABAAAApIEAAAAAdGV4dC50eHRVVAUAA26+
-uFR1eAsAAQT2AQAABBQAAABQSwUGAAAAAAEAAQBOAAAApwAAAAAA
---001a11c3649c712d2a050cc0050f--

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testRFC822_i18nheaders
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testRFC822_i18nheaders 
b/tika-test-resources/src/test/resources/test-documents/testRFC822_i18nheaders
deleted file mode 100644
index f711a27..0000000
--- 
a/tika-test-resources/src/test/resources/test-documents/testRFC822_i18nheaders
+++ /dev/null
@@ -1,9 +0,0 @@
-From: =?ISO-8859-1?Q?Keld_J=F8rn_Simonsen?= <[email protected]>
-To: Nobody in Particular <[email protected]>
-Subject: =?ISO-8859-1?B?SWYgeW91IGNhbiByZWFkIHRoaXMgeW8=?=
- =?ISO-8859-2?B?dSB1bmRlcnN0YW5kIHRoZSBleGFtcGxlLg==?=
-MIME-Version: 1.0
-Content-type: text/plain
-Content-transfer-encoding: 7bit
-
-Examples taken from RFC 2047. 

http://git-wip-us.apache.org/repos/asf/tika/blob/38916f89/tika-test-resources/src/test/resources/test-documents/testRFC822_normal_zip
----------------------------------------------------------------------
diff --git 
a/tika-test-resources/src/test/resources/test-documents/testRFC822_normal_zip 
b/tika-test-resources/src/test/resources/test-documents/testRFC822_normal_zip
deleted file mode 100644
index 86dc0c6..0000000
--- 
a/tika-test-resources/src/test/resources/test-documents/testRFC822_normal_zip
+++ /dev/null
@@ -1,61 +0,0 @@
-Return-Path: <[email protected]>
-X-Spam-Checker-Version: SpamAssassin 3.3.1 (2010-03-16) on
-       virt0003.codenomicon.com
-X-Spam-Level: 
-X-Spam-Status: No, score=-2.7 required=5.0 tests=BAYES_00,DKIM_SIGNED,
-       DKIM_VALID,DKIM_VALID_AU,FREEMAIL_FROM,HTML_MESSAGE,RCVD_IN_DNSWL_LOW,
-       SPF_PASS autolearn=ham version=3.3.1
-Received: from mail-wg0-f48.google.com (mail-wg0-f48.google.com [74.125.82.48])
-       by codenomicon.com (8.14.4/8.14.4) with ESMTP id t0G7ZmGs002981
-       (version=TLSv1/SSLv3 cipher=DHE-RSA-AES256-SHA bits=256 verify=OK)
-       for <[email protected]>; Fri, 16 Jan 2015 07:35:54 GMT
-Received: by mail-wg0-f48.google.com with SMTP id l2so19028230wgh.7
-        for <[email protected]>; Thu, 15 Jan 2015 23:35:48 -0800 (PST)
-DKIM-Signature: v=1; a=rsa-sha256; c=relaxed/relaxed;
-        d=gmail.com; s=20120113;
-        h=mime-version:from:date:message-id:subject:to:content-type;
-        bh=wjcer9ESeBUN8rAEahqeDiOHf3wqBHgaeAboZtkw8qM=;
-        b=S3ezJU84qISP1OzMoH+wLMxn7y1JkcJwlUs4Uvfy+QlaSFcDcG66oxqsxniQ4kWmCC
-         QdQ94iztFvcvTAHuJys+jAH1UeVQKgs6T5lINj73nww3CKGh1B78LpnCRkFS93o19Zvt
-         QDSDtB23y9FlLF/dH6okvTIq7jQXNPuaDDqY8yJtp+DcYfW+QiNIGI83QievgQlWMRiV
-         fHuCbeEofTRP/82vHxUDVoZo/hwx8OAjWqPitrCmxU7Mly8lG5No1CHsKWmWd2Q+yxN3
-         tC3Ptbrig720BdBZKYwWSI6xBS4AY+46+utaloq9Hr0qpaDf5e9eXqq0ef0efDgd2kJT
-         gmyw==
-X-Received: by 10.180.39.204 with SMTP id r12mr3350467wik.11.1421393748083;
- Thu, 15 Jan 2015 23:35:48 -0800 (PST)
-MIME-Version: 1.0
-From: Juha Haaga <[email protected]>
-Date: Fri, 16 Jan 2015 07:35:46 +0000
-Message-ID: 
<cao2pydsg81q7pb4sb+2gt02-8pefgmq7qvw5zqfe5xage6w...@mail.gmail.com>
-Subject: Test mail for Tika
-To: Juha Haaga <[email protected]>
-Content-Type: multipart/mixed; boundary=001a11c3649c712d2a050cc0050f
-
---001a11c3649c712d2a050cc0050f
-Content-Type: multipart/alternative; boundary=001a11c3649c712d27050cc0050d
-
---001a11c3649c712d27050cc0050d
-Content-Type: text/plain; charset=UTF-8
-
-Includes a normal, unencrypted zip file as attachment.
-This is the Plain Text part
-
---001a11c3649c712d27050cc0050d
-Content-Type: text/html; charset=UTF-8
-
-Includes &quot;normal&quot;, unencrypted zip file as attachment.<br />
-This is the HTML part
-
---001a11c3649c712d27050cc0050d--
---001a11c3649c712d2a050cc0050f
-Content-Type: application/zip; name="test.zip"
-Content-Disposition: attachment; filename="test.zip"
-Content-Transfer-Encoding: base64
-X-Attachment-Id: 14af1ab4e8dbb946bc5
-
-UEsDBBQAAgAIAKt+MEYEXs11bwAAAHgAAAAIABwAdGV4dC50eHRVVAkAA/IzuVSNvrhUdXgLAAEE
-6AMAAAToAwAADcxBCsJADEbh/Zzi9wCKduV2QIXiQrC5QNuJNFqmQ5MB6+kNvOXHo2tHuESKuD2e
-oPYeDyHQJArP+GuQrJIYfUbNnMd1K8YJPyl4ycyuW4NOS50TBkZZl5FVXQwbSD493lXNaeadj/2/
-Px2bc/gDUEsBAh4DFAACAAgAq34wRgRezXVvAAAAeAAAAAgAGAAAAAAAAQAAAKSBAAAAAHRleHQu
-dHh0VVQFAAPyM7lUdXgLAAEE6AMAAAToAwAAUEsFBgAAAAABAAEATgAAALEAAAAAAA==
---001a11c3649c712d2a050cc0050f--

Reply via email to