This is an automated email from the ASF dual-hosted git repository.
tallison pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/tika.git
The following commit(s) were added to refs/heads/main by this push:
new 019041117 TIKA-4257 -- lower dbf priority (#1773)
019041117 is described below
commit 019041117149667bc4d18fabf222a0670d407959
Author: Tim Allison <[email protected]>
AuthorDate: Mon May 20 16:29:29 2024 -0400
TIKA-4257 -- lower dbf priority (#1773)
---
tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml | 3 ++-
.../src/test/java/org/apache/tika/parser/crypto/TSDParserTest.java | 2 +-
2 files changed, 3 insertions(+), 2 deletions(-)
diff --git a/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml b/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
index 94318a0ca..279632018 100644
--- a/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
+++ b/tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
@@ -157,7 +157,8 @@
<glob pattern="*.davmount"/>
</mime-type>
<mime-type type="application/x-dbf">
- <magic priority="100">
+ <!-- this looks unique/precise. It isn't. False positives are common. Keep priority low. -->
+ <magic priority="40">
<match
value="(?s)^[\\x02\\x03\\x30\\x31\\x32\\x43\\x63\\x83\\x8B\\xCB\\xF5\\xE5\\xFB].[\\x01-\\x0C][\\x01-\\x1F].{4}(?:.[^\\x00]|[\\x41-\\xFF].)(?:[^\\x00\\x01].|.[^\\x00]).{31}(?<=[\\x00][^\\x00]{0,10})[A-Z@+]"
type="regex" offset="0"/>
</magic>
<glob pattern="*.dbf"/>
diff --git
a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-crypto-module/src/test/java/org/apache/tika/parser/crypto/TSDParserTest.java
b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-crypto-module/src/test/java/org/apache/tika/parser/crypto/TSDParserTest.java
index 2789ef114..02ba1f7a7 100644
--- a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-crypto-module/src/test/java/org/apache/tika/parser/crypto/TSDParserTest.java
+++ b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-crypto-module/src/test/java/org/apache/tika/parser/crypto/TSDParserTest.java
@@ -116,7 +116,7 @@ public class TSDParserTest extends TikaTest {
@Test
public void testTSDFileDataRecursiveMetadataXML() throws Exception {
List<Metadata> list = getRecursiveMetadata("MANIFEST.XML.TSD");
- assertEquals(2, list.size());
+ assertEquals(3, list.size());
assertContains(TSDParser.class.getName(),
Arrays.asList(list.get(0).getValues(TikaCoreProperties.TIKA_PARSED_BY)));
}