Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
18 commits
Select commit Hold shift + click to select a range
7914318
added version-specific mime-type definitions for Quattro for DOS and …
bitsgalore Sep 16, 2017
b5c07d5
added missing glob patterns to old Quattro Pro definition
bitsgalore Sep 16, 2017
1fd441e
deleted existing entry for application/x-123 b/c of collisions with Q…
bitsgalore Sep 16, 2017
e6d332d
added version-specific mime-type definitions for Lotus 1-2-3
bitsgalore Sep 16, 2017
85d25cc
removed glob pattern for .wks to avoid conflict with vnd.ms-works
bitsgalore Sep 16, 2017
c8deb97
modified quattro pro version fields so they are consistent with wb3 a…
bitsgalore Sep 16, 2017
73d37e6
added test documents for wk1, wk3, wq1 and wq2 formats
bitsgalore Sep 16, 2017
83832cb
added reference to PRONOM / TNA and the Open Government License to NO…
bitsgalore Sep 16, 2017
817f848
added mimetype definition for Lotus 1-2-3 97/9.x
bitsgalore Sep 17, 2017
b2a0b78
added test documents for Lotus 1-2-3 v4 and 97/9.x formats
bitsgalore Sep 17, 2017
6c60f5c
added suffix to Lotus samples from Lotus FTP site
bitsgalore Sep 18, 2017
c5f0de1
removed old entry for .123 extension
bitsgalore Sep 18, 2017
920f682
fixed indentation
bitsgalore Sep 18, 2017
5e6b2c6
created entry for application/vnd.lotus-1-2-3
bitsgalore Sep 18, 2017
be9d440
commented out glob pattern for wks because it creates a conflict
bitsgalore Sep 18, 2017
6844d90
added samples for .wb1, .wb2 and .wks (all created using Quattro Pro …
bitsgalore Sep 18, 2017
6744383
added mimetype definition for WordPerfect 4.2, based on Philip Storry'…
bitsgalore Sep 19, 2017
8c7c760
added WordPerfect 4.2 sample file (made with WordPerfect 6.1 for Wind…
bitsgalore Sep 19, 2017
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
4 changes: 4 additions & 0 deletions NOTICE.txt
Original file line number Diff line number Diff line change
Expand Up @@ -15,3 +15,7 @@ Tika-parsers component uses CDDL/LGPL dual-licensed dependency: jhighlight (http
OpenCSV: Copyright 2005 Bytecode Pty Ltd. Licensed under the Apache License, Version 2.0

IPTC Photo Metadata descriptions Copyright 2010 International Press Telecommunications Council.

Tika-mimetypes.xml includes mimetype definitions that were adapted from the PRONOM Technical Registry
by The National Archives (http://www.nationalarchives.gov.uk/PRONOM/Default.aspx). PRONOM is published
under the Open Government Licence v3.0 (http://www.nationalarchives.gov.uk/doc/open-government-licence/version/3/).
128 changes: 121 additions & 7 deletions tika-core/src/main/resources/org/apache/tika/mime/tika-mimetypes.xml
Original file line number Diff line number Diff line change
Expand Up @@ -1498,9 +1498,69 @@
<mime-type type="application/vnd.llamagraphics.life-balance.exchange+xml">
  <!-- Registered by file name only: this entry has no magic. -->
  <glob pattern="*.lbe"/>
</mime-type>

<mime-type type="application/vnd.lotus-1-2-3">
  <!-- Generic Lotus 1-2-3 entry. It carries only an alias and file name
       patterns; the magic values live in the version-specific entries
       that name this type in their sub-class-of element. -->
  <alias type="application/x-123"/>
  <_comment>Lotus 1-2-3</_comment>
  <!-- Disabled on purpose, conflicts with application/vnd.ms-works:
  <glob pattern="*.wks"/>
  -->
  <glob pattern="*.wk1"/>
  <glob pattern="*.wk2"/>
  <glob pattern="*.wk3"/>
  <glob pattern="*.wk4"/>
  <glob pattern="*.123"/>
</mime-type>

<mime-type type="application/vnd.lotus-1-2-3;version=1">
  <!-- Version 1 has no active file name pattern, only the magic below. -->
  <sub-class-of type="application/vnd.lotus-1-2-3"/>
  <_comment>Lotus 1-2-3, version 1</_comment>
  <magic priority="50">
    <!-- Value expected at offset 0. -->
    <match offset="0" type="string" value="0x000002000404"/>
  </magic>
  <!-- Disabled on purpose, conflicts with application/vnd.ms-works:
  <glob pattern="*.wks"/>
  -->
</mime-type>

<mime-type type="application/vnd.lotus-1-2-3;version=2">
  <!-- Shares its first four hex pairs (00 00 02 00) with the version 1
       value; the remaining pairs differ. -->
  <sub-class-of type="application/vnd.lotus-1-2-3"/>
  <_comment>Lotus 1-2-3, version 2</_comment>
  <magic priority="50">
    <!-- Value expected at offset 0. -->
    <match offset="0" type="string" value="0x00000200060406000800"/>
  </magic>
  <glob pattern="*.wk1"/>
  <glob pattern="*.wk2"/>
</mime-type>

<mime-type type="application/vnd.lotus-1-2-3;version=3">
  <!-- The version 3, version 4 and version 97+9.x values in this file
       differ only in their fifth hex pair (00, 02 and 03). -->
  <sub-class-of type="application/vnd.lotus-1-2-3"/>
  <_comment>Lotus 1-2-3, version 3</_comment>
  <magic priority="50">
    <!-- Value expected at offset 0; fifth hex pair is 00. -->
    <match offset="0" type="string" value="0x00001A0000100400"/>
  </magic>
  <glob pattern="*.wk3"/>
</mime-type>

<mime-type type="application/vnd.lotus-1-2-3;version=4">
  <!-- The type parameter says version=4 while the description covers
       versions 4-5; both are kept exactly as declared. -->
  <sub-class-of type="application/vnd.lotus-1-2-3"/>
  <_comment>Lotus 1-2-3, version 4-5</_comment>
  <magic priority="50">
    <!-- Value expected at offset 0; fifth hex pair is 02. -->
    <match offset="0" type="string" value="0x00001A0002100400"/>
  </magic>
  <glob pattern="*.wk4"/>
</mime-type>

<mime-type type="application/vnd.lotus-1-2-3;version=97+9.x">
  <!-- Entry for the *.123 extension; the description reads
       "version 97/9.x" while the type parameter spells it 97+9.x. -->
  <sub-class-of type="application/vnd.lotus-1-2-3"/>
  <_comment>Lotus 1-2-3, version 97/9.x</_comment>
  <magic priority="50">
    <!-- Value expected at offset 0; fifth hex pair is 03. -->
    <match offset="0" type="string" value="0x00001A0003100400"/>
  </magic>
  <glob pattern="*.123"/>
</mime-type>

<mime-type type="application/vnd.lotus-approach">
  <!-- Registered by file name only: this entry has no magic. -->
  <glob pattern="*.apr"/>
</mime-type>
Expand Down Expand Up @@ -2665,6 +2725,14 @@

</mime-type>
<!-- TODO: figure out how to identify versions earlier than 4.2 -->
<mime-type type="application/vnd.wordperfect;version=4.2">
  <sub-class-of type="application/vnd.wordperfect"/>
  <magic priority="50">
    <!-- Outer value at offset 0, with a nested check for 0xCB at
         offset 5. -->
    <match offset="0" type="string" value="0xCB0A01">
      <match offset="5" type="string" value="0xCB"/>
    </match>
  </magic>
</mime-type>
<mime-type type="application/vnd.wordperfect;version=5.0">
<sub-class-of type="application/vnd.wordperfect"/>
<magic priority="50">
Expand Down Expand Up @@ -2776,13 +2844,6 @@
<glob pattern="*.wspolicy"/>
</mime-type>

<mime-type type="application/x-123">
  <!-- Generic 4-byte values. Both are prefixes of the longer
       version-specific Lotus 1-2-3 values in this file, and 0x00000200 is
       also a prefix of the Quattro Pro values, so this entry on its own
       cannot tell those formats apart.
       NOTE(review): application/x-123 is also listed as an alias of
       application/vnd.lotus-1-2-3; confirm which declaration should stay. -->
  <magic priority="50">
    <match offset="0" type="big32" value="0x00001a00"/>
    <match offset="0" type="big32" value="0x00000200"/>
  </magic>
</mime-type>

<mime-type type="application/x-abiword">
  <!-- Registered by file name only: this entry has no magic. -->
  <glob pattern="*.abw"/>
</mime-type>
Expand Down Expand Up @@ -3829,12 +3890,65 @@
</_comment>
<!-- qp2 and wb3 are currently detected by POIFSContainerDetector;
wb1 and wb2 are detected by the magic of the version-specific
application/x-quattro-pro entries in this file -->
<glob pattern="*.wq1"/>
<glob pattern="*.wq2"/>
<glob pattern="*.wkq"/>
<glob pattern="*.qpw"/>
<glob pattern="*.wb1"/>
<glob pattern="*.wb2"/>
<glob pattern="*.wb3"/>
</mime-type>

<mime-type type="application/x-quattro-pro;version=1-4">
  <!-- DOS releases 1-4. The value differs from the version=5 one only in
       its fifth hex pair (20 here, 21 there). *.wkq is listed on both
       DOS entries. -->
  <sub-class-of type="application/x-quattro-pro"/>
  <_comment>Quattro Pro for DOS, version 1-4</_comment>
  <magic priority="50">
    <!-- Value expected at offset 0. -->
    <match offset="0" type="string" value="0x000002002051"/>
  </magic>
  <glob pattern="*.wq1"/>
  <glob pattern="*.wkq"/>
</mime-type>

<mime-type type="application/x-quattro-pro;version=5">
  <!-- DOS release 5. The value differs from the version=1-4 one only in
       its fifth hex pair (21 here, 20 there). *.wkq is listed on both
       DOS entries. -->
  <sub-class-of type="application/x-quattro-pro"/>
  <_comment>Quattro Pro for DOS, version 5</_comment>
  <magic priority="50">
    <!-- Value expected at offset 0. -->
    <match offset="0" type="string" value="0x000002002151"/>
  </magic>
  <glob pattern="*.wq2"/>
  <glob pattern="*.wkq"/>
</mime-type>

<!-- First Quattro Pro for Windows had major version number 1, which
was followed by 5. This is confusing, perhaps adding "win" qualifier to version
field could clear this up (but it's quite ugly as well) -->

<mime-type type="application/x-quattro-pro;version=1+5">
  <!-- Windows releases 1 and 5 share this single entry and the *.wb1
       extension. -->
  <sub-class-of type="application/x-quattro-pro"/>
  <_comment>Quattro Pro for Windows, version 1, 5</_comment>
  <magic priority="50">
    <!-- Value expected at offset 0. -->
    <match offset="0" type="string" value="0x000002000110"/>
  </magic>
  <glob pattern="*.wb1"/>
</mime-type>

<mime-type type="application/x-quattro-pro;version=6">
  <!-- Windows release 6 (*.wb2). The value differs from the version=1+5
       one only in its fifth hex pair (02 here, 01 there). -->
  <sub-class-of type="application/x-quattro-pro"/>
  <_comment>Quattro Pro for Windows, version 6</_comment>
  <magic priority="50">
    <!-- Value expected at offset 0. -->
    <match offset="0" type="string" value="0x000002000210"/>
  </magic>
  <glob pattern="*.wb2"/>
</mime-type>

<!-- Quattro Pro for Windows 7-8 (wb3) and 9 (qpw) files are
currently detected by POIFSContainerDetector
-->

<mime-type type="application/xquery">
<_comment>XQuery source code</_comment>
<glob pattern="*.xq"/>
Expand Down
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.