<?xml version="1.0" encoding="UTF-8"?>
<!--
Licensed to the Apache Software Foundation (ASF) under one or more contributor
license agreements. See the NOTICE.txt file distributed with this work for
additional information regarding copyright ownership. The ASF licenses this
file to you under the Apache License, Version 2.0 (the "License"); you may not
use this file except in compliance with the License. You may obtain a copy of
the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
License for the specific language governing permissions and limitations under
the License.
-->
<!-- Root of the mime-type to extractor mapping. mimeRepo names the mime-type
     definitions file that the <mime type="..."> entries below refer to.
     NOTE(review): magic="false" presumably turns off magic-byte detection
     when typing products; confirm against the config reader. -->
<cas:mimetypemap xmlns:cas="http://oodt.jpl.nasa.gov/1.0/cas"
                 magic="false"
                 mimeRepo="mime-types.xml">
<!-- This will be the default extractor used if a product doesn't match any
of the mime-types defined in the mime-types.xml file (this element is optional) -->
<default>
  <!-- A default NamingConvention may be declared here as well, e.g.:
  <namingConvention id="PDFNamingConv" />
  -->
  <!-- Several extractor elements may be listed here when more than one is
       needed; the extractor element is optional, so the one below may be
       removed. -->
  <extractor class="org.apache.oodt.cas.metadata.extractors.MetReaderExtractor"/>
</default>
<mime type="all/products">
  <!-- Exactly one extractor is registered for this type. -->
  <extractor class="org.apache.oodt.cas.metadata.extractors.MetReaderExtractor"/>
</mime>
<!-- Example type where the PGE generates a metadata file for the product, but
the product also needs additional metadata extracted from it. In the
mime-types.xml file, txt/product has super type all/products, which means
that for any product that is a txt/product, the all/products extractors
will first be run on it (in this case, just one extractor, which reads
in the existing metadata file), followed by the txt/product extractors
(here, a single filename-based extractor). -->
<mime type="txt/product">
  <!-- Filename-token extractor; its settings are read from the config file
       named on the nested config element. -->
  <extractor class="org.apache.oodt.cas.metadata.extractors.FilenameTokenMetExtractor">
    <config file="filename.extractor.config.xml"/>
  </extractor>
</mime>
<!-- This is an example of a type where only one extractor is run on the
product: pdf/product specifies only one extractor, and in the
mime-types.xml file pdf/product has no super type. -->
<mime type="pdf/product">
  <!-- Naming convention applied to this type, referenced by id. -->
  <namingConvention id="PDFNamingConv"/>
  <!-- The only extractor declared for this type. -->
  <extractor class="org.apache.oodt.cas.metadata.extractors.FilenameTokenMetExtractor">
    <config file="filename.extractor.config.xml"/>
  </extractor>
</mime>
<!-- This is an example of a type where two extractors get run. It is an
alternative way of handling txt/product: txt/product runs the same two
extractors as this type, but for a different reason. doc/product doesn't
have any super type; instead, it declares both extractors directly on
itself. -->
<mime type="doc/product">
  <!-- Both extractors are declared directly on this type, in this order. -->
  <extractor class="org.apache.oodt.cas.metadata.extractors.MetReaderExtractor"/>
  <extractor class="org.apache.oodt.cas.metadata.extractors.FilenameTokenMetExtractor">
    <config file="filename.extractor.config.xml"/>
  </extractor>
</mime>
</cas:mimetypemap>