<?xml version="1.0" encoding="UTF-8"?>
<pgeConfig>
<!--
  How to run the PGE.

  The cmd entries are run with /bin/bash, using [JobDir] as the execution
  directory. Bracketed [Key] tokens are metadata placeholders: JobDir,
  JobInputDir, JobOutputDir, JobLogDir and DateMilis are defined under
  customMetadata in this file; MimePartitionerPyScript, SolrUrl,
  NumFilesPerJob, PCS_WorkflowManagerUrl and RatTaskId are not defined here
  and are presumably supplied by the workflow task configuration (TODO confirm).

  Notes on individual commands:
    * The PATH export puts $HOME/bin ahead of the existing search path, and
      shopt turns on alias expansion for the commands that follow.
    * The working directories are created with a single "mkdir -p" so the
      step does not fail when a directory already exists; the paths are
      quoted so a base directory containing spaces is handled correctly.
    * Only the partitioner's standard output is redirected to the log file
      under [JobLogDir]; standard error is not redirected by this command.
-->
<exe dir="[JobDir]" shell="/bin/bash">
  <cmd>export PATH=$HOME/bin/:${PATH}</cmd>
  <cmd>shopt -s expand_aliases</cmd>
  <cmd>echo "Creating working dirs"</cmd>
  <cmd>mkdir -p "[JobInputDir]" "[JobOutputDir]" "[JobLogDir]"</cmd>
  <cmd>echo "Running MIME partitioner"</cmd>
  <cmd>[MimePartitionerPyScript] -u [SolrUrl] -c [NumFilesPerJob] -w [PCS_WorkflowManagerUrl] -t [RatTaskId] > "[JobLogDir]/mime-partitioner-[DateMilis].log"</cmd>
</exe>
<!-- Files to ingest: no output products are declared for this PGE. -->
<output/>
<!--
  Custom metadata to add to output files.

  A value may reference another key as [Key]; every key below is declared
  before the first value that references it, so keep that order when editing.
-->
<customMetadata>
  <!--
    Helper keys: shell operator characters and operators exposed as metadata
    so they can be referenced as [Key] placeholders elsewhere.
  -->
  <metadata key="LessThan" val="&lt;"/>
  <metadata key="LessThanOrEqualTo" val="[LessThan]="/>
  <metadata key="GreaterThan" val="&gt;"/>
  <metadata key="GreaterThanOrEqualTo" val="[GreaterThan]="/>
  <metadata key="Exclamation" val="!"/>
  <metadata key="Ampersand" val="&amp;"/>
  <!-- Built from the exclamation mark so that it expands to "!=". -->
  <metadata key="NotEqualTo" val="[Exclamation]="/>
  <metadata key="LogicalAnd" val="[Ampersand][Ampersand]"/>
  <!-- Expands to ">&!" (greater-than, ampersand, exclamation mark). -->
  <metadata key="CshPipeToStdOutAndError" val="[GreaterThan][Ampersand][Exclamation]"/>

  <!--
    Job timestamp and per-job directory layout.
    NOTE(review): [DATE.UTC] and DATE_TO_MILLIS(...) are resolved by the
    metadata engine, not by this file; presumably they yield the current UTC
    time and its millisecond offset from 1970-01-01 (confirm).
    The key name "DateMilis" (single "l") is kept as is because JobDir and the
    partitioner log file name reference it by that spelling.
  -->
  <metadata key="ProductionDateTime" val="[DATE.UTC]"/>
  <metadata key="DateMilis" val="[DATE_TO_MILLIS([ProductionDateTime],UTC_FORMAT,1970-01-01)]"/>
  <metadata key="JobDir" val="[DRAT_HOME]/data/jobs/mimepartitioner/[DateMilis]"/>
  <metadata key="JobInputDir" val="[JobDir]/input"/>
  <metadata key="JobOutputDir" val="[JobDir]/output"/>
  <metadata key="JobLogDir" val="[JobDir]/logs"/>
</customMetadata>
</pgeConfig>