# api/src/main/resources/default-configuration.properties - any23 - Git at Google

 #
 #  Licensed to the Apache Software Foundation (ASF) under one or more
 #  contributor license agreements.  See the NOTICE file distributed with
 #  this work for additional information regarding copyright ownership.
 #  The ASF licenses this file to You under the Apache License, Version 2.0
 #  (the "License"); you may not use this file except in compliance with
 #  the License.  You may obtain a copy of the License at
 #
 #   http://www.apache.org/licenses/LICENSE-2.0
 #
 #  Unless required by applicable law or agreed to in writing, software
 #  distributed under the License is distributed on an "AS IS" BASIS,
 #  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 #  See the License for the specific language governing permissions and
 #  limitations under the License.
 #

 # Any23 Core Version
 any23.core.version=${project.version}

 # HTTP Client Configuration.
 # ---- Default HTTP User Agent if not specified.
 any23.http.user.agent.default=Any23-CLI
 # ---- HTTP client timeout in milliseconds.
 any23.http.client.timeout=10000
 # ---- HTTP client max number of connections.
 any23.http.client.max.connections=5

 # RDFa Extractor
 any23.rdfa.extractor.xslt=rdfa.xslt

 # Allows to enable(on)/disable(off) addition
 # of timestamp and size metadata triples.
 any23.extraction.metadata.timesize=off

 # Allows to enable(on)/disable(off) addition
 # of nesting metadata triples.
 any23.extraction.metadata.nesting=on

 # Allows to enable(on)/disable(off)
 # the domain triple for every Microformat entity.
 any23.extraction.metadata.domain.per.entity=off

 # Selects which RDFa Extractor to enable.
 # If 'on', the programmatic RDFa 1.1 Extractor
 # (org.apache.any23.extractor.rdfa.RDFa11Extractor) is activated; otherwise
 # the legacy RDFa 1.0 one (org.apache.any23.extractor.rdfa.RDFaExtractor) is registered.
 any23.extraction.rdfa.programmatic=on

 # The extraction context IRI to be used by the
 # SingleDocumentExtraction. If == '?' the document IRI will
 # be used. It can be overridden by specifying a different
 # value in ExtractionParameters.
 any23.extraction.context.iri=?

 # Any23 Core Plugin Dirs
 any23.plugin.dirs=./plugins

 # Microdata Configuration.
 # ---- Enables(on)/disables(off) strict Microdata extraction.
 #      If turned off, it uses the any23.microdata.ns.default
 #      to build IRIs for anonymous properties
 any23.microdata.strict=off
 # ---- Microdata default namespace.
 any23.microdata.ns.default=http://schema.org/

 # Allows to enable(on)/disable(off) the registration
 # of HTMLMetaExtractor.java to
 # ExtractionRegistry.java
 any23.extraction.head.meta=on

 # Allows specifying the CSV field separator and the comment delimiter
 any23.extraction.csv.field=,
 any23.extraction.csv.comment=#
	#
	# Licensed to the Apache Software Foundation (ASF) under one or more
	# contributor license agreements. See the NOTICE file distributed with
	# this work for additional information regarding copyright ownership.
	# The ASF licenses this file to You under the Apache License, Version 2.0
	# (the "License"); you may not use this file except in compliance with
	# the License. You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.
	#

	# Any23 Core Version
	any23.core.version=${project.version}

	# HTTP Client Configuration.
	# ---- Default HTTP User Agent if not specified.
	any23.http.user.agent.default=Any23-CLI
	# ---- HTTP client timeout in milliseconds.
	any23.http.client.timeout=10000
	# ---- HTTP client max number of connections.
	any23.http.client.max.connections=5

	# RDFa Extractor
	any23.rdfa.extractor.xslt=rdfa.xslt

	# Allows to enable(on)/disable(off) addition
	# of timestamp and size metadata triples.
	any23.extraction.metadata.timesize=off

	# Allows to enable(on)/disable(off) addition
	# of nesting metadata triples.
	any23.extraction.metadata.nesting=on

	# Allows to enable(on)/disable(off)
	# the domain triple for every Microformat entity.
	any23.extraction.metadata.domain.per.entity=off

	# Selects which RDFa Extractor to enable.
	# If 'on', the programmatic RDFa 1.1 Extractor
	# (org.apache.any23.extractor.rdfa.RDFa11Extractor) is activated; otherwise
	# the legacy RDFa 1.0 one (org.apache.any23.extractor.rdfa.RDFaExtractor) is registered.
	any23.extraction.rdfa.programmatic=on

	# The extraction context IRI to be used by the
	# SingleDocumentExtraction. If == '?' the document IRI will
	# be used. It can be overridden by specifying a different
	# value in ExtractionParameters.
	any23.extraction.context.iri=?

	# Any23 Core Plugin Dirs
	any23.plugin.dirs=./plugins

	# Microdata Configuration.
	# ---- Enables(on)/disables(off) strict Microdata extraction.
	# If turned off, it uses the any23.microdata.ns.default
	# to build IRIs for anonymous properties
	any23.microdata.strict=off
	# ---- Microdata default namespace.
	any23.microdata.ns.default=http://schema.org/

	# Allows to enable(on)/disable(off) the registration
	# of HTMLMetaExtractor.java to
	# ExtractionRegistry.java
	any23.extraction.head.meta=on

	# Allows specifying the CSV field separator and the comment delimiter
	any23.extraction.csv.field=,
	any23.extraction.csv.comment=#