All Downloads are FREE. Search and download functionalities are using the official Maven repository.

y23.apache-any23-core.0.7.0-incubating.source-code.default-configuration.properties Maven / Gradle / Ivy

There is a newer version: 2.7
Show newest version
#
#  Licensed to the Apache Software Foundation (ASF) under one or more
#  contributor license agreements.  See the NOTICE file distributed with
#  this work for additional information regarding copyright ownership.
#  The ASF licenses this file to You under the Apache License, Version 2.0
#  (the "License"); you may not use this file except in compliance with
#  the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
#  Unless required by applicable law or agreed to in writing, software
#  distributed under the License is distributed on an "AS IS" BASIS,
#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#  See the License for the specific language governing permissions and
#  limitations under the License.
#

# Any23 Core Version
any23.core.version=${project.version} (${implementation.build.tstamp})

# HTTP Client Configuration.
# ---- Default HTTP User Agent if not specified.
any23.http.user.agent.default=Any23-CLI
# ---- HTTP client timeout in milliseconds.
any23.http.client.timeout=10000
# ---- HTTP client max number of connections.
any23.http.client.max.connections=5

# RDFa Extractor
any23.rdfa.extractor.xslt=rdfa.xslt

# Enables (on) or disables (off) the addition
# of timestamp and size metadata triples.
any23.extraction.metadata.timesize=off

# Enables (on) or disables (off) the addition
# of nesting metadata triples.
any23.extraction.metadata.nesting=on

# Enables (on) or disables (off)
# the domain triple for every Microformat entity.
any23.extraction.metadata.domain.per.entity=off

# Selects which RDFa Extractor to enable.
# If 'on', the programmatic RDFa 1.1 Extractor
# (org.deri.any23.extractor.rdfa.RDFa11Extractor) is activated; otherwise
# the legacy RDFa 1.0 one (org.deri.any23.extractor.rdfa.RDFaExtractor) is registered.
any23.extraction.rdfa.programmatic=on

# The extraction context URI to be used by the
# SingleDocumentExtraction. If set to '?', the document URI will
# be used. It can be overridden by specifying a different
# value in ExtractionParameters.
any23.extraction.context.uri=?

# Any23 Core Plugin Dirs
any23.plugin.dirs=./plugins

# Microdata Configuration.
# ---- Enables(on)/disables(off) strict Microdata extraction.
#      If turned off, it uses the any23.microdata.ns.default
#      to build URIs for anonymous properties
any23.microdata.strict=off
# ---- Microdata default namespace.
any23.microdata.ns.default=http://rdf.data-vocabulary.org/

# Enables (on) or disables (off) the registration
# of HTMLMetaExtractor.java with
# ExtractionRegistry.java
any23.extraction.head.meta=off

# Specifies the CSV field separator and comment delimiter.
any23.extraction.csv.field=,
any23.extraction.csv.comment=#




© 2015 - 2025 Weber Informatics LLC | Privacy Policy