![JAR search and dependency download from the Maven repository](/logo.png)
org.apache.tika.parser.microsoft.OfficeParserConfig Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.tika.parser.microsoft;
import java.io.Serializable;
/**
 * Mutable, serializable holder for four boolean parser options.
 *
 * <p>Every option defaults to {@code false}. The class performs no validation
 * and no synchronization; each accessor simply reads or writes one field.
 */
// NOTE(review): no explicit serialVersionUID is declared. Adding one later
// changes the stream version unless it matches the compiler-computed default,
// so confirm compatibility requirements before introducing it.
public class OfficeParserConfig implements Serializable {

    private boolean includeDeletedContent = false;
    private boolean includeMoveFromContent = false;
    private boolean useSAXDocxExtractor = false;
    private boolean useSAXPptxExtractor = false;

    /**
     * Sets whether or not the parser should include deleted content.
     *
     * <p>This has only been implemented in the streaming docx parser
     * ({@link org.apache.tika.parser.microsoft.ooxml.SXWPFWordExtractorDecorator})
     * so far.
     *
     * <p>Default: {@code false}
     *
     * @param includeDeletedContent {@code true} to include deleted content,
     *                              {@code false} to leave it out
     */
    public void setIncludeDeletedContent(boolean includeDeletedContent) {
        this.includeDeletedContent = includeDeletedContent;
    }

    /**
     * Returns the current "include deleted content" setting.
     *
     * @return the value last passed to
     *         {@link #setIncludeDeletedContent(boolean)}, or {@code false}
     *         if it was never set
     */
    public boolean getIncludeDeletedContent() {
        return includeDeletedContent;
    }

    /**
     * With track changes on, when a section is moved, the content
     * is stored in both the "moveFrom" section and in the "moveTo" section.
     *
     * <p>If you'd like to include the section both in its original location
     * (moveFrom) and in its new location (moveTo), set this to {@code true}.
     *
     * <p>Default: {@code false}
     *
     * <p>This has only been implemented in the streaming docx parser
     * ({@link org.apache.tika.parser.microsoft.ooxml.SXWPFWordExtractorDecorator})
     * so far.
     *
     * @param includeMoveFromContent {@code true} to also include the content
     *                               at its original (moveFrom) location
     */
    public void setIncludeMoveFromContent(boolean includeMoveFromContent) {
        this.includeMoveFromContent = includeMoveFromContent;
    }

    /**
     * Returns the current "include moveFrom content" setting.
     *
     * @return the value last passed to
     *         {@link #setIncludeMoveFromContent(boolean)}, or {@code false}
     *         if it was never set
     */
    public boolean getIncludeMoveFromContent() {
        return includeMoveFromContent;
    }

    /**
     * Use the experimental SAX-based streaming DOCX parser?
     * If set to {@code false}, the classic parser will be used; if
     * {@code true}, the new experimental parser will be used.
     *
     * <p>Default: {@code false} (classic DOM parser)
     *
     * @param useSAXDocxExtractor {@code true} to select the experimental
     *                            SAX-based DOCX parser
     */
    public void setUseSAXDocxExtractor(boolean useSAXDocxExtractor) {
        this.useSAXDocxExtractor = useSAXDocxExtractor;
    }

    /**
     * Returns whether the experimental SAX-based DOCX parser is selected.
     *
     * @return the value last passed to
     *         {@link #setUseSAXDocxExtractor(boolean)}, or {@code false}
     *         if it was never set
     */
    public boolean getUseSAXDocxExtractor() {
        return useSAXDocxExtractor;
    }

    // NOTE(review): the previous Javadoc here was a verbatim copy of the DOCX
    // setter's text (it said "DOCX" and "classic DOM parser"). It has been
    // reworded for PPTX based on the property name; confirm against the parser
    // that reads this flag.
    /**
     * Use the experimental SAX-based streaming PPTX parser?
     * If set to {@code false}, the classic parser will be used; if
     * {@code true}, the new experimental parser will be used.
     *
     * <p>Default: {@code false} (classic parser)
     *
     * @param useSAXPptxExtractor {@code true} to select the experimental
     *                            SAX-based PPTX parser
     */
    public void setUseSAXPptxExtractor(boolean useSAXPptxExtractor) {
        this.useSAXPptxExtractor = useSAXPptxExtractor;
    }

    /**
     * Returns whether the experimental SAX-based PPTX parser is selected.
     *
     * @return the value last passed to
     *         {@link #setUseSAXPptxExtractor(boolean)}, or {@code false}
     *         if it was never set
     */
    public boolean getUseSAXPptxExtractor() {
        return useSAXPptxExtractor;
    }
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy