org.apache.poi.hwpf.usermodel.HeaderStories Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of poi-scratchpad Show documentation
Show all versions of poi-scratchpad Show documentation
Apache POI - Java API To Access Microsoft Format Files (Scratchpad)
/* ====================================================================
Licensed to the Apache Software Foundation (ASF) under one or more
contributor license agreements. See the NOTICE file distributed with
this work for additional information regarding copyright ownership.
The ASF licenses this file to You under the Apache License, Version 2.0
(the "License"); you may not use this file except in compliance with
the License. You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
==================================================================== */
package org.apache.poi.hwpf.usermodel;
import org.apache.poi.hwpf.HWPFDocument;
import org.apache.poi.hwpf.model.FileInformationBlock;
import org.apache.poi.hwpf.model.GenericPropertyNode;
import org.apache.poi.hwpf.model.PlexOfCps;
import org.apache.poi.hwpf.model.SubdocumentType;
/**
 * Gives access to the individual "header stories" of a Word document:
 * the headers, the footers, and the footnote/endnote separators.
 * <p>
 * All the header stories get stored in the same {@link Range} in the
 * document, and this class handles getting out all the individual
 * parts, using the PlcfHdd table to find where each one starts and ends.
 * <p>
 * When the document has no header text, or no PlcfHdd, the String
 * getters and the subrange getters all return <code>null</code>.
 * <p>
 * WARNING - you shouldn't change the headers or footers,
 * as offsets are not yet updated!
 */
public final class HeaderStories {
    // Indexes of the individual stories within the PlcfHdd.
    // The six note separator stories come first...
    private static final int FOOTNOTE_SEPARATOR = 0;
    private static final int FOOTNOTE_CONT_SEPARATOR = 1;
    private static final int FOOTNOTE_CONT_NOTE = 2;
    private static final int ENDNOTE_SEPARATOR = 3;
    private static final int ENDNOTE_CONT_SEPARATOR = 4;
    private static final int ENDNOTE_CONT_NOTE = 5;

    // ...followed by the header and footer stories read by this class
    private static final int HEADERS_BASE = 6;
    private static final int EVEN_HEADER = HEADERS_BASE + 0;
    private static final int ODD_HEADER = HEADERS_BASE + 1;
    private static final int EVEN_FOOTER = HEADERS_BASE + 2;
    private static final int ODD_FOOTER = HEADERS_BASE + 3;
    private static final int FIRST_HEADER = HEADERS_BASE + 4;
    private static final int FIRST_FOOTER = HEADERS_BASE + 5;

    /** The range holding the text of all the header stories */
    private final Range headerStories;

    /** Start/end positions of each story; null if there are no stories */
    private final PlexOfCps plcfHdd;

    /** Whether the String getters strip fields from the returned text */
    private boolean stripFields = false;

    /**
     * Locates the header stories of the given document.
     *
     * @param doc the document to read the header stories from
     */
    public HeaderStories(HWPFDocument doc) {
        this.headerStories = doc.getHeaderStoryRange();
        FileInformationBlock fib = doc.getFileInformationBlock();

        // If there's no header text, or no PlcfHdd, there's nothing to do
        boolean hasStories =
                fib.getSubdocumentTextStreamLength( SubdocumentType.HEADER ) != 0
                && fib.getPlcfHddSize() != 0;

        // Handle the PlcfHdd

        /*
         * Page 88:
         *
         * "The plcfhdd, a table whose location and length within the file is
         * stored in fib.fcPlcfhdd and fib.cbPlcfhdd, describes where the text
         * of each header/footer begins. If there are n headers/footers stored
         * in the Word file, the plcfhdd consists of n+2 CP entries. The
         * beginning CP of the ith header/footer is the ith CP in the plcfhdd.
         * The limit CP (the CP of character 1 position past the end of a
         * header/footer) of the ith header/footer is the i+1st CP in the
         * plcfhdd. Note: at the limit CP - 1, Word always places a chEop as a
         * placeholder which is never displayed as part of the header/footer.
         * This allows Word to change an existing header/footer to be empty.
         *
         * If there are n header/footers, the n+2nd CP entry value is always 1
         * greater than the n+1st CP entry value. A paragraph end (ASCII 13) is
         * always stored at the file position marked by the n+1st CP value.
         *
         * The transformation in a full saved file from a header/footer CP to an
         * offset from the beginning of a file (fc) is
         * fc=fib.fcMin+ccpText+ccpFtn+cp."
         */
        this.plcfHdd = hasStories
                ? new PlexOfCps( doc.getTableStream(), fib.getPlcfHddOffset(),
                        fib.getPlcfHddSize(), 0 )
                : null;
    }

    /**
     * Returns the text of the footnote separator story.
     *
     * @return the text, "" if the story is empty, or null if the
     *         document has no header stories
     * @see #getFootnoteSeparatorSubrange()
     * @deprecated 3.8 beta 4
     */
    @Deprecated
    public String getFootnoteSeparator()
    {
        return getAt( FOOTNOTE_SEPARATOR );
    }

    /**
     * Returns the text of the footnote continuation separator story.
     *
     * @return the text, "" if the story is empty, or null if the
     *         document has no header stories
     * @see #getFootnoteContSeparatorSubrange()
     * @deprecated 3.8 beta 4
     */
    @Deprecated
    public String getFootnoteContSeparator()
    {
        return getAt( FOOTNOTE_CONT_SEPARATOR );
    }

    /**
     * Returns the text of the footnote continuation note story.
     *
     * @return the text, "" if the story is empty, or null if the
     *         document has no header stories
     * @see #getFootnoteContNoteSubrange()
     * @deprecated 3.8 beta 4
     */
    @Deprecated
    public String getFootnoteContNote()
    {
        return getAt( FOOTNOTE_CONT_NOTE );
    }

    /**
     * Returns the text of the endnote separator story.
     *
     * @return the text, "" if the story is empty, or null if the
     *         document has no header stories
     * @see #getEndnoteSeparatorSubrange()
     * @deprecated 3.8 beta 4
     */
    @Deprecated
    public String getEndnoteSeparator()
    {
        return getAt( ENDNOTE_SEPARATOR );
    }

    /**
     * Returns the text of the endnote continuation separator story.
     *
     * @return the text, "" if the story is empty, or null if the
     *         document has no header stories
     * @see #getEndnoteContSeparatorSubrange()
     * @deprecated 3.8 beta 4
     */
    @Deprecated
    public String getEndnoteContSeparator()
    {
        return getAt( ENDNOTE_CONT_SEPARATOR );
    }

    /**
     * Returns the text of the endnote continuation note story.
     *
     * @return the text, "" if the story is empty, or null if the
     *         document has no header stories
     * @see #getEndnoteContNoteSubrange()
     * @deprecated 3.8 beta 4
     */
    @Deprecated
    public String getEndnoteContNote()
    {
        return getAt( ENDNOTE_CONT_NOTE );
    }

    /**
     * @return the range of the footnote separator story, or null if the
     *         story is empty or the document has no header stories
     */
    public Range getFootnoteSeparatorSubrange()
    {
        return getSubrangeAt( FOOTNOTE_SEPARATOR );
    }

    /**
     * @return the range of the footnote continuation separator story, or
     *         null if the story is empty or the document has no header
     *         stories
     */
    public Range getFootnoteContSeparatorSubrange()
    {
        return getSubrangeAt( FOOTNOTE_CONT_SEPARATOR );
    }

    /**
     * @return the range of the footnote continuation note story, or null
     *         if the story is empty or the document has no header stories
     */
    public Range getFootnoteContNoteSubrange()
    {
        return getSubrangeAt( FOOTNOTE_CONT_NOTE );
    }

    /**
     * @return the range of the endnote separator story, or null if the
     *         story is empty or the document has no header stories
     */
    public Range getEndnoteSeparatorSubrange()
    {
        return getSubrangeAt( ENDNOTE_SEPARATOR );
    }

    /**
     * @return the range of the endnote continuation separator story, or
     *         null if the story is empty or the document has no header
     *         stories
     */
    public Range getEndnoteContSeparatorSubrange()
    {
        return getSubrangeAt( ENDNOTE_CONT_SEPARATOR );
    }

    /**
     * @return the range of the endnote continuation note story, or null
     *         if the story is empty or the document has no header stories
     */
    public Range getEndnoteContNoteSubrange()
    {
        return getSubrangeAt( ENDNOTE_CONT_NOTE );
    }

    /**
     * Returns the text of the even page header.
     *
     * @return the text, "" if the story is empty, or null if the
     *         document has no header stories
     * @see #getEvenHeaderSubrange()
     * @deprecated 3.8 beta 4
     */
    @Deprecated
    public String getEvenHeader() {
        return getAt( EVEN_HEADER );
    }

    /**
     * Returns the text of the odd page header.
     *
     * @return the text, "" if the story is empty, or null if the
     *         document has no header stories
     * @see #getOddHeaderSubrange()
     * @deprecated 3.8 beta 4
     */
    @Deprecated
    public String getOddHeader() {
        return getAt( ODD_HEADER );
    }

    /**
     * Returns the text of the first page header.
     *
     * @return the text, "" if the story is empty, or null if the
     *         document has no header stories
     * @see #getFirstHeaderSubrange()
     * @deprecated 3.8 beta 4
     */
    @Deprecated
    public String getFirstHeader() {
        return getAt( FIRST_HEADER );
    }

    /**
     * @return the range of the even page header, or null if the story
     *         is empty or the document has no header stories
     */
    public Range getEvenHeaderSubrange() {
        return getSubrangeAt( EVEN_HEADER );
    }

    /**
     * @return the range of the odd page header, or null if the story
     *         is empty or the document has no header stories
     */
    public Range getOddHeaderSubrange() {
        return getSubrangeAt( ODD_HEADER );
    }

    /**
     * @return the range of the first page header, or null if the story
     *         is empty or the document has no header stories
     */
    public Range getFirstHeaderSubrange() {
        return getSubrangeAt( FIRST_HEADER );
    }

    /**
     * Returns the correct, defined header for the given
     *  one based page
     * @param pageNumber The one based page number
     * @return the first page header (page 1) or the even page header
     *         (even pages) when that one is set, otherwise the odd page
     *         header; null if the document has no header stories
     */
    public String getHeader(int pageNumber) {
        // First page header is optional, only return
        //  if it's set
        if(pageNumber == 1) {
            String firstHeader = getFirstHeader();
            if(isSet(firstHeader)) {
                return firstHeader;
            }
        }
        // Even page header is optional, only return
        //  if it's set
        if(pageNumber % 2 == 0) {
            String evenHeader = getEvenHeader();
            if(isSet(evenHeader)) {
                return evenHeader;
            }
        }
        // Odd is the default
        return getOddHeader();
    }

    /**
     * Returns the text of the even page footer.
     *
     * @return the text, "" if the story is empty, or null if the
     *         document has no header stories
     * @see #getEvenFooterSubrange()
     * @deprecated 3.8 beta 4
     */
    @Deprecated
    public String getEvenFooter()
    {
        return getAt( EVEN_FOOTER );
    }

    /**
     * Returns the text of the odd page footer.
     *
     * @return the text, "" if the story is empty, or null if the
     *         document has no header stories
     * @see #getOddFooterSubrange()
     * @deprecated 3.8 beta 4
     */
    @Deprecated
    public String getOddFooter()
    {
        return getAt( ODD_FOOTER );
    }

    /**
     * Returns the text of the first page footer.
     *
     * @return the text, "" if the story is empty, or null if the
     *         document has no header stories
     * @see #getFirstFooterSubrange()
     * @deprecated 3.8 beta 4
     */
    @Deprecated
    public String getFirstFooter()
    {
        return getAt( FIRST_FOOTER );
    }

    /**
     * @return the range of the even page footer, or null if the story
     *         is empty or the document has no header stories
     */
    public Range getEvenFooterSubrange()
    {
        return getSubrangeAt( EVEN_FOOTER );
    }

    /**
     * @return the range of the odd page footer, or null if the story
     *         is empty or the document has no header stories
     */
    public Range getOddFooterSubrange()
    {
        return getSubrangeAt( ODD_FOOTER );
    }

    /**
     * @return the range of the first page footer, or null if the story
     *         is empty or the document has no header stories
     */
    public Range getFirstFooterSubrange()
    {
        return getSubrangeAt( FIRST_FOOTER );
    }

    /**
     * Returns the correct, defined footer for the given
     *  one based page
     * @param pageNumber The one based page number
     * @return the first page footer (page 1) or the even page footer
     *         (even pages) when that one is set, otherwise the odd page
     *         footer; null if the document has no header stories
     */
    public String getFooter(int pageNumber) {
        // First page footer is optional, only return
        //  if it's set
        if(pageNumber == 1) {
            String firstFooter = getFirstFooter();
            if(isSet(firstFooter)) {
                return firstFooter;
            }
        }
        // Even page footer is optional, only return
        //  if it's set
        if(pageNumber % 2 == 0) {
            String evenFooter = getEvenFooter();
            if(isSet(evenFooter)) {
                return evenFooter;
            }
        }
        // Odd is the default
        return getOddFooter();
    }

    /**
     * Tells whether an optional story has any text. A null text (no
     *  header stories in the document at all) counts as not set, so
     *  that callers fall through to their default instead of failing.
     */
    private static boolean isSet(String storyText) {
        return storyText != null && storyText.length() > 0;
    }

    /**
     * Get the string that's pointed to by the
     *  given plcfHdd index
     * @param plcfHddIndex index of the story within the PlcfHdd
     * @return the story text; "" if the story is empty or its
     *         start/end are reversed; null if there is no PlcfHdd
     * @deprecated 3.8 beta 4
     */
    @Deprecated
    private String getAt(int plcfHddIndex) {
        if(plcfHdd == null) return null;

        GenericPropertyNode prop = plcfHdd.getProperty(plcfHddIndex);
        if(prop.getStart() == prop.getEnd()) {
            // Empty story
            return "";
        }
        if(prop.getEnd() < prop.getStart()) {
            // Broken properties?
            return "";
        }

        // Ensure we're getting a sensible length: clamp both ends
        //  to the text that's actually available
        String rawText = headerStories.text();
        int start = Math.min(prop.getStart(), rawText.length());
        int end = Math.min(prop.getEnd(), rawText.length());

        // Grab the contents
        String text = rawText.substring(start, end);

        // Strip off fields and macros if requested.
        // Note that the stripped text is returned as-is, without the
        //  "\r\r" handling below
        if(stripFields) {
            return Range.stripFields(text);
        }

        // If you create a header/footer, then remove it again, word
        //  will leave \r\r. Turn these back into an empty string,
        //  which is more what you'd expect
        if(text.equals("\r\r")) {
            return "";
        }

        return text;
    }

    /**
     * Get the range that's pointed to by the
     *  given plcfHdd index
     * @param plcfHddIndex index of the story within the PlcfHdd
     * @return the story's range within the header stories range; null
     *         if the story is empty, its start/end are reversed, or
     *         there is no PlcfHdd
     */
    private Range getSubrangeAt( int plcfHddIndex )
    {
        if ( plcfHdd == null )
            return null;

        GenericPropertyNode prop = plcfHdd.getProperty( plcfHddIndex );
        if ( prop.getStart() == prop.getEnd() )
        {
            // Empty story
            return null;
        }
        if ( prop.getEnd() < prop.getStart() )
        {
            // Broken properties?
            return null;
        }

        // The story positions are relative to the start of the header
        //  stories range, so clamp them to its length and then shift
        //  them by its start offset
        final int headersLength = headerStories.getEndOffset()
                - headerStories.getStartOffset();
        int start = Math.min( prop.getStart(), headersLength );
        int end = Math.min( prop.getEnd(), headersLength );

        return new Range( headerStories.getStartOffset() + start,
                headerStories.getStartOffset() + end, headerStories );
    }

    /**
     * @return the range holding all of the header stories
     */
    public Range getRange() {
        return headerStories;
    }

    /**
     * @return the PlcfHdd, or null if the document has no header stories
     */
    protected PlexOfCps getPlcfHdd() {
        return plcfHdd;
    }

    /**
     * Are fields currently being stripped from
     *  the text that this {@link HeaderStories} returns?
     *  Default is false, but can be changed
     */
    public boolean areFieldsStripped() {
        return stripFields;
    }

    /**
     * Should fields (eg macros) be stripped from
     *  the text that this class returns?
     * Default is not to strip.
     * @param stripFields true to strip fields from the returned text,
     *        false to return the text unchanged
     */
    public void setAreFieldsStripped(boolean stripFields) {
        this.stripFields = stripFields;
    }
}
© 2015 - 2024 Weber Informatics LLC | Privacy Policy