All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.culturegraph.mf.mediawiki.helpers.TextExtractor Maven / Gradle / Ivy

/*
 *  Copyright 2013 Deutsche Nationalbibliothek
 *
 *  Licensed under the Apache License, Version 2.0 the "License";
 *  you may not use this file except in compliance with the License.
 *  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 *  Unless required by applicable law or agreed to in writing, software
 *  distributed under the License is distributed on an "AS IS" BASIS,
 *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 *  See the License for the specific language governing permissions and
 *  limitations under the License.
 */
package org.culturegraph.mf.mediawiki.helpers;


import de.fau.cs.osr.ptk.common.ast.AstNode;
import de.fau.cs.osr.ptk.common.ast.Text;

/**
 * Concatenates the contents of all text nodes visited
 * by the extractor.
 *
 * @author Christoph Böhme
 *
 */
public final class TextExtractor extends TraverseTree {

	private final StringBuilder builder = new StringBuilder();

	@Override
	protected boolean before(final AstNode node) {
		builder.delete(0, builder.length());

		return super.before(node);
	}

	@Override
	protected Object after(final AstNode node, final Object result) {
		return builder.toString();
	}

	public void visit(final Text node) {
		builder.append(node.getContent());
	}
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy