org.databene.benerator.primitive.TokenCombiner Maven / Gradle / Ivy
Go to download
benerator is a framework for creating realistic and valid high-volume test data, used for
testing (unit/integration/load) and showcase setup.
Metadata constraints are imported from systems and/or configuration files. Data can imported from
and exported to files and systems, anonymized or generated from scratch. Domain packages provide
reusable generators for creating domain-specific data as names and addresses internationalizable
in language and region. It is strongly customizable with plugins and configuration options.
/*
* (c) Copyright 2010 by Volker Bergmann. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, is permitted under the terms of the
* GNU General Public License (GPL).
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
* WITHOUT A WARRANTY OF ANY KIND. ALL EXPRESS OR IMPLIED CONDITIONS,
* REPRESENTATIONS AND WARRANTIES, INCLUDING ANY IMPLIED WARRANTY OF
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE OR NON-INFRINGEMENT, ARE
* HEREBY EXCLUDED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
* POSSIBILITY OF SUCH DAMAGE.
*/
package org.databene.benerator.primitive;
import java.io.IOException;
import java.util.HashSet;
import java.util.Set;
import org.databene.benerator.Generator;
import org.databene.benerator.GeneratorContext;
import org.databene.benerator.sample.SampleGenerator;
import org.databene.benerator.wrapper.CompositeStringGenerator;
import org.databene.benerator.wrapper.GeneratorProxy;
import org.databene.benerator.wrapper.ValidatingGeneratorProxy;
import org.databene.commons.ConfigurationError;
import org.databene.commons.Encodings;
import org.databene.commons.StringUtil;
import org.databene.commons.SystemInfo;
import org.databene.commons.validator.BlacklistValidator;
import org.databene.document.csv.CSVLineIterator;
/**
* {@link Generator} implementation which takes cells from a CSV file as input
* and combines the cells by taking a cell value from a random row for each column
* and concatenating them to a string.
* Created: 01.08.2010 14:48:50
* @since 0.6.3
* @author Volker Bergmann
*/
public class TokenCombiner extends GeneratorProxy {
protected String uri;
private boolean unique;
protected char separator = ',';
protected String encoding = Encodings.UTF_8;
protected boolean excludeSeed = false;
protected Set seed = new HashSet();
public TokenCombiner(String uri) {
this(uri, false);
}
public TokenCombiner(String uri, boolean unique) {
this(uri, unique, ',', SystemInfo.getFileEncoding(), false);
}
public TokenCombiner(String uri, boolean unique, char separator, String encoding, boolean excludeSeed) {
this.uri = uri;
this.unique = unique;
this.separator = separator;
this.encoding = encoding;
this.excludeSeed = excludeSeed;
}
public void setUri(String uri) {
this.uri = uri;
}
public void setUnique(boolean unique) {
this.unique = unique;
}
public void setSeparator(char separator) {
this.separator = separator;
}
public void setEncoding(String encoding) {
this.encoding = encoding;
}
public void setExcludeSeed(boolean excludeSeed) {
this.excludeSeed = excludeSeed;
}
@Override
public synchronized void init(GeneratorContext context) {
Generator source = new SimpleTokenCombinator(unique);
if (excludeSeed) {
BlacklistValidator validator = new BlacklistValidator(seed);
source = new ValidatingGeneratorProxy(source, validator);
}
super.setSource(source);
super.init(context);
}
protected class SimpleTokenCombinator extends CompositeStringGenerator {
SimpleTokenCombinator(boolean unique) {
super(unique);
}
@SuppressWarnings("unchecked")
@Override
protected Generator>[] initSources(GeneratorContext context, boolean unique) {
try {
SampleGenerator[] sources = null;
String absoluteUri = context.resolveRelativeUri(uri);
CSVLineIterator iterator = new CSVLineIterator(absoluteUri, separator, true, encoding);
if (!iterator.hasNext())
throw new ConfigurationError("Source file of " + getClass().getSimpleName() + " is empty: " + absoluteUri);
int tokenCount = -1;
while (iterator.hasNext()) {
String[] tokens = iterator.next();
if (sources == null) {
tokenCount = tokens.length;
sources = new SampleGenerator[tokenCount];
for (int i = 0; i < tokenCount; i++) {
sources[i] = new SampleGenerator(String.class);
sources[i].setUnique(unique);
}
}
for (int i = 0; i < tokens.length; i++)
if (!unique || !sources[i].contains(tokens[i]))
sources[i].addValue(tokens[i]);
if (excludeSeed)
seed.add(StringUtil.concat(null, tokens));
}
return sources;
} catch (IOException e) {
throw new ConfigurationError("Error initializing " + getClass().getSimpleName() + " from URI " + uri, e);
}
}
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy