All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.databene.benerator.primitive.TokenCombiner Maven / Gradle / Ivy

Go to download

benerator is a framework for creating realistic and valid high-volume test data, used for testing (unit/integration/load) and showcase setup. Metadata constraints are imported from systems and/or configuration files. Data can be imported from and exported to files and systems, anonymized, or generated from scratch. Domain packages provide reusable generators for creating domain-specific data, such as names and addresses, that can be internationalized by language and region. It is strongly customizable with plugins and configuration options.

The newest version!
/*
 * (c) Copyright 2010-2013 by Volker Bergmann. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, is permitted under the terms of the
 * GNU General Public License (GPL).
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * WITHOUT A WARRANTY OF ANY KIND. ALL EXPRESS OR IMPLIED CONDITIONS,
 * REPRESENTATIONS AND WARRANTIES, INCLUDING ANY IMPLIED WARRANTY OF
 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE OR NON-INFRINGEMENT, ARE
 * HEREBY EXCLUDED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 */

package org.databene.benerator.primitive;

import java.io.IOException;
import java.util.HashSet;
import java.util.Set;

import org.databene.benerator.Generator;
import org.databene.benerator.GeneratorContext;
import org.databene.benerator.NonNullGenerator;
import org.databene.benerator.sample.NonNullSampleGenerator;
import org.databene.benerator.util.GeneratorUtil;
import org.databene.benerator.wrapper.CompositeStringGenerator;
import org.databene.benerator.wrapper.GeneratorProxy;
import org.databene.benerator.wrapper.WrapperFactory;
import org.databene.commons.ConfigurationError;
import org.databene.commons.Encodings;
import org.databene.commons.StringUtil;
import org.databene.commons.SystemInfo;
import org.databene.commons.validator.BlacklistValidator;
import org.databene.formats.DataContainer;
import org.databene.formats.csv.CSVLineIterator;

/**
 * {@link Generator} implementation which takes cells from a CSV file as input 
 * and combines the cells by taking a cell value from a random row for each column
 * and concatenating them to a string.

* Created: 01.08.2010 14:48:50 * @since 0.6.3 * @author Volker Bergmann */ public class TokenCombiner extends GeneratorProxy implements NonNullGenerator { protected String uri; private boolean unique; protected char separator = ','; protected String encoding = Encodings.UTF_8; protected boolean excludeSeed = false; protected Set seed = new HashSet(); public TokenCombiner(String uri) { this(uri, false); } public TokenCombiner(String uri, boolean unique) { this(uri, unique, ',', SystemInfo.getFileEncoding(), false); } public TokenCombiner(String uri, boolean unique, char separator, String encoding, boolean excludeSeed) { super(String.class); this.uri = uri; this.unique = unique; this.separator = separator; this.encoding = encoding; this.excludeSeed = excludeSeed; } public void setUri(String uri) { this.uri = uri; } public void setUnique(boolean unique) { this.unique = unique; } public void setSeparator(char separator) { this.separator = separator; } public void setEncoding(String encoding) { this.encoding = encoding; } public void setExcludeSeed(boolean excludeSeed) { this.excludeSeed = excludeSeed; } @SuppressWarnings("resource") @Override public synchronized void init(GeneratorContext context) { Generator source = new SimpleTokenCombinator(unique); if (excludeSeed) { BlacklistValidator validator = new BlacklistValidator(seed); source = WrapperFactory.applyValidator(validator, source); } super.setSource(source); super.init(context); } @Override public String generate() { return GeneratorUtil.generateNonNull(this); } protected class SimpleTokenCombinator extends CompositeStringGenerator { @SuppressWarnings("unchecked") SimpleTokenCombinator(boolean unique) { super(unique); } @Override @SuppressWarnings("unchecked") public void init(GeneratorContext context) { try { NonNullSampleGenerator[] sources = null; String absoluteUri = context.resolveRelativeUri(uri); CSVLineIterator iterator = new CSVLineIterator(absoluteUri, separator, true, encoding); int tokenCount = -1; 
DataContainer container = new DataContainer(); while ((container = iterator.next(container)) != null) { String[] tokens = container.getData(); if (sources == null) { tokenCount = tokens.length; sources = new NonNullSampleGenerator[tokenCount]; for (int i = 0; i < tokenCount; i++) { sources[i] = new NonNullSampleGenerator(String.class); sources[i].setUnique(unique); } } for (int i = 0; i < tokens.length; i++) if (!unique || !sources[i].contains(tokens[i])) sources[i].addValue(tokens[i]); if (excludeSeed) seed.add(StringUtil.concat(null, tokens)); } setSources(sources); super.init(context); } catch (IOException e) { throw new ConfigurationError("Error initializing " + getClass().getSimpleName() + " from URI " + uri, e); } } } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy