All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.univocity.parsers.tsv.TsvFormat Maven / Gradle / Ivy

/*******************************************************************************
 * Copyright 2014 uniVocity Software Pty Ltd
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 ******************************************************************************/
package com.univocity.parsers.tsv;

import com.univocity.parsers.common.*;

import java.util.*;

/**
 * The TSV format configuration, for tab-separated inputs. It offers the options in the default configuration in {@link Format}, as well as
 * the escape character (see {@link #getEscapeChar()}) used for escaping \t, \n, \r and \ in TSV values.
 *
 * Delimiters are defined as tab characters '\t'
 *
 * @see com.univocity.parsers.common.Format
 *
 * @author uniVocity Software Pty Ltd - [email protected]
 *
 */
public class TsvFormat extends Format {

	/** Character that introduces an escape sequence in a TSV value. */
	private char escapeChar = '\\';

	/** Character that, when placed right after {@link #escapeChar}, stands for a tab. */
	private char escapedTabChar = 't';

	/**
	 * Defines the character used for escaping special characters in TSV inputs: \t, \n, \r and \ . Defaults to '\\'
	 * @param escapeChar the escape character
	 */
	public void setEscapeChar(char escapeChar) {
		this.escapeChar = escapeChar;
	}

	/**
	 * Returns the character used for escaping special characters in TSV inputs: \t, \n, \r and \
	 * @return the escape character.
	 */
	public char getEscapeChar() {
		return escapeChar;
	}

	/**
	 * Returns the character that should be used to represent an escaped tab, i.e. the character that comes right after
	 * the defined {@link #getEscapeChar()}. For example, if {@link #getEscapeChar()} == '\\' and
	 * {@link #getEscapedTabChar()} == 'X', the sequence {@code '\X'} will identify a tab.
	 *
	 * Defaults to {@code 't'}.
	 *
	 * @return the character following the {@link #getEscapeChar()} that represents an escaped tab.
	 */
	public char getEscapedTabChar() {
		return escapedTabChar;
	}

	/**
	 * Defines the character that should be used to represent an escaped tab, i.e. the character that comes right after
	 * the defined {@link #getEscapeChar()}. For example, if {@link #getEscapeChar()} == '\\' and
	 * {@link #getEscapedTabChar()} == 'X', the sequence {@code '\X'} will identify a tab.
	 *
	 * Defaults to {@code 't'}.
	 *
	 * @param escapedTabChar the character following the {@link #getEscapeChar()} that represents an escaped tab.
	 */
	public void setEscapedTabChar(char escapedTabChar) {
		this.escapedTabChar = escapedTabChar;
	}

	/**
	 * Identifies whether or not a given character is used for escaping special characters in TSV (\t, \n, \r and \).
	 * @param ch the character to be verified
	 * @return true if the given character is escape character, false otherwise
	 */
	public boolean isEscapeChar(char ch) {
		return this.escapeChar == ch;
	}

	/**
	 * Collects the TSV-specific settings held by this format, keyed by a human-readable label.
	 * Both the escape character and the escaped tab character are reported, so the returned map
	 * reflects every setting declared in this class.
	 *
	 * @return a new map, sorted by label, with the current escape character and escaped tab character.
	 */
	@Override
	protected TreeMap<String, Object> getConfiguration() {
		TreeMap<String, Object> out = new TreeMap<String, Object>();
		out.put("Escape character", escapeChar);
		out.put("Escaped tab character", escapedTabChar);
		return out;
	}

	/**
	 * Returns a copy of this format, obtained from {@code super.clone()} and narrowed to {@code TsvFormat}.
	 *
	 * @return the cloned {@code TsvFormat}.
	 */
	@Override
	public final TsvFormat clone() {
		return (TsvFormat) super.clone();
	}
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy