
// smile.data.vector.StringVectorImpl Maven / Gradle / Ivy
/*
* Copyright (c) 2010-2021 Haifeng Li. All rights reserved.
*
* Smile is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Smile is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Smile. If not, see <https://www.gnu.org/licenses/>.
*/
package smile.data.vector;
import java.time.LocalDate;
import java.time.LocalDateTime;
import java.time.LocalTime;
import java.time.format.DateTimeFormatter;
import java.util.Collections;
import java.util.List;
import smile.data.measure.CategoricalMeasure;
import smile.data.measure.NominalScale;
import smile.data.type.DataTypes;
import smile.data.type.StructField;
/**
 * An immutable string vector.
 *
 * <p>Besides element access, the vector can parse its values into
 * date/time vectors, derive a nominal scale from its distinct values,
 * and encode its values as the integer codes of a categorical measure.
 *
 * @author Haifeng Li
 */
class StringVectorImpl extends VectorImpl<String> implements StringVector {
    /**
     * Constructor.
     *
     * @param name the name of the vector.
     * @param vector the string values.
     */
    public StringVectorImpl(String name, String[] vector) {
        super(name, String.class, vector);
    }

    /**
     * Constructor.
     *
     * @param field the struct field supplying the name and type of the vector.
     *              It must not carry a measure.
     * @param vector the string values.
     * @throws IllegalArgumentException if {@code field.measure} is not null.
     */
    public StringVectorImpl(StructField field, String[] vector) {
        super(field.name, field.type, vector);
        if (field.measure != null) {
            throw new IllegalArgumentException(String.format("Invalid measure %s for %s", field.measure, type()));
        }
    }

    /**
     * Returns a new vector made of the elements at the given positions,
     * in the order the positions are listed.
     *
     * @param index the positions of the elements to select.
     * @return a new string vector with the selected elements.
     */
    @Override
    public StringVector get(int... index) {
        String[] v = new String[index.length];
        for (int i = 0; i < index.length; i++) {
            v[i] = get(index[i]);
        }
        return new StringVectorImpl(field(), v);
    }

    /**
     * Parses the strings as dates with {@link DateTimeFormatter#ISO_LOCAL_DATE}.
     *
     * @return the vector of parsed dates.
     */
    @Override
    public Vector<LocalDate> toDate() {
        return toDate(DateTimeFormatter.ISO_LOCAL_DATE);
    }

    /**
     * Parses the strings as dates with the given formatter.
     *
     * @param format the formatter used to parse every element.
     * @return the vector of parsed dates, with the same name as this vector.
     * @throws java.time.format.DateTimeParseException if an element cannot be parsed.
     */
    @Override
    public Vector<LocalDate> toDate(DateTimeFormatter format) {
        LocalDate[] dates = stream().map(format::parse).map(LocalDate::from).toArray(LocalDate[]::new);
        return new VectorImpl<>(name(), DataTypes.DateType, dates);
    }

    /**
     * Parses the strings as times with {@link DateTimeFormatter#ISO_LOCAL_TIME}.
     *
     * @return the vector of parsed times.
     */
    @Override
    public Vector<LocalTime> toTime() {
        return toTime(DateTimeFormatter.ISO_LOCAL_TIME);
    }

    /**
     * Parses the strings as times with the given formatter.
     *
     * @param format the formatter used to parse every element.
     * @return the vector of parsed times, with the same name as this vector.
     * @throws java.time.format.DateTimeParseException if an element cannot be parsed.
     */
    @Override
    public Vector<LocalTime> toTime(DateTimeFormatter format) {
        LocalTime[] times = stream().map(format::parse).map(LocalTime::from).toArray(LocalTime[]::new);
        return new VectorImpl<>(name(), DataTypes.TimeType, times);
    }

    /**
     * Parses the strings as date-times with {@link DateTimeFormatter#ISO_LOCAL_DATE_TIME}.
     *
     * @return the vector of parsed date-times.
     */
    @Override
    public Vector<LocalDateTime> toDateTime() {
        return toDateTime(DateTimeFormatter.ISO_LOCAL_DATE_TIME);
    }

    /**
     * Parses the strings as date-times with the given formatter.
     *
     * @param format the formatter used to parse every element.
     * @return the vector of parsed date-times, with the same name as this vector.
     * @throws java.time.format.DateTimeParseException if an element cannot be parsed.
     */
    @Override
    public Vector<LocalDateTime> toDateTime(DateTimeFormatter format) {
        LocalDateTime[] dateTimes = stream().map(format::parse).map(LocalDateTime::from).toArray(LocalDateTime[]::new);
        return new VectorImpl<>(name(), DataTypes.DateTimeType, dateTimes);
    }

    /**
     * Builds a nominal scale whose levels are the distinct non-null values
     * of this vector, sorted in natural order.
     *
     * @return the nominal scale.
     */
    @Override
    public NominalScale nominal() {
        List<String> levels = distinct();
        // Nulls are missing values (factorize encodes them as -1), not levels;
        // left in place they make the natural-order sort below throw
        // NullPointerException as soon as any other value is present.
        levels.removeIf(level -> level == null);
        Collections.sort(levels);
        return new NominalScale(levels);
    }

    /**
     * Encodes the strings as the integer codes of the given categorical measure.
     * The result is a byte, short or int vector depending on the type reported
     * by the measure. Null elements are encoded as -1.
     *
     * @param scale the categorical measure that maps each string to its code.
     * @return the vector of codes, carrying the same name and the given measure.
     * @throws UnsupportedOperationException if the type of the measure is not
     *         byte, short or integer.
     */
    @Override
    public BaseVector factorize(CategoricalMeasure scale) {
        switch (scale.type().id()) {
            case Byte: {
                byte[] data = new byte[size()];
                for (int i = 0; i < data.length; i++) {
                    String s = get(i);
                    data[i] = s == null ? (byte) -1 : scale.valueOf(s).byteValue();
                }
                return new ByteVectorImpl(new StructField(name(), DataTypes.ByteType, scale), data);
            }

            case Short: {
                short[] data = new short[size()];
                for (int i = 0; i < data.length; i++) {
                    String s = get(i);
                    data[i] = s == null ? (short) -1 : scale.valueOf(s).shortValue();
                }
                return new ShortVectorImpl(new StructField(name(), DataTypes.ShortType, scale), data);
            }

            case Integer: {
                int[] data = new int[size()];
                for (int i = 0; i < data.length; i++) {
                    String s = get(i);
                    data[i] = s == null ? -1 : scale.valueOf(s).intValue();
                }
                return new IntVectorImpl(new StructField(name(), DataTypes.IntegerType, scale), data);
            }

            default:
                // we should never reach here.
                throw new UnsupportedOperationException("Unsupported data type for nominal measure: " + scale.type());
        }
    }
}
// © 2015 - 2025 Weber Informatics LLC | Privacy Policy