
// smile.data.IndexDataFrame (Maven / Gradle / Ivy)
/*
* Copyright (c) 2010-2021 Haifeng Li. All rights reserved.
*
* Smile is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* Smile is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with Smile. If not, see <https://www.gnu.org/licenses/>.
*/
package smile.data;
import java.util.Arrays;
import java.util.Iterator;
import java.util.stream.Stream;
import smile.data.type.*;
import smile.data.vector.*;
/**
 * A data frame with a new index instead of the default [0, n) row index.
 * <p>
 * This class is a view: row {@code i} of this frame is row {@code index[i]}
 * of the underlying data frame. Neither the underlying frame nor the index
 * array is copied by the constructor, so the caller should not modify the
 * array afterwards.
 *
 * @author Haifeng Li
 */
public class IndexDataFrame implements DataFrame {
    /** The underlying data frame. */
    private final DataFrame df;
    /** The row index: position {@code i} holds the underlying row number of row {@code i}. */
    private final int[] index;

    /**
     * Constructor.
     * @param df The underlying data frame.
     * @param index The row index. The array is stored as is, without copying.
     * @throws NullPointerException if {@code df} or {@code index} is null.
     */
    public IndexDataFrame(DataFrame df, int[] index) {
        // Fail fast here instead of at the first, unrelated-looking accessor call.
        this.df = java.util.Objects.requireNonNull(df, "df");
        this.index = java.util.Objects.requireNonNull(index, "index");
    }

    /** Returns the schema of the underlying data frame; re-indexing rows does not change columns. */
    @Override
    public StructType schema() {
        return df.schema();
    }

    @Override
    public String toString() {
        return toString(10, true);
    }

    /** Delegates the column name lookup to the underlying data frame. */
    @Override
    public int indexOf(String name) {
        return df.indexOf(name);
    }

    /** Returns the number of rows, which is the length of the row index. */
    @Override
    public int size() {
        return index.length;
    }

    /** Returns the number of columns of the underlying data frame. */
    @Override
    public int ncol() {
        return df.ncol();
    }

    /** Returns the cell at underlying row {@code index[i]} and column {@code j}. */
    @Override
    public Object get(int i, int j) {
        return df.get(index[i], j);
    }

    /** Returns the rows of the underlying data frame, visited in the order given by the row index. */
    @Override
    public Stream<Tuple> stream() {
        return Arrays.stream(index).mapToObj(df::get);
    }

    /** Returns an iterator over the same row sequence as {@link #stream()}. */
    @Override
    public Iterator<Tuple> iterator() {
        return stream().iterator();
    }

    // Column accessors: each one fetches the column from the underlying
    // data frame and passes the row index to the vector's own get(int[]).

    @Override
    public BaseVector column(int i) {
        return df.column(i).get(index);
    }

    // NOTE(review): Vector is used as a raw type here. If DataFrame declares
    // this accessor with a type parameter, restore it on this override too;
    // confirm against the interface.
    @Override
    public Vector vector(int i) {
        return df.vector(i).get(index);
    }

    @Override
    public BooleanVector booleanVector(int i) {
        return df.booleanVector(i).get(index);
    }

    @Override
    public CharVector charVector(int i) {
        return df.charVector(i).get(index);
    }

    @Override
    public ByteVector byteVector(int i) {
        return df.byteVector(i).get(index);
    }

    @Override
    public ShortVector shortVector(int i) {
        return df.shortVector(i).get(index);
    }

    @Override
    public IntVector intVector(int i) {
        return df.intVector(i).get(index);
    }

    @Override
    public LongVector longVector(int i) {
        return df.longVector(i).get(index);
    }

    @Override
    public FloatVector floatVector(int i) {
        return df.floatVector(i).get(index);
    }

    @Override
    public DoubleVector doubleVector(int i) {
        return df.doubleVector(i).get(index);
    }

    @Override
    public StringVector stringVector(int i) {
        return df.stringVector(i).get(index);
    }

    /** Applies the column selection to the underlying data frame and keeps the same row index. */
    @Override
    public DataFrame select(int... cols) {
        return new IndexDataFrame(df.select(cols), index);
    }

    /** Drops the columns from the underlying data frame and keeps the same row index. */
    @Override
    public DataFrame drop(int... cols) {
        return new IndexDataFrame(df.drop(cols), index);
    }

    /** Returns a new data frame with regular index, built from the rows of {@link #stream()}. */
    private DataFrame rebase() {
        return DataFrame.of(stream().collect(java.util.stream.Collectors.toList()));
    }

    /**
     * Merges this frame with other data frames after rebasing this frame
     * to a regular index.
     * @param dataframes The data frames to merge with.
     * @throws IllegalArgumentException if any data frame has a different
     *         number of rows than this one.
     */
    @Override
    public DataFrame merge(DataFrame... dataframes) {
        // Named "other" so the loop variable does not shadow the field df.
        for (DataFrame other : dataframes) {
            if (other.size() != size()) {
                throw new IllegalArgumentException("Merge data frames with different size: " + size() + " vs " + other.size());
            }
        }
        return rebase().merge(dataframes);
    }

    /**
     * Merges this frame with extra column vectors after rebasing this frame
     * to a regular index.
     * @param vectors The vectors to merge with.
     * @throws IllegalArgumentException if any vector has a different
     *         size than the number of rows of this frame.
     */
    @Override
    public DataFrame merge(BaseVector... vectors) {
        for (BaseVector vector : vectors) {
            if (vector.size() != size()) {
                throw new IllegalArgumentException("Merge data frames with different size: " + size() + " vs " + vector.size());
            }
        }
        return rebase().merge(vectors);
    }

    /**
     * Unions this frame with other data frames after rebasing this frame
     * to a regular index.
     * @param dataframes The data frames to union with.
     * @throws IllegalArgumentException if any data frame has a schema
     *         that is not equal to the schema of this frame.
     */
    @Override
    public DataFrame union(DataFrame... dataframes) {
        // Named "other" so the loop variable does not shadow the field df.
        for (DataFrame other : dataframes) {
            if (!schema().equals(other.schema())) {
                throw new IllegalArgumentException("Union data frames with different schema: " + schema() + " vs " + other.schema());
            }
        }
        return rebase().union(dataframes);
    }

    /** Returns row {@code index[i]} of the underlying data frame. */
    @Override
    public Tuple get(int i) {
        return df.get(index[i]);
    }
}
// © 2015 - 2025 Weber Informatics LLC | Privacy Policy