org.jpmml.xgboost.XGBoostUtil Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of jpmml-xgboost Show documentation
Show all versions of jpmml-xgboost Show documentation
Java library and command-line application for converting XGBoost models to PMML
/*
* Copyright (c) 2016 Villu Ruusmann
*
* This file is part of JPMML-XGBoost
*
* JPMML-XGBoost is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* JPMML-XGBoost is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with JPMML-XGBoost. If not, see <http://www.gnu.org/licenses/>.
*/
package org.jpmml.xgboost;
import java.io.BufferedInputStream;
import java.io.DataInput;
import java.io.DataInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.io.Reader;
import java.nio.ByteOrder;
import java.util.Iterator;
import java.util.List;
import java.util.StringTokenizer;
import com.google.common.io.CharStreams;
import com.google.common.io.LittleEndianDataInputStream;
/**
 * Static helper methods for reading XGBoost model files ({@link Learner})
 * and feature map files ({@link FeatureMap}) from input streams.
 *
 * <p>
 * This class only has static members; its sole constructor is private.
 * </p>
 */
public class XGBoostUtil {

	private XGBoostUtil(){
	}

	/**
	 * Loads a learner using the native byte order of the underlying platform
	 * and a <code>null</code> charset.
	 *
	 * @param is The input stream to read the model from.
	 *
	 * @return The loaded learner.
	 *
	 * @throws IOException If an I/O error occurs.
	 *
	 * @see #loadLearner(InputStream, ByteOrder, String)
	 */
	static
	public Learner loadLearner(InputStream is) throws IOException {
		return loadLearner(is, ByteOrder.nativeOrder(), null);
	}

	/**
	 * Loads a learner using the JSON path <code>"$"</code>.
	 *
	 * @param is The input stream to read the model from.
	 * @param byteOrder The byte order of binary data; either {@link ByteOrder#BIG_ENDIAN} or {@link ByteOrder#LITTLE_ENDIAN}.
	 * @param charset The charset name; passed on unchanged to {@link Learner}. May be <code>null</code>.
	 *
	 * @return The loaded learner.
	 *
	 * @throws IOException If an I/O error occurs.
	 * @throws IllegalArgumentException If the byte order is not supported.
	 *
	 * @see #loadLearner(InputStream, ByteOrder, String, String)
	 */
	static
	public Learner loadLearner(InputStream is, ByteOrder byteOrder, String charset) throws IOException {
		return loadLearner(is, byteOrder, charset, "$");
	}

	/**
	 * Wraps the input stream into a data input stream of the requested byte order,
	 * and loads a learner from it.
	 *
	 * @param is The input stream to read the model from.
	 * @param byteOrder The byte order of binary data; either {@link ByteOrder#BIG_ENDIAN} or {@link ByteOrder#LITTLE_ENDIAN}.
	 * @param charset The charset name; passed on unchanged to {@link Learner}. May be <code>null</code>.
	 * @param jsonPath The JSON path; passed on unchanged to {@link Learner} when the content is detected to be JSON.
	 *
	 * @return The loaded learner.
	 *
	 * @throws IOException If an I/O error occurs.
	 * @throws IllegalArgumentException If the byte order is neither big-endian nor little-endian (including <code>null</code>).
	 */
	static
	public Learner loadLearner(InputStream is, ByteOrder byteOrder, String charset, String jsonPath) throws IOException {
		// The format detection step below peeks at the first byte, which requires mark/reset support
		is = new BufferedInputStream(is, 16);

		if((ByteOrder.BIG_ENDIAN).equals(byteOrder)){
			return loadLearner(new DataInputStream(is), charset, jsonPath);
		} else

		if((ByteOrder.LITTLE_ENDIAN).equals(byteOrder)){
			return loadLearner(new LittleEndianDataInputStream(is), charset, jsonPath);
		} else

		{
			throw new IllegalArgumentException("Unsupported byte order: " + byteOrder);
		}
	}

	/**
	 * Detects the model format by peeking at the first byte of the stream,
	 * and loads a learner using the matching {@link Learner} loading method.
	 *
	 * <p>
	 * If the first byte is <code>'{'</code>, then the content is loaded as JSON.
	 * Otherwise (including the case of an empty stream), the content is loaded as binary.
	 * The peeked byte is not consumed; the stream is reset before loading.
	 * </p>
	 *
	 * @param <DIS> An input stream type that also implements {@link DataInput}.
	 * @param is The data input stream to read the model from. Must support mark/reset.
	 * @param charset The charset name; passed on unchanged to {@link Learner}. May be <code>null</code>.
	 * @param jsonPath The JSON path; only used when the content is detected to be JSON.
	 *
	 * @return The loaded learner.
	 *
	 * @throws IOException If an I/O error occurs.
	 * @throws IllegalArgumentException If the stream does not support mark/reset.
	 */
	static
	public <DIS extends InputStream & DataInput> Learner loadLearner(DIS is, String charset, String jsonPath) throws IOException {

		if(!is.markSupported()){
			throw new IllegalArgumentException("The input stream does not support mark/reset");
		}

		boolean isJson;

		is.mark(1);

		try {
			int c = is.read();

			isJson = (c == '{');
		} finally {
			is.reset();
		}

		Learner learner = new Learner();

		if(isJson){
			learner.loadJSON(is, charset, jsonPath);
		} else

		{
			learner.loadBinary(is, charset);
		}

		return learner;
	}

	/**
	 * Loads a feature map from UTF-8 encoded text.
	 *
	 * <p>
	 * Every line must consist of exactly three tab-separated tokens: id, name and type.
	 * The id must be an integer that equals the zero-based index of the line.
	 * Tokenization is done using {@link StringTokenizer}, which means that empty tokens
	 * (eg. two consecutive tab characters) are not recognized as tokens.
	 * </p>
	 *
	 * @param is The input stream to read the feature map from. The stream is not closed by this method.
	 *
	 * @return The loaded feature map, with one entry per line, in line order.
	 *
	 * @throws IOException If an I/O error occurs.
	 * @throws IllegalArgumentException If a line does not have exactly three tokens, or if its id does not match the line index.
	 * The message is the offending line or id, respectively.
	 * An id that is not parseable as an integer results in a {@link NumberFormatException}.
	 */
	static
	public FeatureMap loadFeatureMap(InputStream is) throws IOException {
		FeatureMap featureMap = new FeatureMap();

		Iterator<String> lines = parseFeatureMap(is);

		for(int i = 0; lines.hasNext(); i++){
			String line = lines.next();

			StringTokenizer st = new StringTokenizer(line, "\t");

			if(st.countTokens() != 3){
				throw new IllegalArgumentException(line);
			}

			String id = st.nextToken();
			String name = st.nextToken();
			String type = st.nextToken();

			// Ids must form a contiguous zero-based sequence
			if(Integer.parseInt(id) != i){
				throw new IllegalArgumentException(id);
			}

			featureMap.addEntry(name, type);
		}

		return featureMap;
	}

	/**
	 * Reads the whole stream as UTF-8 encoded text, and splits it into lines.
	 *
	 * @param is The input stream to read. The stream is not closed by this method.
	 *
	 * @return An iterator over the lines, in reading order.
	 *
	 * @throws IOException If an I/O error occurs.
	 */
	static
	private Iterator<String> parseFeatureMap(InputStream is) throws IOException {
		Reader reader = new InputStreamReader(is, "UTF-8");

		List<String> lines = CharStreams.readLines(reader);

		return lines.iterator();
	}

	// NOTE(review): not referenced within this class; presumably a marker found at the start of serialized XGBoost data - confirm against Learner
	public static final String SERIALIZATION_HEADER = "CONFIG-offset:";

	// NOTE(review): not referenced within this class; presumably the magic prefix of binary XGBoost model files - confirm against Learner
	public static final String BINF_HEADER = "binf";
}