org.jpmml.rexp.RecipeEncoder Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of pmml-rexp Show documentation
Show all versions of pmml-rexp Show documentation
JPMML R to PMML converter
The newest version!
/*
* Copyright (c) 2018 Villu Ruusmann
*
* This file is part of JPMML-R
*
* JPMML-R is free software: you can redistribute it and/or modify
* it under the terms of the GNU Affero General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* JPMML-R is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* You should have received a copy of the GNU Affero General Public License
* along with JPMML-R. If not, see .
*/
package org.jpmml.rexp;
import java.util.Collections;
import java.util.LinkedHashMap;
import java.util.List;
import java.util.Map;
import java.util.function.Function;
import java.util.stream.Collectors;
import org.dmg.pmml.DataField;
import org.jpmml.converter.Feature;
import org.jpmml.converter.Label;
import org.jpmml.converter.ScalarLabel;
import org.jpmml.converter.Schema;
public class RecipeEncoder extends TransformerEncoder {
private Map varRoles = Collections.emptyMap();
private Map varSources = Collections.emptyMap();
private Map varTypes = Collections.emptyMap();
private Map termRoles = Collections.emptyMap();
private Map termSources = Collections.emptyMap();
private Map termTypes = Collections.emptyMap();
public RecipeEncoder(RGenericVector recipe){
super(recipe);
RGenericVector varInfo = recipe.getGenericElement("var_info");
RGenericVector termInfo = recipe.getGenericElement("term_info");
this.varRoles = parseInfo(varInfo, "role", value -> Role.valueOf(value.toUpperCase()));
this.varSources = parseInfo(varInfo, "source", value -> Source.valueOf(value.toUpperCase()));
this.varTypes = parseInfo(varInfo, "type", value -> Type.valueOf(value.toUpperCase()));
this.termRoles = parseInfo(termInfo, "role", value -> Role.valueOf(value.toUpperCase()));
this.termSources = parseInfo(termInfo, "source", value -> Source.valueOf(value.toUpperCase()));
this.termTypes = parseInfo(termInfo, "type", value -> Type.valueOf(value.toUpperCase()));
}
@Override
public Schema createSchema(){
RGenericVector recipe = getObject();
Label label = getLabel();
List extends Feature> features = getFeatures();
RGenericVector steps = recipe.getGenericElement("steps");
List outcomeNames = this.termRoles.entrySet().stream()
.filter(entry -> (entry.getValue() == Role.OUTCOME))
.map(entry -> entry.getKey())
.collect(Collectors.toList());
if(outcomeNames.size() == 1){
ScalarLabel scalarLabel = (ScalarLabel)label;
String outcomeName = outcomeNames.get(0);
renameDataField(scalarLabel.getName(), outcomeName);
label = scalarLabel.toRenamedLabel(outcomeName);
} else
if(outcomeNames.size() >= 2){
throw new IllegalArgumentException();
} // End if
if(steps != null){
throw new IllegalArgumentException();
}
return new Schema(this, label, features);
}
private void renameDataField(String name, String renamedName){
DataField dataField = removeDataField(name);
dataField.setName(renamedName);
addDataField(dataField);
}
static
private > Map parseInfo(RGenericVector info, String name, Function function){
RStringVector variable = info.getStringElement("variable");
RStringVector value = info.getStringElement(name);
RVectorUtil.checkSize(variable, value);
Map result = new LinkedHashMap<>();
for(int i = 0; i < variable.size(); i++){
result.put(variable.getValue(i), function.apply(value.getValue(i)));
}
return result;
}
static
private enum Role {
OUTCOME,
PREDICTOR,
;
}
static
private enum Source {
ORIGINAL,
DERIVED,
;
}
static
private enum Type {
LOGICAL,
NOMINAL,
NUMERIC
;
}
}