
prerna.reactor.frame.py.ExtractLettersReactor Maven / Gradle / Ivy
The newest version!
package prerna.reactor.frame.py;
import java.util.List;
import java.util.Vector;
import org.apache.logging.log4j.LogManager;
import org.apache.logging.log4j.Logger;
import prerna.algorithm.api.SemossDataType;
import prerna.ds.OwlTemporalEngineMeta;
import prerna.ds.py.PandasFrame;
import prerna.sablecc2.om.GenRowStruct;
import prerna.sablecc2.om.PixelDataType;
import prerna.sablecc2.om.PixelOperationType;
import prerna.sablecc2.om.ReactorKeysEnum;
import prerna.sablecc2.om.nounmeta.NounMetadata;
import prerna.util.Constants;
import prerna.util.Utility;
import prerna.util.usertracking.AnalyticsTrackerHelper;
import prerna.util.usertracking.UserTrackerFactory;
public class ExtractLettersReactor extends AbstractPyFrameReactor {
public static final String ALPHA_COLUMN_NAME = "_ALPHA";
private static final Logger classLogger = LogManager.getLogger(ExtractLettersReactor.class);
public ExtractLettersReactor() {
this.keysToGet = new String[] { ReactorKeysEnum.COLUMNS.getKey(), ReactorKeysEnum.OVERRIDE.getKey() };
}
@Override
public NounMetadata execute() {
// get frame
PandasFrame frame = (PandasFrame) getFrame();
OwlTemporalEngineMeta metaData = frame.getMetaData();
// get table name
String wrapperFrameName = frame.getWrapperName();
// get columns to extract alphabet characters
List columns = getColumns();
// check if user want to override the column or create new columns
boolean overrideColumn = getOverride();
// we need to check data types this will only be valid on non numeric values
OwlTemporalEngineMeta metadata = frame.getMetaData();
// extracts the letters
//mv['add'] = mv.apply(lambda x: re.sub('\d+', '', x['MovieBudget']) if not(isinstance(x['MovieBudget'], int)) else x['MovieBudget'] , axis=1)
List opTypes = new Vector();
opTypes.add(PixelOperationType.FRAME_DATA_CHANGE);
StringBuilder commands = new StringBuilder();
// update existing columns
if (overrideColumn) {
for (int i = 0; i < columns.size(); i++) {
String column = columns.get(i);
// check data type this is only valid on non numeric values
SemossDataType dataType = metadata.getHeaderTypeAsEnum(frame.getName() + "__" + column);
if (Utility.isStringType(dataType.toString())) {
try {
commands.append(wrapperFrameName + ".extract_alpha('" + column + "')\n");
} catch (Exception e) {
classLogger.error(Constants.STACKTRACE, e);
}
} else {
throw new IllegalArgumentException("Column type must be string");
}
}
}
// create new column
else {
opTypes.add(PixelOperationType.FRAME_HEADERS_CHANGE);
for (int i = 0; i < columns.size(); i++) {
String column = columns.get(i);
SemossDataType dataType = metadata.getHeaderTypeAsEnum(frame.getName() + "__" + column);
if (Utility.isStringType(dataType.toString())) {
String newColumn = getCleanNewColName(frame, column + ALPHA_COLUMN_NAME);
commands.append(wrapperFrameName + ".extract_alpha('" + column + "', '" + newColumn + "')\n");
metaData.addProperty(frame.getName(), frame.getName() + "__" + newColumn);
metaData.setAliasToProperty(frame.getName() + "__" + newColumn, newColumn);
metaData.setDataTypeToProperty(frame.getName() + "__" + newColumn, SemossDataType.STRING.toString());
} else {
throw new IllegalArgumentException("Column type must be string");
}
}
}
insight.getPyTranslator().runEmptyPy(commands.toString());
this.addExecutedCode(commands.toString());
// NEW TRACKING
UserTrackerFactory.getInstance().trackAnalyticsWidget(
this.insight,
frame,
"ExtractAlphaChars",
AnalyticsTrackerHelper.getHashInputs(this.store, this.keysToGet));
return new NounMetadata(frame, PixelDataType.FRAME, opTypes);
}
private List getColumns() {
GenRowStruct grs = this.store.getNoun(keysToGet[0]);
Vector columns = new Vector();
NounMetadata noun;
if (grs != null) {
for (int i = 0; i < grs.size(); i++) {
noun = grs.getNoun(i);
if (noun != null) {
String column = noun.getValue() + "";
if (column.length() > 0) {
columns.add(column);
}
}
}
}
return columns;
}
private boolean getOverride() {
GenRowStruct grs = this.store.getNoun(keysToGet[1]);
boolean override = false;
NounMetadata noun;
if (grs != null) {
noun = grs.getNoun(0);
override = (Boolean) noun.getValue();
}
return override;
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy