Source code for mFlow.Blocks.normalizer


import pandas as pd
import numpy as np
from sklearn.preprocessing import RobustScaler
import sys, os
from mFlow.Workflow.compute_graph import node

[docs]def Normalizer(*args, **kwargs): return node(function = __Normalizer, args=args, kwargs=kwargs, name="Normalizer")
def __Normalizer(df, show=False): model = RobustScaler() df = df["dataframe"] features = list(set(df.columns) - {'target'}) numeric = df[features].values h,w = numeric.shape if(show): print(" Normalizer: running matrix of size %dx%d"%(h,w)) model.fit(numeric) out = model.transform(numeric) df1 = pd.DataFrame(data=out, columns=features, index=df.index) if 'target' in df.columns: df1['target'] = df['target'] #df = df1.copy() return({"dataframe":df1})