Source code for mFlow.Blocks.filter

import sys, os
from mFlow.Workflow.compute_graph import node
import time


def MisingLabelFilter(*args, **kwargs):
    """Create the "Missing Label Filter" workflow node.

    All positional and keyword arguments are handed to ``node`` unchanged
    (as its ``args`` and ``kwargs``), with ``__MisingLabelFilter`` as the
    node's function.

    Returns:
        Whatever ``node`` returns for this configuration.
    """
    return node(
        function=__MisingLabelFilter,
        args=args,
        kwargs=kwargs,
        name="Missing Label Filter",
    )
def __MisingLabelFilter(df, key="dataframe", inplace=False):
    """Drop every row whose ``"target"`` value is missing.

    Args:
        df: Container indexed by ``key`` that holds the frame to filter
            (the frame must offer a pandas-style ``dropna``).
        key: Entry of ``df`` to read the frame from.
        inplace: If true, the rows are removed from the input frame itself
            and that same object is returned; otherwise a filtered copy is
            returned and the input is left untouched.

    Returns:
        dict: ``{"dataframe": <filtered frame>}``.
    """
    frame = df[key]
    if inplace:
        # dropna(inplace=True) returns None, so hand back the mutated frame
        # instead of the call's result.
        frame.dropna(axis=0, subset=["target"], inplace=True)
        return {"dataframe": frame}
    return {"dataframe": frame.dropna(axis=0, subset=["target"])}
def MisingDataRowFilter(*args, **kwargs):
    """Create the "Missing Data Row Filter" workflow node.

    All positional and keyword arguments are handed to ``node`` unchanged
    (as its ``args`` and ``kwargs``), with ``__MisingDataRowFilter`` as the
    node's function.

    Returns:
        Whatever ``node`` returns for this configuration.
    """
    return node(
        function=__MisingDataRowFilter,
        args=args,
        kwargs=kwargs,
        name="Missing Data Row Filter",
    )
def __MisingDataRowFilter(df, thresh=0.2, inplace=False, key="dataframe"):
    """Drop rows that contain too few non-missing values.

    A row is kept when its count of non-missing values is at least
    ``thresh`` times the number of columns.

    Args:
        df: Container indexed by ``key`` that holds the frame to filter
            (the frame must offer a pandas-style ``dropna`` and ``shape``).
        thresh: Minimum fraction of a row's values that must be present.
        inplace: If true, the rows are removed from the input frame itself
            and that same object is returned; otherwise a filtered copy is
            returned and the input is left untouched.
        key: Entry of ``df`` to read the frame from.

    Returns:
        dict: ``{"dataframe": <filtered frame>}``.
    """
    frame = df[key]
    # With axis=0 the threshold counts values *within a row*, i.e. one per
    # column, so the fraction must be scaled by the column count.
    min_present = thresh * frame.shape[1]
    if inplace:
        # dropna(inplace=True) returns None, so hand back the mutated frame
        # instead of the call's result.
        frame.dropna(axis=0, thresh=min_present, inplace=True)
        return {"dataframe": frame}
    return {"dataframe": frame.dropna(axis=0, thresh=min_present)}
def MisingDataColumnFilter(*args, **kwargs):
    """Create the "Missing Data Column Filter" workflow node.

    All positional and keyword arguments are handed to ``node`` unchanged
    (as its ``args`` and ``kwargs``), with ``__MisingDataColumnFilter`` as
    the node's function.

    Returns:
        Whatever ``node`` returns for this configuration.
    """
    return node(
        function=__MisingDataColumnFilter,
        args=args,
        kwargs=kwargs,
        name="Missing Data Column Filter",
    )
def __MisingDataColumnFilter(df, thresh=0.2, inplace=False, key="dataframe"):
    """Drop columns that contain too few non-missing values.

    A column is kept when its count of non-missing values is at least
    ``thresh`` times the number of rows.

    Args:
        df: Container indexed by ``key`` that holds the frame to filter
            (the frame must offer a pandas-style ``dropna`` and ``shape``).
        thresh: Minimum fraction of a column's values that must be present.
        inplace: If true, the columns are removed from the input frame
            itself and that same object is returned; otherwise a filtered
            copy is returned and the input is left untouched.
        key: Entry of ``df`` to read the frame from.

    Returns:
        dict: ``{"dataframe": <filtered frame>}``.
    """
    frame = df[key]
    # With axis=1 the threshold counts values within a column, one per row.
    min_present = thresh * frame.shape[0]
    if inplace:
        # dropna(inplace=True) returns None, so hand back the mutated frame
        # instead of the call's result.
        frame.dropna(axis=1, thresh=min_present, inplace=True)
        return {"dataframe": frame}
    return {"dataframe": frame.dropna(axis=1, thresh=min_present)}
def Take(*args, **kwargs):
    """Create the "Take" workflow node.

    All positional and keyword arguments are handed to ``node`` unchanged
    (as its ``args`` and ``kwargs``), with ``__Take`` as the node's function.

    Returns:
        Whatever ``node`` returns for this configuration.
    """
    return node(
        function=__Take,
        args=args,
        kwargs=kwargs,
        name="Take",
    )
def __Take(df, num):
    """Slice the ``"dataframe"`` entry of ``df`` with ``[:num]``.

    Args:
        df: Container whose ``"dataframe"`` entry is the object to slice.
        num: Stop bound of the slice.

    Returns:
        dict: ``{"dataframe": <sliced object>}``.
    """
    head = df["dataframe"][slice(None, num)]
    return {"dataframe": head}
def ColumnSelectFilter(*args, **kwargs):
    """Create the "Column Filter" workflow node.

    All positional and keyword arguments are handed to ``node`` unchanged
    (as its ``args`` and ``kwargs``), with ``__ColumnSelectFilter`` as the
    node's function.

    Returns:
        Whatever ``node`` returns for this configuration.
    """
    return node(
        function=__ColumnSelectFilter,
        args=args,
        kwargs=kwargs,
        name="Column Filter",
    )
def __ColumnSelectFilter(df, cols, key="dataframe"):
    """Index the frame stored under ``key`` with ``cols``.

    Args:
        df: Container indexed by ``key`` that holds the frame.
        cols: Selector passed to the frame's ``[]`` operator.
        key: Entry of ``df`` to read the frame from.

    Returns:
        dict: ``{"dataframe": <selection>}``.
    """
    selected = df[key][cols]
    return {"dataframe": selected}