Théo Villette committed on
Commit
82c6295
1 Parent(s): cac478c

add categorical data

Browse files
Files changed (3) hide show
  1. app.py +1 -1
  2. datasets/house_california.csv +0 -0
  3. utils.py +1 -13
app.py CHANGED
@@ -2,7 +2,7 @@ import streamlit as st
2
  from flaml.automl.data import get_output_from_log
3
  import plotly.express as px
4
 
5
- from utils import csv_to_featuers_list, pre_process_df, pre_process_features
6
  from autoML import autoML
7
 
8
 
 
2
  from flaml.automl.data import get_output_from_log
3
  import plotly.express as px
4
 
5
+ from utils import csv_to_featuers_list
6
  from autoML import autoML
7
 
8
 
datasets/house_california.csv CHANGED
The diff for this file is too large to render. See raw diff
 
utils.py CHANGED
@@ -1,19 +1,7 @@
1
  import pandas as pd
2
- from sklearn.preprocessing import MinMaxScaler
3
 
4
  def csv_to_featuers_list(csv_file):
5
  if csv_file == None:
6
  return ['No csv yet']
7
  df = pd.read_csv(csv_file)
8
- return df.columns
9
-
10
- def pre_process_df(df):
11
- df.dropna(inplace=True)
12
- df.drop_duplicates(inplace=True)
13
- df.reset_index(inplace=True, drop=True)
14
- return df
15
-
16
- def pre_process_features(X):
17
- scaler = MinMaxScaler()
18
- X = scaler.fit_transform(X)
19
- return X
 
1
  import pandas as pd
 
2
 
3
  def csv_to_featuers_list(csv_file):
4
  if csv_file == None:
5
  return ['No csv yet']
6
  df = pd.read_csv(csv_file)
7
+ return df.columns