Théo Villette
committed on
Commit
·
82c6295
1
Parent(s):
cac478c
add categorical data
Browse files
- app.py +1 -1
- datasets/house_california.csv +0 -0
- utils.py +1 -13
app.py
CHANGED
|
@@ -2,7 +2,7 @@ import streamlit as st
|
|
| 2 |
from flaml.automl.data import get_output_from_log
|
| 3 |
import plotly.express as px
|
| 4 |
|
| 5 |
-
from utils import csv_to_featuers_list
|
| 6 |
from autoML import autoML
|
| 7 |
|
| 8 |
|
|
|
|
| 2 |
from flaml.automl.data import get_output_from_log
|
| 3 |
import plotly.express as px
|
| 4 |
|
| 5 |
+
from utils import csv_to_featuers_list
|
| 6 |
from autoML import autoML
|
| 7 |
|
| 8 |
|
datasets/house_california.csv
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
utils.py
CHANGED
|
@@ -1,19 +1,7 @@
|
|
| 1 |
import pandas as pd
|
| 2 |
-
from sklearn.preprocessing import MinMaxScaler
|
| 3 |
|
| 4 |
def csv_to_featuers_list(csv_file):
|
| 5 |
if csv_file == None:
|
| 6 |
return ['No csv yet']
|
| 7 |
df = pd.read_csv(csv_file)
|
| 8 |
-
return df.columns
|
| 9 |
-
|
| 10 |
-
def pre_process_df(df):
|
| 11 |
-
df.dropna(inplace=True)
|
| 12 |
-
df.drop_duplicates(inplace=True)
|
| 13 |
-
df.reset_index(inplace=True, drop=True)
|
| 14 |
-
return df
|
| 15 |
-
|
| 16 |
-
def pre_process_features(X):
|
| 17 |
-
scaler = MinMaxScaler()
|
| 18 |
-
X = scaler.fit_transform(X)
|
| 19 |
-
return X
|
|
|
|
| 1 |
import pandas as pd
|
|
|
|
| 2 |
|
| 3 |
def csv_to_featuers_list(csv_file):
|
| 4 |
if csv_file == None:
|
| 5 |
return ['No csv yet']
|
| 6 |
df = pd.read_csv(csv_file)
|
| 7 |
+
return df.columns
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|