celineclarissa committed on
Commit
00ea715
1 Parent(s): 6275b71

Upload eda.py

Browse files
Files changed (1) hide show
  1. eda.py +11 -0
eda.py CHANGED
@@ -30,8 +30,19 @@ def run():
30
  # Show dataframe
31
  st.write('### Dataset')
32
  df = pd.read_csv('df_ori.csv')
 
 
 
 
 
 
 
 
 
 
33
  st.dataframe(df)
34
 
 
35
  st.write('')
36
  st.markdown('---')
37
  st.write('')
 
30
  # Show dataframe
31
  st.write('### Dataset')
32
  df = pd.read_csv('df_ori.csv')
33
+
34
+ # data cleaning
35
+ #drop unused columns
36
+ df = df.drop(columns='Unnamed: 0')
37
+ # replace "6" as "5" in "education_level" column
38
+ df['education_level'] = df['education_level'].replace(6, 5)
39
+ # replace "0.0" as "-1.0" in "pay_[i]" column
40
+ df[['pay_0', 'pay_2', 'pay_3', 'pay_4', 'pay_5', 'pay_6']] = df[['pay_0', 'pay_2', 'pay_3', 'pay_4', 'pay_5', 'pay_6']].replace(0.0, -1.0)
41
+
42
+ # show cleaned dataset
43
  st.dataframe(df)
44
 
45
+ # make border
46
  st.write('')
47
  st.markdown('---')
48
  st.write('')