Spaces:
Sleeping
Sleeping
celineclarissa
committed on
Commit
•
00ea715
1
Parent(s):
6275b71
Upload eda.py
Browse files
eda.py
CHANGED
@@ -30,8 +30,19 @@ def run():
|
|
30 |
# Show dataframe
|
31 |
st.write('### Dataset')
|
32 |
df = pd.read_csv('df_ori.csv')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
st.dataframe(df)
|
34 |
|
|
|
35 |
st.write('')
|
36 |
st.markdown('---')
|
37 |
st.write('')
|
|
|
30 |
# Show dataframe
|
31 |
st.write('### Dataset')
|
32 |
df = pd.read_csv('df_ori.csv')
|
33 |
+
|
34 |
+
# data cleaning
|
35 |
+
# drop unused columns
|
36 |
+
df = df.drop(columns='Unnamed: 0')
|
37 |
+
# replace 6 with 5 in the "education_level" column
|
38 |
+
df['education_level'] = df['education_level'].replace(6, 5)
|
39 |
+
# replace 0.0 with -1.0 in the "pay_[i]" columns
|
40 |
+
df[['pay_0', 'pay_2', 'pay_3', 'pay_4', 'pay_5', 'pay_6']] = df[['pay_0', 'pay_2', 'pay_3', 'pay_4', 'pay_5', 'pay_6']].replace(0.0, -1.0)
|
41 |
+
|
42 |
+
# show cleaned dataset
|
43 |
st.dataframe(df)
|
44 |
|
45 |
+
# make border
|
46 |
st.write('')
|
47 |
st.markdown('---')
|
48 |
st.write('')
|