Spaces:
Sleeping
Sleeping
Update eda.py
Browse files
eda.py
CHANGED
@@ -8,6 +8,41 @@ def app():
|
|
8 |
|
9 |
# Load Data
|
10 |
df = pd.read_csv('../Transactions Data.csv')
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
11 |
|
12 |
# Data Summary
|
13 |
st.header('Data Summary')
|
|
|
8 |
|
9 |
# Load Data
|
10 |
df = pd.read_csv('../Transactions Data.csv')
|
11 |
+
|
12 |
+
# Creating the table with column names and descriptions
|
13 |
+
data = {
|
14 |
+
"Column Names": [
|
15 |
+
"step",
|
16 |
+
"type",
|
17 |
+
"amount",
|
18 |
+
"nameOrig",
|
19 |
+
"oldbalanceOrg",
|
20 |
+
"newbalanceOrig",
|
21 |
+
"nameDest",
|
22 |
+
"oldbalanceDest",
|
23 |
+
"newbalanceDest",
|
24 |
+
"isFraud",
|
25 |
+
"isFlaggedFraud"
|
26 |
+
],
|
27 |
+
"Description": [
|
28 |
+
"Represents a unit of time in the transaction process, though the specific time unit is not specified in the dataset. It could denote hours, days, or another unit, depending on the context.",
|
29 |
+
"Describes the type of transaction, such as transfer, payment, etc. This categorical variable allows for the classification of different transaction behaviors.",
|
30 |
+
"Indicates the monetary value of the transaction, providing insight into the financial magnitude of each transaction.",
|
31 |
+
"Serves as the identifier for the origin account or entity initiating the transaction. This helps trace the source of funds in each transaction.",
|
32 |
+
"Represents the balance in the origin account before the transaction occurred, offering a reference point for understanding changes in account balances.",
|
33 |
+
"Reflects the balance in the origin account after the transaction has been processed, providing insight into how the transaction affects the account balance.",
|
34 |
+
"Functions as the identifier for the destination account or entity receiving the funds in each transaction. It helps track where the money is being transferred to.",
|
35 |
+
"Indicates the balance in the destination account before the transaction, offering a baseline for assessing changes in account balances due to incoming funds.",
|
36 |
+
"Represents the balance in the destination account after the transaction has been completed, providing insight into the impact of incoming funds on the account balance.",
|
37 |
+
"A binary indicator (0 or 1) denoting whether the transaction is fraudulent (1) or legitimate (0). This is the target variable for fraud detection modeling.",
|
38 |
+
"Another binary indicator (0 or 1) which may signal whether a transaction has been flagged as potentially fraudulent. This could serve as an additional feature for fraud detection algorithms."
|
39 |
+
]}
|
40 |
+
|
41 |
+
# Displaying the table using Streamlit
|
42 |
+
st.subheader('Transaction Dataset Column Descriptions')
|
43 |
+
st.table(data)
|
44 |
+
|
45 |
+
st.divider()
|
46 |
|
47 |
# Data Summary
|
48 |
st.header('Data Summary')
|