Upload 2 files
Browse files
EDA.py
ADDED
@@ -0,0 +1,33 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import os
|
2 |
+
import streamlit as st
|
3 |
+
import glob
|
4 |
+
import pandas as pd
|
5 |
+
import matplotlib.pyplot as plt
|
6 |
+
|
7 |
+
def run_eda():
|
8 |
+
st.title('CNN Image Classifier')
|
9 |
+
|
10 |
+
# Set directories
|
11 |
+
train_dir = "Data/train"
|
12 |
+
|
13 |
+
|
14 |
+
|
15 |
+
# train sets
|
16 |
+
for files in os.listdir(train_dir):
|
17 |
+
print(os.path.join(train_dir,files))
|
18 |
+
|
19 |
+
num_A = len(glob.glob(os.path.join(train_dir, "normal", "*.png")))
|
20 |
+
num_ad = len(glob.glob(os.path.join(train_dir, "adenocarcinoma_left.lower.lobe_T2_N0_M0_Ib", "*.png")))
|
21 |
+
num_sq = len(glob.glob(os.path.join(train_dir, "squamous.cell.carcinoma_left.hilum_T1_N2_M0_IIIa", "*.png")))
|
22 |
+
num_lg = len(glob.glob(os.path.join(train_dir, "large.cell.carcinoma_left.hilum_T2_N2_M0_IIIa", "*.png")))
|
23 |
+
|
24 |
+
|
25 |
+
class_names = ['Normal', 'Adenocarcinoma', 'Squamous', 'Large Cell']
|
26 |
+
num_images = [num_A, num_ad, num_sq, num_lg]
|
27 |
+
|
28 |
+
fig, ax = plt.subplots()
|
29 |
+
ax.bar(class_names, num_images)
|
30 |
+
ax.set_title('Banyaknya Data Setiap Kelas pada Dataset Train')
|
31 |
+
ax.set_xlabel('Kelas')
|
32 |
+
ax.set_ylabel('Jumlah Data')
|
33 |
+
st.pyplot(fig)
|