M2P2 / EDA.py
Azrieldr's picture
Upload 2 files
8c8d0b4
import os
import streamlit as st
import glob
import pandas as pd
import matplotlib.pyplot as plt
def run_eda():
st.title('CNN Image Classifier')
# Set directories
train_dir = "Data/train"
# train sets
for files in os.listdir(train_dir):
print(os.path.join(train_dir,files))
num_A = len(glob.glob(os.path.join(train_dir, "normal", "*.png")))
num_ad = len(glob.glob(os.path.join(train_dir, "adenocarcinoma_left.lower.lobe_T2_N0_M0_Ib", "*.png")))
num_sq = len(glob.glob(os.path.join(train_dir, "squamous.cell.carcinoma_left.hilum_T1_N2_M0_IIIa", "*.png")))
num_lg = len(glob.glob(os.path.join(train_dir, "large.cell.carcinoma_left.hilum_T2_N2_M0_IIIa", "*.png")))
class_names = ['Normal', 'Adenocarcinoma', 'Squamous', 'Large Cell']
num_images = [num_A, num_ad, num_sq, num_lg]
fig, ax = plt.subplots()
ax.bar(class_names, num_images)
ax.set_title('Banyaknya Data Setiap Kelas pada Dataset Train')
ax.set_xlabel('Kelas')
ax.set_ylabel('Jumlah Data')
st.pyplot(fig)