Spaces:
Sleeping
Sleeping
import gradio as gr | |
import pandas as pd | |
from clean import clean_data | |
from report import create_full_report, REPORT_DIR | |
import os | |
import tempfile | |
def clean_and_visualize(file, progress=gr.Progress()): | |
# Load the data | |
df = pd.read_csv(file.name) | |
# Clean the data | |
cleaned_df = None | |
nonconforming_cells_before = None | |
process_times = None | |
removed_columns = None | |
removed_rows = None | |
for progress_value, status_text in clean_data(df): | |
if isinstance(status_text, tuple): | |
cleaned_df, nonconforming_cells_before, process_times, removed_columns, removed_rows = status_text | |
progress(progress_value, desc="Cleaning completed") | |
else: | |
progress(progress_value, desc=status_text) | |
# Generate full visualization report | |
create_full_report( | |
df, | |
cleaned_df, | |
nonconforming_cells_before, | |
process_times, | |
removed_columns, | |
removed_rows | |
) | |
# Save cleaned DataFrame to a temporary CSV file | |
with tempfile.NamedTemporaryFile(delete=False, suffix='.csv') as tmp_file: | |
cleaned_df.to_csv(tmp_file.name, index=False) | |
cleaned_csv_path = tmp_file.name | |
# Collect all generated images | |
image_files = [os.path.join(REPORT_DIR, f) for f in os.listdir(REPORT_DIR) if f.endswith('.png')] | |
return cleaned_csv_path, image_files | |
def launch_app(): | |
with gr.Blocks() as app: | |
gr.Markdown("# AI Data Cleaner") | |
with gr.Row(): | |
file_input = gr.File(label="Upload CSV File") | |
with gr.Row(): | |
clean_button = gr.Button("Start Cleaning") | |
with gr.Row(): | |
progress_bar = gr.Progress() | |
with gr.Row(): | |
cleaned_file_output = gr.File(label="Download Cleaned CSV", visible=False) | |
with gr.Row(): | |
output_gallery = gr.Gallery(label="Visualization Results", show_label=True, elem_id="gallery", columns=[2], | |
rows=[2], object_fit="contain", height="auto") | |
def process_and_show_download(file): | |
cleaned_csv_path, image_files = clean_and_visualize(file, progress=progress_bar) | |
return gr.File.update(value=cleaned_csv_path, visible=True), image_files | |
clean_button.click( | |
fn=process_and_show_download, | |
inputs=file_input, | |
outputs=[cleaned_file_output, output_gallery] | |
) | |
app.launch() | |
if __name__ == "__main__": | |
launch_app() |