import re
import random
from datetime import datetime
from typing import Dict, List, Tuple

import gradio as gr
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from matplotlib.patches import Rectangle

from dataset import DATASET
from constraint_parser_llm import parse_constraints
from semantic_ranker import score_courses  # optional; keep if you want semantic boost

# -------- Robust free-text constraint parsing (deterministic fallback) --------

# Every spelling of a day we accept in free text -> canonical 3-letter code.
DAY_ALIASES = {
    "sunday": "Sun", "sundays": "Sun", "sun": "Sun",
    "monday": "Mon", "mondays": "Mon", "mon": "Mon",
    "tuesday": "Tue", "tuesdays": "Tue", "tue": "Tue",
    "wednesday": "Wed", "wednesdays": "Wed", "wed": "Wed",
    "thursday": "Thu", "thursdays": "Thu", "thu": "Thu",
    "friday": "Fri", "fridays": "Fri", "fri": "Fri",
    "saturday": "Sat", "saturdays": "Sat", "sat": "Sat",
}
WEEKEND = {"Sat", "Sun"}
WEEKDAYS = {"Mon", "Tue", "Wed", "Thu", "Fri"}

# First hour shown on the timetable grid. A bare hour below it ("before 6")
# is read as PM, because a 6 AM bound would exclude every class.
_FIRST_TIMETABLE_HOUR = 8

# Words that introduce a banned day ("no ...", "avoid ...", "don't give me ...").
_BAN_TRIGGERS = (
    r"(?:no|avoid|except|skip|without|not\s+on|exclude|ban|block|never\s+on"
    r"|don['’]?t\s+give\s+me|do\s+not\s+give\s+me)"
)
_CLASS_NOUN = r"(?:(?:classes?|lectures?)\s*)?"
_ON = r"(?:on\s*)?"
# Longest aliases first so "mondays" is never cut short to "mon".
_DAY_ALTERNATION = "|".join(
    sorted((re.escape(alias) for alias in DAY_ALIASES), key=len, reverse=True)
)

_DAY_BAN_RE = re.compile(
    rf"\b{_BAN_TRIGGERS}\s+{_CLASS_NOUN}{_ON}(?P<day>{_DAY_ALTERNATION})\b"
)
_NO_WEEKEND_RE = re.compile(
    rf"\b{_BAN_TRIGGERS}\s+{_CLASS_NOUN}{_ON}(?:the\s+)?weekends?\b"
    r"|\bweekdays\s+only\b|\bonly\s+(?:on\s+)?weekdays\b"
)
_NO_WEEKDAY_RE = re.compile(
    rf"\b{_BAN_TRIGGERS}\s+{_CLASS_NOUN}{_ON}weekdays?\b"
    r"|\bweekends\s+only\b|\bonly\s+(?:on\s+)?weekends\b"
)

# "<optional negation> before|after <hour>[:<minute>] [am|pm]".
# The negation is captured because it flips the meaning:
# "before 6" caps the end time, "not before 6" sets the earliest start.
_TIME_BOUND_RE = re.compile(
    r"(?:\b(?P<neg>no|not|never|nothing)\s+(?:(?:classes?|lectures?)\s+)?)?"
    r"\b(?P<kw>before|after|earlier\s+than|later\s+than)\s+"
    r"(?P<hour>\d{1,2})(?::(?P<minute>\d{2}))?\s*(?P<ampm>am|pm)?\b"
)

_PART_OF_DAY_NEGATION = (
    r"(?:no|not|avoid|skip|without|never|exclude)\s+"
    r"(?:(?:classes?|lectures?)\s+)?(?:(?:in|on|during)\s+)?(?:the\s+)?"
)
# (word, bound set when the part of day is wanted,
#  bound set when it is unwanted, boundary time)
_PART_OF_DAY_RULES = (
    ("morning", "no_after", "no_before", "12:00 PM"),
    ("afternoon", "no_before", "no_after", "12:00 PM"),
    ("evening", "no_before", "no_after", "4:00 PM"),
)


def _norm_ampm(h: str, m: str | None, ap: str | None) -> str:
    """Normalize a loosely written clock time to ``"H:MM AM/PM"``.

    Args:
        h: Hour digits, 12-hour ("3") or 24-hour ("15").
        m: Minute digits, or None/"" for the top of the hour.
        ap: "am"/"pm" in any case, or None/"" when the user omitted it.

    Returns:
        A string that ``datetime.strptime(..., "%I:%M %p")`` can parse,
        e.g. ``"3:30 PM"``.

    Raises:
        ValueError: if the hour/minute is out of range or contradicts the
            given AM/PM marker (e.g. "15 am").
    """
    hour = int(h)
    minute = int(m or "0")
    if not 0 <= hour <= 23 or not 0 <= minute <= 59:
        raise ValueError(f"not a valid clock time: {h}:{m or '00'}")

    marker = (ap or "").upper()
    if marker not in ("AM", "PM"):
        marker = ""

    # 24-hour input is unambiguous; convert it rather than emitting
    # "15:00 PM", which %I cannot parse.
    if hour == 0:
        if marker == "PM":
            raise ValueError("hour 0 cannot be PM")
        return f"12:{minute:02d} AM"
    if hour > 12:
        if marker == "AM":
            raise ValueError(f"hour {hour} cannot be AM")
        return f"{hour - 12}:{minute:02d} PM"

    if not marker:
        # Heuristic for a bare hour: 8-11 -> AM; 12 and 1-7 -> PM.
        marker = "AM" if _FIRST_TIMETABLE_HOUR <= hour <= 11 else "PM"
    return f"{hour}:{minute:02d} {marker}"


def parse_det_constraints(text: str):
    """Deterministic, high-recall extraction of scheduling constraints.

    Returns a dict with:
      - banned_days: set of day codes, e.g. {"Mon", "Sun"}
      - no_before:   "H:MM AM/PM" or None (start times must be >= this)
      - no_after:    "H:MM AM/PM" or None (end times must be <= this)

    An explicit clock time ("after 10 am") takes precedence over a
    part-of-day shortcut ("afternoons") for the same bound. Clock times
    that cannot be normalized are ignored.
    """
    res = {"banned_days": set(), "no_before": None, "no_after": None}
    if not text:
        return res

    t = text.lower().strip()
    # Fold "a.m." / "p.m." into "am" / "pm" so one pattern covers both.
    t = re.sub(r"(?<![a-z])([ap])\.\s?m\.?", r"\1m", t)

    # Weekends / weekdays
    if _NO_WEEKEND_RE.search(t):
        res["banned_days"] |= WEEKEND
    if _NO_WEEKDAY_RE.search(t):
        res["banned_days"] |= WEEKDAYS

    # Specific days: "no class on monday", "avoid mon", "not on tuesdays"
    for match in _DAY_BAN_RE.finditer(t):
        res["banned_days"].add(DAY_ALIASES[match.group("day")])

    # Clock-time bounds. Direction table:
    #   after X / not before X / no earlier than X -> no_before
    #   before X / not after X / no later than X   -> no_after
    for match in _TIME_BOUND_RE.finditer(t):
        is_before = match.group("kw").startswith(("before", "earlier"))
        negated = match.group("neg") is not None
        bound = "no_before" if is_before == negated else "no_after"
        if res[bound] is not None:
            continue  # first mention wins
        try:
            res[bound] = _norm_ampm(
                match.group("hour"), match.group("minute"), match.group("ampm")
            )
        except ValueError:
            continue  # e.g. "after 99": ignore rather than crash

    # "mornings / afternoons / evenings" shortcuts, with negation handled
    # explicitly so "no evenings" does not also count as "evenings".
    for word, wanted_key, unwanted_key, boundary in _PART_OF_DAY_RULES:
        if not re.search(rf"\b{word}s?\b", t):
            continue
        negated = re.search(rf"\b{_PART_OF_DAY_NEGATION}{word}s?\b", t)
        key = unwanted_key if negated else wanted_key
        if res[key] is None:
            res[key] = boundary

    return res


# Robust day parsing for phrases like "no class on monday", "avoid mon", "not on mondays", etc.
# NOTE: DAY_ALIASES is defined once, next to the deterministic constraint
# parser near the top of this module. The byte-identical duplicate that
# used to be repeated here was removed.

_FREE_TEXT_TRIGGERS = (
    "no", "avoid", "except", "skip", "without",
    "not on", "exclude", "ban", "block", "never on",
)
# One compiled pattern for every trigger/day combination, e.g.
# r"\b(?:no|avoid|...)\s+(?:class(?:es)?\s*)?(?:on\s*)?(?P<day>mondays|monday|mon|...)\b".
# "class(es)" and "on" are both optional, so "no mon" is covered too.
_FREE_TEXT_BAN_RE = re.compile(
    r"\b(?:" + "|".join(re.escape(trigger) for trigger in _FREE_TEXT_TRIGGERS) + r")"
    r"\s+(?:class(?:es)?\s*)?(?:on\s*)?"
    r"(?P<day>"
    + "|".join(sorted((re.escape(alias) for alias in DAY_ALIASES), key=len, reverse=True))
    + r")\b"
)


def extract_banned_days_free_text(text: str):
    """Return the set of day codes the user asked to avoid.

    Catches broad natural-language variations such as "no class on monday",
    "no monday", "avoid mon", "not on mondays", "skip monday" and
    "except monday". Returns abbreviations like {"Mon", "Sun"}; an empty
    set when ``text`` is empty or mentions no banned day.
    """
    if not text:
        return set()
    return {
        DAY_ALIASES[match.group("day")]
        for match in _FREE_TEXT_BAN_RE.finditer(text.lower())
    }


df = pd.DataFrame(DATASET)

# ---------- CONSTANTS ----------
SUBJECTS = sorted(df["subject"].unique().tolist())
DAY_MAP = {
    "Sun": "Sunday", "Mon": "Monday", "Tue": "Tuesday", "Wed": "Wednesday",
    "Thu": "Thursday", "Fri": "Friday", "Sat": "Saturday",
}
DAYS_AXIS = ["Sunday", "Monday", "Tuesday", "Wednesday", "Thursday", "Friday", "Saturday"]
TIME_FMT = "%I:%M %p"  # e.g., 08:00 AM
DETAIL_COLUMNS = ["class_id", "name", "professor", "days", "times", "subject"]

# Whole-word day names; without the \b anchors "sunny" or "money" ban a day.
_DAY_WORD_RE = re.compile(
    r"\b(sundays?|mondays?|tuesdays?|wednesdays?|thursdays?|fridays?|saturdays?"
    r"|sun|mon|tue|wed|thu|fri|sat)\b"
)
_NO_CLASSES_BEFORE_RE = re.compile(
    r"no classes before ([0-9]{1,2})(?::([0-9]{2}))?\s*(am|pm)"
)
_NO_CLASSES_AFTER_RE = re.compile(
    r"no classes after ([0-9]{1,2})(?::([0-9]{2}))?\s*(am|pm)"
)


# ---------- HELPERS ----------
def parse_time_range(timestr: str):
    """Split "08:00 AM - 09:30 AM" into (start, end) datetimes.

    Raises ValueError if the string is not exactly two TIME_FMT times
    separated by "-".
    """
    start_s, end_s = [part.strip() for part in timestr.split("-")]
    return datetime.strptime(start_s, TIME_FMT), datetime.strptime(end_s, TIME_FMT)


def to_hours(t: datetime) -> float:
    """Convert a time of day to fractional hours (e.g. 9:30 -> 9.5)."""
    return t.hour + t.minute / 60.0


def block_overlaps(a, b) -> bool:
    """Return True if half-open intervals ``a`` and ``b`` overlap.

    Back-to-back blocks (one ends exactly when the other starts) do not
    count as overlapping.
    """
    start_a, end_a = a
    start_b, end_b = b
    return (start_a < end_b) and (start_b < end_a)


def class_record_to_blocks(row_dict):
    """Expand one class record into per-day timetable blocks.

    Reads ``row_dict["times"]`` and the comma-separated ``row_dict["days"]``.
    Returns a list of ``(full_day_name, (start_hour, end_hour), row_dict)``
    tuples; day codes not present in DAY_MAP are skipped.
    """
    start_dt, end_dt = parse_time_range(row_dict["times"])
    span = (to_hours(start_dt), to_hours(end_dt))
    blocks = []
    for code in row_dict["days"].split(","):
        code = code.strip()
        if code in DAY_MAP:
            blocks.append((DAY_MAP[code], span, row_dict))
    return blocks


def _keep_rows(frame: pd.DataFrame, column: str, predicate) -> pd.DataFrame:
    """Return the rows of ``frame`` whose ``column`` value satisfies ``predicate``.

    The mask is cast to bool explicitly so the indexing also works when
    ``frame`` is already empty.
    """
    mask = frame[column].map(predicate).astype(bool)
    return frame[mask]


def _clock_to_hours(hour_s: str, minute_s, ampm: str) -> float:
    """Convert regex groups (hour, optional minute, am/pm) to 24h fractional hours."""
    hour = int(hour_s)
    minute = int(minute_s) if minute_s else 0
    ampm = ampm.lower()
    if ampm == "pm" and hour != 12:
        hour += 12
    if ampm == "am" and hour == 12:
        hour = 0
    return hour + minute / 60.0


def filter_by_constraints(df_in: pd.DataFrame, instructions: str) -> pd.DataFrame:
    """Filter a class table using a few fixed English phrasings.

    Recognizes "no classes on <days>" / "don't give me classes on <days>"
    (every day named anywhere in the text is banned), plus
    "no classes before H[:MM] am/pm" and "no classes after H[:MM] am/pm".
    Returns a filtered copy; ``df_in`` is not modified.
    """
    filtered = df_in.copy()
    text = (instructions or "").lower().replace("’", "'")

    # Days off (e.g., "Don't give me classes on Sundays")
    day_ban_phrases = (
        "no classes on",
        "don't give me classes on",
        "dont give me classes on",
    )
    if any(phrase in text for phrase in day_ban_phrases):
        banned = {
            word[:3].title()
            for word in _DAY_WORD_RE.findall(text)
            if word[:3].title() in DAY_MAP
        }
        if banned:
            filtered = _keep_rows(
                filtered,
                "days",
                lambda s: banned.isdisjoint(code.strip() for code in s.split(",")),
            )

    # Time constraints (e.g., "no classes before 10 AM", "no classes after 6 PM")
    before = _NO_CLASSES_BEFORE_RE.search(text)
    after = _NO_CLASSES_AFTER_RE.search(text)
    if before:
        min_start = _clock_to_hours(*before.groups())
        filtered = _keep_rows(
            filtered, "times", lambda t: to_hours(parse_time_range(t)[0]) >= min_start
        )
    if after:
        max_end = _clock_to_hours(*after.groups())
        filtered = _keep_rows(
            filtered, "times", lambda t: to_hours(parse_time_range(t)[1]) <= max_end
        )
    return filtered


def _try_build_schedule(candidates: Dict[str, list], demand: Dict[str, int], rng: random.Random):
    """Make one randomized greedy attempt at satisfying ``demand``.

    ``candidates`` maps subject -> list of ``(record, blocks)`` pairs.
    Subjects are served round-robin so one subject cannot take every free
    slot before the others get a turn.

    Returns ``(chosen_records, complete)``; ``complete`` is True when every
    requested count was met.
    """
    remaining = {subject: count for subject, count in demand.items() if count > 0}
    order = list(remaining)
    rng.shuffle(order)

    chosen: List[dict] = []
    chosen_ids = set()
    busy: Dict[str, list] = {}  # day name -> list of occupied (start, end)

    progress = True
    while progress and any(count > 0 for count in remaining.values()):
        progress = False
        for subject in order:
            if remaining[subject] <= 0:
                continue
            options = list(candidates.get(subject, ()))
            rng.shuffle(options)
            for record, blocks in options:
                if record["class_id"] in chosen_ids:
                    continue
                clashes = any(
                    block_overlaps(span, taken)
                    for day, span, _ in blocks
                    for taken in busy.get(day, ())
                )
                if clashes:
                    continue
                chosen.append(record)
                chosen_ids.add(record["class_id"])
                for day, span, _ in blocks:
                    busy.setdefault(day, []).append(span)
                remaining[subject] -= 1
                progress = True
                break

    return chosen, all(count <= 0 for count in remaining.values())


def pick_schedules(df_pool: pd.DataFrame, demand: Dict[str, int], max_attempts=500) -> List[List[dict]]:
    """Build up to three distinct, conflict-free schedule options.

    Args:
        df_pool: candidate classes; needs the columns "subject", "class_id",
            "days" and "times".
        demand: subject -> number of classes wanted.
        max_attempts: randomized attempts allowed per option.

    Returns:
        A list of 1-3 schedules, each a list of class-record dicts. When the
        demand cannot be met in full, the largest partial schedule found is
        returned instead. Options are distinct (by set of class ids) and never
        smaller than the first one. The list always has at least one entry,
        which may be empty. The RNG seed is fixed, so the same inputs produce
        the same options.
    """
    rng = random.Random(123)

    # Parse each class's time blocks once instead of on every conflict check.
    candidates: Dict[str, list] = {}
    for record in df_pool.to_dict("records"):
        candidates.setdefault(record["subject"], []).append(
            (record, class_record_to_blocks(record))
        )

    schedules: List[List[dict]] = []
    seen = set()
    for _ in range(3):
        best = None
        for _attempt in range(max_attempts):
            rows, complete = _try_build_schedule(candidates, demand, rng)
            key = frozenset(row["class_id"] for row in rows)
            if key in seen:
                continue  # identical to an option we already offer
            if complete:
                best = rows
                break
            if best is None or len(rows) > len(best):
                best = rows
        if best is None:
            continue  # nothing new found for this option
        if schedules and len(best) < len(schedules[0]):
            continue  # do not offer an alternative worse than option 1
        seen.add(frozenset(row["class_id"] for row in best))
        schedules.append(best)

    return schedules or [[]]


def draw_timetable(schedule_rows: List[dict], title: str):
    """Render a weekly timetable and return it as an RGB uint8 numpy array.

    Days run along the top (Sunday..Saturday) and hours 8-21 run down the
    page. Each class is drawn as one coloured rectangle per meeting day,
    labelled with ``row["name"]`` and ``row["professor"]``.
    """
    # Use a standalone Figure instead of pyplot: pyplot keeps global figure
    # state, which is unsafe in concurrent server callbacks and leaks the
    # figure if drawing raises before plt.close().
    from matplotlib.backends.backend_agg import FigureCanvasAgg
    from matplotlib.figure import Figure

    fig = Figure(figsize=(10, 7), dpi=150)
    canvas = FigureCanvasAgg(fig)
    ax = fig.add_subplot(111)

    ax.set_xlim(0, 7)
    ax.set_ylim(8, 21)

    # Put days on TOP, not bottom
    ax.set_xticks(range(7))
    ax.set_xticklabels(DAYS_AXIS)
    ax.xaxis.tick_top()
    ax.xaxis.set_label_position("top")
    ax.tick_params(axis="x", which="both", bottom=False, top=True,
                   labelbottom=False, labeltop=True)

    ax.set_yticks(range(8, 22, 1))
    ax.set_ylabel("Time")
    ax.set_title(title, pad=20)

    for x in range(8):
        ax.axvline(x, linewidth=0.5)
    for y in range(8, 22):
        ax.axhline(y, linewidth=0.3)

    # Fixed seed: the same schedule always gets the same colours.
    colors = np.random.default_rng(42).random((len(schedule_rows), 3))

    for color, row in zip(colors, schedule_rows):
        for day, (start_h, end_h), _ in class_record_to_blocks(row):
            if day not in DAYS_AXIS:
                continue
            x = DAYS_AXIS.index(day)
            rect = Rectangle(
                (x + 0.05, start_h + 0.02), 0.9, (end_h - start_h) - 0.04,
                linewidth=0.8, edgecolor="black", facecolor=color, alpha=0.8,
            )
            ax.add_patch(rect)
            ax.text(x + 0.07, start_h + 0.1, f"{row['name']}\n{row['professor']}",
                    fontsize=7, va="top", wrap=True)

    ax.invert_yaxis()  # earliest hour at the top
    ax.set_facecolor("white")
    fig.tight_layout()

    canvas.draw()
    return np.asarray(canvas.buffer_rgba())[..., :3].copy()  # drop alpha


def schedule_details_table(rows: List[dict]) -> pd.DataFrame:
    """Return the details table (DETAIL_COLUMNS) for one schedule."""
    if not rows:
        return pd.DataFrame(columns=DETAIL_COLUMNS)
    return pd.DataFrame(rows).reindex(columns=DETAIL_COLUMNS)


# ---------- UI CALLBACKS ----------
def _ensure_array_table(tbl):
    """Gradio Dataframe can return None or pandas; normalize to list-of-lists.

    Rows are copied so callers can edit the result without mutating the
    value Gradio handed in.
    """
    if tbl is None:
        return []
    if isinstance(tbl, pd.DataFrame):
        return tbl.values.tolist()
    return [list(row) for row in tbl]


def _coerce_count(value) -> int:
    """Turn a table cell into a non-negative int; anything unparsable is 0.

    Goes through float() because a "number" column can hand back 2.0 or
    "2.0", which ``str(...).isdigit()`` would count as 0.
    """
    try:
        return max(0, int(float(value)))
    except (TypeError, ValueError, OverflowError):
        return 0


def _total_classes(tbl) -> int:
    """Sum the Count column of a normalized subject table."""
    return sum(_coerce_count(row[1]) for row in tbl if len(row) > 1)


def add_subject(tbl, subject):
    """Add ``subject`` to the table, or bump its count if already present.

    Returns ``(table, dropdown_update, total_text)``; the dropdown is reset
    to empty. With no subject selected the table is returned unchanged.
    """
    tbl = _ensure_array_table(tbl)
    if subject:
        for row in tbl:
            if len(row) > 1 and row[0] == subject:
                row[1] = _coerce_count(row[1]) + 1
                break
        else:
            tbl.append([subject, 1])
    return tbl, gr.update(value=None), f"Total classes: {_total_classes(tbl)}"


def update_total(tbl):
    """Recompute the "Total classes" label after the table is edited."""
    return f"Total classes: {_total_classes(_ensure_array_table(tbl))}"


def _empty_generate_result():
    """Outputs for ``generate`` when there is nothing to schedule."""
    blank = draw_timetable([], "Schedule option 1 (empty)")
    return (
        blank, "Schedule option 1", [], 0,
        gr.update(visible=False), gr.update(visible=False),
        gr.update(visible=False), gr.update(visible=False),
    )


def _constraint_hour(value) -> float | None:
    """Parse an "H:MM AM/PM" constraint to fractional hours.

    Returns None when the constraint is absent or unparsable, so a bad
    value disables that filter instead of crashing the callback.
    """
    if not value:
        return None
    try:
        return to_hours(datetime.strptime(value.strip(), TIME_FMT))
    except ValueError:
        return None


def generate(tbl, instructions):
    """Build schedule options from the subject table and free-text instructions.

    Returns, in output order: timetable image, title, list of schedules,
    current index, and visibility updates for the previous button, next
    button, details button and details table.
    """
    tbl = _ensure_array_table(tbl)

    # Build demand from the left table; blank rows and zero counts are ignored.
    demand: Dict[str, int] = {}
    for row in tbl:
        if len(row) < 2:
            continue
        subject, count = row[0], _coerce_count(row[1])
        if subject is None or not str(subject).strip() or count <= 0:
            continue
        demand[subject] = demand.get(subject, 0) + count

    # If user didn't select anything, show empty grid + hide controls
    if not demand:
        return _empty_generate_result()

    # --- Deterministic parse of free text ---
    det = parse_det_constraints(instructions or "")

    # --- Apply deterministic filters to the pool ---
    pool = df.copy()

    banned_days = set(det["banned_days"])
    if banned_days:
        pool = _keep_rows(
            pool,
            "days",
            lambda s: banned_days.isdisjoint(code.strip() for code in s.split(",")),
        )

    earliest_start = _constraint_hour(det["no_before"])
    if earliest_start is not None:
        pool = _keep_rows(
            pool, "times", lambda t: to_hours(parse_time_range(t)[0]) >= earliest_start
        )

    latest_end = _constraint_hour(det["no_after"])
    if latest_end is not None:
        pool = _keep_rows(
            pool, "times", lambda t: to_hours(parse_time_range(t)[1]) <= latest_end
        )

    # --- Build the schedule options and render option 1 ---
    scheds = pick_schedules(pool, demand)
    idx = 0
    rows = scheds[idx] if scheds else []
    title = f"Schedule option {idx+1}"
    img = draw_timetable(rows, title)

    prev_vis = gr.update(visible=False)  # first page
    next_vis = gr.update(visible=len(scheds) > 1)
    details_vis = gr.update(visible=True)
    hide_details_table = gr.update(visible=False)  # reset

    return img, title, scheds, idx, prev_vis, next_vis, details_vis, hide_details_table


def step(direction, scheds, idx):
    """Move to the next/previous schedule, wrapping around at either end.

    Returns ``(image, title, index, prev_button_update, next_button_update)``.
    Any ``direction`` other than "next" moves backwards.
    """
    if not scheds:
        return gr.update(), "", idx, gr.update(visible=False), gr.update(visible=False)

    delta = 1 if direction == "next" else -1
    idx = (idx + delta) % len(scheds)

    title = f"Schedule option {idx+1}"
    img = draw_timetable(scheds[idx], title)
    # once you start navigating, show both buttons
    return img, title, idx, gr.update(visible=True), gr.update(visible=True)


def get_details(scheds, idx):
    """Return the details table for schedule ``idx`` (empty if out of range)."""
    rows = scheds[idx] if (scheds and 0 <= idx < len(scheds)) else []
    return schedule_details_table(rows)


# ---------- UI ----------
CUSTOM_CSS = """
:root { --radius: 16px; }
#container { max-width: 1400px; margin: 0 auto; }
.card { border: 1px solid #e5e7eb; border-radius: var(--radius); padding: 16px; background: white; box-shadow: 0 6px 24px rgba(0,0,0,0.04); }
.split { display: grid; grid-template-columns: 1fr 1fr; gap: 16px; align-items: start; }
.totals { font-weight: 600; }
.gr-accordion-header { font-weight: 600; }
#custom-instructions-label { position: relative; display: inline-block; cursor: pointer; }
"""

with gr.Blocks(css=CUSTOM_CSS) as demo:
    gr.Markdown("# Class Schedule Generator")

    with gr.Row(elem_id="container"):
        # LEFT: inputs
        with gr.Column(scale=1, min_width=480, elem_classes=["card"]):
            subject_dropdown = gr.Dropdown(
                SUBJECTS,
                label="Select your subjects",
                value=None,
                allow_custom_value=False
            )
            add_btn = gr.Button("➕ Add subject")

            subject_table = gr.Dataframe(
                headers=["Subject", "Count"],
                datatype=["str", "number"],
                type="array",  # returns list-of-lists
                value=[],
                row_count=(0, "dynamic"),
                col_count=2,
                interactive=True,
                label="Selected subjects & counts"
            )
            total_text = gr.Markdown("Total classes: 0", elem_classes=["totals"])

            # --- Custom instructions with accordion examples (tooltip removed) ---
            gr.Markdown("### 🤖 Custom instructions")
            custom_instructions = gr.Textbox(
                label="",
                placeholder="Don't give me classes on Sundays",
                lines=2
            )

            EXAMPLE_PROMPTS = [
                "No classes on Mondays",
                "Only start after 10 AM",
                "Avoid Fridays, no weekends",
                "Weekdays only",
                "No class on Sundays and only start after 10 AM",
                "Avoid Monday and avoid Friday; end before 3 PM",
                "Weekends only and mornings only",
                "Evenings only",
            ]

            with gr.Accordion("See example prompts ▼", open=False):
                with gr.Row():
                    with gr.Column():  # left column
                        ex_btns_left = [
                            gr.Button(EXAMPLE_PROMPTS[i])
                            for i in range(0, len(EXAMPLE_PROMPTS), 2)
                        ]
                    with gr.Column():  # right column
                        ex_btns_right = [
                            gr.Button(EXAMPLE_PROMPTS[i])
                            for i in range(1, len(EXAMPLE_PROMPTS), 2)
                        ]
            # --- end Custom instructions block ---

            generate_btn = gr.Button("✨ Generate schedule", variant="primary")

        # RIGHT: output
        with gr.Column(scale=1, min_width=480, elem_classes=["card"]):
            schedule_title = gr.Markdown("Schedule option 1")
            empty_img = draw_timetable([], "Schedule option 1")
            timetable_img = gr.Image(value=empty_img, label=None, interactive=False)

            with gr.Row():
                prev_btn = gr.Button("◀ Previous", visible=False)
                next_btn = gr.Button("Next ▶", visible=False)

            details_btn = gr.Button("See full class details", visible=False)

            # Inline details table (replaces modal)
            details_table = gr.Dataframe(
                headers=["class_id", "name", "professor", "days", "times", "subject"],
                interactive=False,
                visible=False,
                label="Selected classes"
            )

    # STATE
    schedules_state = gr.State([])
    index_state = gr.State(0)

    # Fill the textbox when an example is clicked
    def _fill_prompt(txt: str):
        return gr.update(value=txt)

    for btn in (ex_btns_left + ex_btns_right):
        # capture the label text per-button (default arg avoids late binding)
        btn.click(lambda t=btn.value: _fill_prompt(t), outputs=[custom_instructions])

    # EVENTS (must be inside Blocks)
    add_btn.click(
        add_subject,
        inputs=[subject_table, subject_dropdown],
        outputs=[subject_table, subject_dropdown, total_text]
    )
    subject_table.change(update_total, inputs=[subject_table], outputs=[total_text])

    generate_btn.click(
        generate,
        inputs=[subject_table, custom_instructions],
        outputs=[timetable_img, schedule_title, schedules_state, index_state,
                 prev_btn, next_btn, details_btn, details_table]
    )

    prev_btn.click(
        lambda s, i: step("prev", s, i),
        inputs=[schedules_state, index_state],
        outputs=[timetable_img, schedule_title, index_state, prev_btn, next_btn]
    )
    next_btn.click(
        lambda s, i: step("next", s, i),
        inputs=[schedules_state, index_state],
        outputs=[timetable_img, schedule_title, index_state, prev_btn, next_btn]
    )

    # Show details inline (no modal)
    details_btn.click(
        lambda s, i: gr.update(visible=True, value=get_details(s, i)),
        inputs=[schedules_state, index_state],
        outputs=[details_table]
    )

# ---- RUN ----
if __name__ == "__main__":
    demo.launch()