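# JWST multimodal search demo: stream image cutouts from the
# MultimodalUniverse/jwst dataset, embed them with CLIP, and serve
# text/image similarity search plus a guided Precision@K evaluation panel.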
import gradio as gr
from datasets import load_dataset
from itertools import islice
import numpy as np
from PIL import Image
import torch
from transformers import CLIPModel, CLIPProcessor
import torch.nn.functional as F
import json, time
# ---------- utils ----------
def flux_to_gray(flux_array):
    a = np.array(flux_array, dtype=np.float32)
    a = np.squeeze(a)
    if a.ndim == 3:
        # collapse a channel axis, assumed to be the smallest dimension
        axis = int(np.argmin(a.shape))
        a = np.nanmean(a, axis=axis)
    a = np.nan_to_num(a, nan=0.0, posinf=0.0, neginf=0.0)
    # robust contrast stretch: map the 1st-99th percentile range to [0, 1]
    lo = np.nanpercentile(a, 1)
    hi = np.nanpercentile(a, 99)
    if not np.isfinite(lo) or not np.isfinite(hi) or hi <= lo:
        lo, hi = float(np.nanmin(a)), float(np.nanmax(a))
    norm = np.clip((a - lo) / (hi - lo + 1e-9), 0, 1)
    arr = (norm * 255).astype(np.uint8)
    return Image.fromarray(arr, mode="L")
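# Usage sketch (the array below is a made-up stand-in; real flux cutouts come
# from the dataset records streamed in build_index):
#   demo_flux = np.random.rand(64, 64).astype(np.float32)
#   gray = flux_to_gray(demo_flux)   # PIL Image, mode "L", values 0-255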
# ---------- model ----------
model_id = "openai/clip-vit-base-patch32"
model = CLIPModel.from_pretrained(model_id)
processor = CLIPProcessor.from_pretrained(model_id)
model.eval()
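# ViT-B/32 CLIP embeds images and text into a shared 512-dimensional space,
# so one index serves both query types; eval() disables dropout so the
# features are deterministic.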
# ---------- in-memory index ----------
INDEX = {
"feats": None, # torch.Tensor [N, 512]
"ids": [], # list[str]
"thumbs": [], # list[PIL.Image]
"bands": [] # list[str]
}
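# A single stacked tensor of L2-normalized features keeps search down to one
# matrix-vector product. That is plenty for a few hundred images; an
# approximate-nearest-neighbor library (e.g. FAISS) would only pay off at
# much larger N.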
def build_index(n=200):
    # stream records so nothing beyond the first n images is downloaded
    ds = load_dataset("MultimodalUniverse/jwst", split="train", streaming=True)
    feats, ids, thumbs, bands = [], [], [], []
    for rec in islice(ds, int(n)):
        pil = flux_to_gray(rec["image"]["flux"]).convert("RGB")
        t = pil.copy()
        t.thumbnail((128, 128))
        with torch.no_grad():
            inp = processor(images=pil, return_tensors="pt")
            f = model.get_image_features(**inp)  # [1, 512]
            f = F.normalize(f, p=2, dim=-1)[0]   # [512]
        feats.append(f)
        ids.append(str(rec.get("object_id")))
        bands.append(str(rec["image"].get("band")))
        thumbs.append(t)
    if not feats:
        return "No records indexed."
    INDEX["feats"] = torch.stack(feats)  # [N, 512]
    INDEX["ids"] = ids
    INDEX["thumbs"] = thumbs
    INDEX["bands"] = bands
    return f"Index built: {len(ids)} images."
def search(text_query, image_query, k=5):
    if INDEX["feats"] is None:
        return [], "Build the index first."
    with torch.no_grad():
        if text_query and str(text_query).strip():
            inputs = processor(text=[str(text_query).strip()], return_tensors="pt")
            q = model.get_text_features(**inputs)   # [1, 512]
        elif image_query is not None:
            pil = image_query.convert("RGB")
            inputs = processor(images=pil, return_tensors="pt")
            q = model.get_image_features(**inputs)  # [1, 512]
        else:
            return [], "Enter text or upload an image."
        q = F.normalize(q, p=2, dim=-1)[0]          # [512]
    # index and query are unit vectors, so the dot product is cosine similarity
    sims = (INDEX["feats"] @ q).cpu()  # [N]
    k = min(int(k), sims.shape[0])
    topk = torch.topk(sims, k=k)
    items = []
    for idx in topk.indices.tolist():
        cap = f"id: {INDEX['ids'][idx]} score: {float(sims[idx]):.3f} band: {INDEX['bands'][idx]}"
        items.append((INDEX["thumbs"][idx], cap))
    return items, f"Returned {k} results."
# ---------- evaluation helpers ----------
def _search_topk_for_eval(text_query, image_query, k=5):
    if INDEX["feats"] is None:
        return [], [], "Build the index first."
    with torch.no_grad():
        if text_query and str(text_query).strip():
            inputs = processor(text=[str(text_query).strip()], return_tensors="pt")
            q = model.get_text_features(**inputs)
        elif image_query is not None:
            pil = image_query.convert("RGB")
            inputs = processor(images=pil, return_tensors="pt")
            q = model.get_image_features(**inputs)
        else:
            return [], [], "Enter text or upload an image."
        q = F.normalize(q, p=2, dim=-1)[0]
    sims = (INDEX["feats"] @ q).cpu()
    k = min(int(k), sims.shape[0])
    topk = torch.topk(sims, k=k)
    idxs = topk.indices.tolist()
    # same thumbs and captions as search(), but the raw indices are also
    # returned so the evaluation panel can track what was shown
    items = []
    for idx in idxs:
        cap = f"id: {INDEX['ids'][idx]} score: {float(sims[idx]):.3f} band: {INDEX['bands'][idx]}"
        items.append((INDEX["thumbs"][idx], cap))
    return items, idxs, f"Eval preview: top {k} ready."
def _format_eval_summary(query, k, hits, p_at_k):
    lines = []
    lines.append(f"Query: {query or '[image query]'}")
    lines.append(f"K: {k}")
    lines.append(f"Relevant marked: {hits} of {k}")
    lines.append(f"Precision@{k}: {p_at_k:.2f}")
    lines.append("Saved to eval_runs.jsonl")
    return "\n".join(lines)
def _save_eval_run(record):
    try:
        with open("eval_runs.jsonl", "a", encoding="utf-8") as f:
            f.write(json.dumps(record) + "\n")
    except Exception:
        # best-effort logging: a read-only filesystem should not crash the UI
        pass
def _compute_avg_from_file():
    try:
        total = 0.0
        n = 0
        with open("eval_runs.jsonl", "r", encoding="utf-8") as f:
            for line in f:
                if not line.strip():
                    continue  # tolerate stray blank lines
                rec = json.loads(line)
                if "precision_at_k" in rec:
                    total += float(rec["precision_at_k"])
                    n += 1
        if n == 0:
            return "No runs recorded yet."
        return f"Macro average Precision@K across {n} runs: {total/n:.2f}"
    except FileNotFoundError:
        return "No eval_runs.jsonl yet. Run at least one evaluation."
# ---------- UI ----------
with gr.Blocks() as demo:
    gr.Markdown("JWST multimodal search: build the index, then query it with text or an example image.")
    # Build
    n = gr.Slider(50, 1000, value=200, step=10, label="How many images to index")
    build_btn = gr.Button("Build index")
    status = gr.Textbox(label="Status", lines=2)
    build_btn.click(build_index, inputs=n, outputs=status)
    # Search
    gr.Markdown("Search the index with text or an example image")
    q_text = gr.Textbox(label="Text query", placeholder="e.g., spiral galaxy")
    q_img = gr.Image(label="Image query", type="pil")
    k = gr.Slider(1, 12, value=6, step=1, label="Top K")
    search_btn = gr.Button("Search")
    gallery = gr.Gallery(label="Results", columns=6, height=300)
    info2 = gr.Textbox(label="Search status", lines=1)
    search_btn.click(search, inputs=[q_text, q_img, k], outputs=[gallery, info2])
    # ---------- Evaluation (guided) ----------
    with gr.Accordion("Evaluation", open=False):
        gr.Markdown(
            "### What this does\n"
            "We evaluate text-to-image retrieval using Precision at K.\n"
            "Steps: pick a preset or type a query, click **Run and label**, "
            "tick the results that match the rule shown, then click **Compute metrics**. "
            "Each run is saved so you can average later."
        )
        # Preset prompts with plain-English relevance rules
        PRESETS = {
            "star with spikes": "Relevant = bright point source with clear 4 to 6 diffraction spikes. Minimal extended glow.",
            "edge-on galaxy": "Relevant = thin elongated streak. Looks like a narrow line. No round diffuse blob.",
            "spiral galaxy": "Relevant = visible spiral arms or a spiral outline. Arms can be faint.",
            "diffuse nebula": "Relevant = fuzzy cloud-like structure. No sharp round core.",
            "ring or annulus": "Relevant = ring or donut shape is the main feature.",
            "two merging objects": "Relevant = two bright blobs touching or overlapping."
        }
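        # The preset text doubles as the CLIP query and, lowercased, as the
        # lookup key for its relevance rule in _run_eval_query below.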
        with gr.Row():
            preset = gr.Dropdown(choices=list(PRESETS.keys()), label="Preset query (optional)")
            eval_k = gr.Slider(1, 12, value=6, step=1, label="K for evaluation")
        eval_query = gr.Textbox(label="Evaluation query (you can edit or type your own)")
        eval_img = gr.Image(label="Evaluation image (optional)", type="pil")
        rules_md = gr.Markdown()
        run_and_label = gr.Button("Run and label this query")
        eval_gallery = gr.Gallery(label="Eval top K results", columns=6, height=300)
        relevant_picker = gr.CheckboxGroup(label="Select indices of relevant results (1..K)")
        eval_md = gr.Markdown()
        # state bag for this panel
        eval_state = gr.State({"result_indices": [], "k": 5, "query": ""})
        def _on_preset_change(name):
            if name in PRESETS:
                return gr.update(value=name), PRESETS[name]
            return gr.update(), ""
        preset.change(fn=_on_preset_change, inputs=preset, outputs=[eval_query, rules_md])
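        # gr.update() with no arguments leaves a component unchanged, so an
        # unrecognized preset clears the rule text without touching the query box.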
        # uses helper _search_topk_for_eval defined above
        def _run_eval_query(q_txt, q_img_in, k_in, state):
            items, idxs, _ = _search_topk_for_eval(q_txt, q_img_in, k_in)
            state["result_indices"] = idxs
            state["k"] = int(k_in)
            state["query"] = q_txt if (q_txt and q_txt.strip()) else "[image query]"
            choice_labels = [str(i + 1) for i in range(len(idxs))]
            help_text = PRESETS.get((q_txt or "").strip().lower(),
                                    "Mark results that match the concept you typed.")
            return (items,
                    gr.update(choices=choice_labels, value=[]),
                    f"**Relevance rule:** {help_text}\n\nThen click **Compute metrics**.",
                    state)
        run_and_label.click(
            fn=_run_eval_query,
            inputs=[eval_query, eval_img, eval_k, eval_state],
            outputs=[eval_gallery, relevant_picker, eval_md, eval_state]
        )
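        # Returning the state dict writes it back into gr.State, so the
        # metric computation below sees the K and query from this run.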
        compute_btn = gr.Button("Compute metrics")
        # uses helpers _save_eval_run and _format_eval_summary defined above
        def _compute_pk(selected_indices, state):
            k_val = int(state.get("k", 5))
            query = state.get("query", "")
            hits = len(selected_indices)
            p_at_k = hits / max(k_val, 1)
            record = {
                "ts": int(time.time()),
                "query": query,
                "k": k_val,
                "relevant_indices": sorted([int(s) for s in selected_indices]),
                "precision_at_k": p_at_k
            }
            _save_eval_run(record)
            return _format_eval_summary(query, k_val, hits, p_at_k)
        compute_btn.click(fn=_compute_pk, inputs=[relevant_picker, eval_state], outputs=eval_md)
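        # Worked example: K = 6 with 4 results ticked gives Precision@6 = 4/6 ≈ 0.67.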
        avg_btn = gr.Button("Compute average across saved runs")
        avg_md = gr.Markdown()
        avg_btn.click(fn=_compute_avg_from_file, outputs=avg_md)
demo.launch()