Spaces:

avid-ml
/

indie-label

Runtime error

indie-label / indie_label_svelte /src /Auditing.svelte

Michelle Lam

Refreshes overall plot when model is edited. Uses user ID in preds_df. Exports reports and chart to json. Streamlines performance plot and description.

c55019b about 1 year ago

raw

history blame

16.5 kB

	<script lang="ts">
	import { onMount } from "svelte";
	import Section from "./Section.svelte";
	import KeywordSearch from "./KeywordSearch.svelte";
	import OverallResults from "./OverallResults.svelte";
	import ClusterResults from "./ClusterResults.svelte";
	import HelpTooltip from "./HelpTooltip.svelte";
	import TopicTraining from "./TopicTraining.svelte";

	import { error_type } from './stores/error_type_store.js';
	import { topic_chosen } from './stores/cur_topic_store.js';
	import { model_chosen } from './stores/cur_model_store.js';

	import Button, { Label } from "@smui/button";
	import LinearProgress from "@smui/linear-progress";
	import LayoutGrid, { Cell } from "@smui/layout-grid";
	import Radio from '@smui/radio';
	import FormField from '@smui/form-field';
	import{ Wrapper } from '@smui/tooltip';
	import IconButton from '@smui/icon-button';
	import Svelecte from '../node_modules/svelecte/src/Svelecte.svelte';

	export let personalized_model;
	export let cur_error_type = "Both";
	export let cur_user;

	let evidence = [];
	let show_audit_settings = false;

	let error_type_options = [
	{
	"opt": 'Both',
	"descr": '(System is under- or over-sensitive)',
	"help": "View both types of potential system errors"
	},
	{
	"opt": 'System is under-sensitive',
	"descr": '(Incorrectly rates as non-toxic)',
	"help": "Focus on system errors where the system labeled content as Non-toxic when it should have been labeled as Toxic."
	},
	{
	"opt": 'System is over-sensitive',
	"descr": '(Incorrectly rates as toxic)',
	"help": "Focus on system errors where the system labeled content as Toxic when it should have been labeled as Non-toxic."
	},
	{
	"opt": 'Show errors and non-errors',
	"descr": '',
	"help": "Also show cases that are not likely to be potential errors"
	},
	]

	let personalized_models = [];
	let systems = ["YouSocial comment toxicity classifier"]; // Only one system for now
	let clusters = [];
	let clusters_for_tuning = []
	let promise = Promise.resolve(null);

	// Handle routing
	let searchParams = new URLSearchParams(window.location.search);
	let scaffold_method = searchParams.get("scaffold");
	let mode = searchParams.get("mode");
	let topic_vis_method = searchParams.get("topic_vis_method");

	// Set audit type
	let audit_types = [
	"All topic exploration",
	"Single topic exploration"
	];
	let audit_type;
	if (scaffold_method == "fixed" \|\| scaffold_method == "personal" \|\| scaffold_method == "personal_group" \|\| scaffold_method == "personal_test" \|\| scaffold_method == "personal_cluster" \|\| scaffold_method == "topic_train" \|\| scaffold_method == "prompts") {
	audit_type = audit_types[1];
	} else {
	// No scaffolding mode or tutorial
	audit_type = audit_types[0];
	}

	let show_topic_training = false;
	if (scaffold_method == "topic_train") {
	show_topic_training = true;
	}

	// Handle non-model mode
	let use_model = true;
	if (mode == "no_model") {
	use_model = false;
	cur_error_type = "Show errors and non-errors";
	}

	// Handle group model
	let use_group_model = false;
	if (scaffold_method == "personal_group") {
	use_group_model = true;
	}

	let promise_cluster = Promise.resolve(null);

	// Get current topic from store
	let topic;
	topic_chosen.subscribe(value => {
	topic = value;
	handleClusterButton(); // re-render cluster results
	});

	// Get current model from store
	model_chosen.subscribe(value => {
	personalized_model = value;
	// Add to personalized_models if not there
	if (!personalized_models.includes(personalized_model)) {
	personalized_models.push(personalized_model);
	}
	getAuditResults();
	});

	// Save current error type
	async function updateErrorType() {
	error_type.update((value) => cur_error_type);
	handleAuditButton();
	handleClusterButton();
	}

	async function updateTopicChosen() {
	if (topic != null) {
	topic_chosen.update((value) => topic);
	}
	}

	function getAuditResults() {
	let req_params = {
	user: cur_user,
	scaffold_method: scaffold_method,
	};
	let params = new URLSearchParams(req_params).toString();
	fetch("./audit_settings?" + params)
	.then((r) => r.text())
	.then(function (r_orig) {
	let r = JSON.parse(r_orig);
	personalized_models = r["personalized_models"];
	if (use_group_model) {
	let personalized_model_grp = r["personalized_model_grp"];
	personalized_model = personalized_model_grp[0];
	} else {
	personalized_model = personalized_models[0]; // TEMP
	}

	model_chosen.update((value) => personalized_model);
	clusters = r["clusters"];
	clusters_for_tuning = r["clusters_for_tuning"];
	topic = clusters[0]["options"][0]["text"];
	topic_chosen.update((value) => topic);
	handleAuditButton();
	handleClusterButton();
	});
	}
	onMount(async () => {
	getAuditResults();
	});

	function handleAuditButton() {
	model_chosen.update((value) => personalized_model);
	if (personalized_model == "" \|\| personalized_model == undefined) {
	return;
	}
	promise = getAudit(personalized_model);
	}

	async function getAudit(pers_model) {
	let req_params = {
	pers_model: pers_model,
	perf_metric: "avg_diff",
	breakdown_sort: "difference",
	n_topics: 10,
	error_type: "Both", // Only allow both error types
	cur_user: cur_user,
	topic_vis_method: topic_vis_method,
	};
	let params = new URLSearchParams(req_params).toString();
	const response = await fetch("./get_audit?" + params);
	const text = await response.text();
	const data = JSON.parse(text);
	return data;
	}

	function handleClusterButton() {
	promise_cluster = getCluster(personalized_model);
	}

	async function getCluster(pers_model) {
	if (pers_model == "" \|\| pers_model == undefined) {
	return null;
	}
	let req_params = {
	cluster: topic,
	topic_df_ids: [],
	cur_user: cur_user,
	pers_model: pers_model,
	example_sort: "descending", // TEMP
	comparison_group: "status_quo", // TEMP
	search_type: "cluster",
	keyword: "",
	error_type: cur_error_type,
	use_model: use_model,
	scaffold_method: scaffold_method,
	};
	let params = new URLSearchParams(req_params).toString();
	const response = await fetch("./get_cluster_results?" + params);
	const text = await response.text();
	const data = JSON.parse(text);
	return data;
	}
	</script>

	<div>
	<!-- 0: Audit settings -->
	<div>
	<div style="margin-top: 30px">
	<span class="head_3">Auditing</span>
	</div>
	<div style="width: 80%">
	{#if personalized_model}
	<p>In this section, we'll be auditing the content moderation system. Here, you’ll be aided by a personalized model that will help direct your attention towards potential problem areas in the model’s performance. This model isn’t meant to be perfect, but is designed to help you better focus on areas that need human review.</p>
	{:else}
	<p>Please first train your personalized model by following the steps in the "Labeling" tab (click the top left tab above).</p>
	{/if}
	</div>

	{#if show_audit_settings}
	<div class="audit_section">
	<div class="head_5">Audit settings</div>
	<div style="width: 50%">
	<p>Choose your audit settings here. These settings will affect all of the visualizations that follow, so you can return back here to make changes.</p>
	</div>
	<div class="section_indent">
	<Section
	section_id="systems"
	section_title="What status-quo system would you like to audit?"
	section_opts={systems}
	bind:value={systems[0]}
	width_pct={40}
	/>
	{#key personalized_model}
	<Section
	section_id="personalized_model"
	section_title="What model would you like to use to represent your views?"
	section_opts={personalized_models}
	bind:value={personalized_model}
	width_pct={40}
	on:change
	/>
	{/key}

	<Section
	section_id="audit_type"
	section_title="What type of audit are you conducting?"
	section_opts={audit_types}
	bind:value={audit_type}
	width_pct={40}
	on:change
	/>

	<LayoutGrid>
	<Cell span={7}>
	<Button
	on:click={handleAuditButton}
	variant="outlined"
	class="button_float_right"
	>
	<Label>Start your audit</Label>
	</Button>
	</Cell>
	</LayoutGrid>
	</div>
	</div>
	{/if}
	{#if personalized_model}
	<p>Current model: {personalized_model}</p>
	{/if}
	</div>

	<!-- 1: All topics overview -->
	{#if personalized_model}
	{#if audit_type == audit_types[0]}
	<div class="audit_section">
	<div class="head_5">Overview of all topics</div>
	<p>First, browse the system performance by different auto-generated comment topic areas.</p>

	<div class="section_indent">
	{#await promise}
	<div class="app_loading">
	<LinearProgress indeterminate />
	</div>
	{:then audit_results}
	{#if audit_results}
	<OverallResults
	data={audit_results}
	clusters={clusters}
	personalized_model={personalized_model}
	cluster={topic}
	/>
	{/if}
	{:catch error}
	<p style="color: red">{error.message}</p>
	{/await}
	</div>
	</div>
	{/if}

	<!-- 2a: Topic training -->
	{#if show_topic_training}
	<div class="audit_section">
	<div class="head_5">Topic model training</div>
	<p></p>
	<div class="section_indent">
	<div>
	<p>In what topic area would you like to tune your model?</p>
	<Svelecte
	options={clusters_for_tuning}
	labelAsValue={true}
	bind:value={topic}
	placeholder="Select topic"
	on:change={null}
	style="width: 50%"
	>
	</Svelecte>
	</div>

	<div style="padding-top: 30px">
	<!-- Labeling -->
	<h6>Comments to label</h6>
	<ul>
	<li>
	Comments with scores <b>0</b> and <b>1</b> will be allowed to <b>remain</b> on the platform.
	</li>
	<li>
	Comments with scores <b>2</b>, <b>3</b>, or <b>4</b> will be <b>deleted</b> from the platform.
	</li>
	<li>
	Given that some comments may lack context, if you're not sure, feel free to mark the <b>unsure</b> option to skip a comment.
	</li>
	</ul>
	{#key topic}
	<TopicTraining topic={topic} cur_user={cur_user}/>
	{/key}
	</div>

	</div>
	</div>
	{/if}

	<!-- 2: Topic overview -->
	<div class="audit_section">
	<div class="head_5">Topic exploration</div>
	<p></p>
	<div class="section_indent">
	<div>
	<div>
	<p><b>What topic would you like to explore further?</b></p>
	<Svelecte
	options={clusters}
	labelAsValue={true}
	bind:value={topic}
	placeholder="Select topic"
	on:change={updateTopicChosen}
	style="width: 50%"
	>
	</Svelecte>
	</div>

	{#if use_model}
	<div style="padding-top: 30px">
	<p><b>What kind of system errors do you want to focus on?</b></p>
	{#each error_type_options as e}
	<div style="display: flex; align-items: center;">
	<Wrapper rich>
	<FormField>
	<Radio bind:group={cur_error_type} value={e.opt} on:change={updateErrorType} color="secondary" />
	<span slot="label">
	<b>{e.opt}</b> {e.descr}
	<IconButton class="material-icons" size="button" disabled>help_outline</IconButton>
	</span>
	</FormField>
	<HelpTooltip text={e.help} />
	</Wrapper>
	</div>
	{/each}
	</div>
	{/if}
	</div>

	<div style="padding-top: 30px">
	{#await promise_cluster}
	<div class="app_loading">
	<LinearProgress indeterminate />
	</div>
	{:then cluster_results}
	{#if cluster_results}
	{#if topic}
	<ClusterResults
	cluster={topic}
	clusters={clusters}
	model={personalized_model}
	data={cluster_results}
	table_width_pct={100}
	table_id={"main"}
	use_model={use_model}
	bind:evidence={evidence}
	on:change
	/>
	{/if}
	{/if}
	{:catch error}
	<p style="color: red">{error.message}</p>
	{/await}
	</div>

	</div>
	</div>

	<!-- 3: Gather evidence -->
	<div class="audit_section">
	<div class="head_5">Gather additional evidence</div>
	<p>Next, you can optionally search for more comments to serve as evidence through manual keyword search (for individual words or phrases).</p>
	<div class="section_indent">
	{#key error_type}
	<KeywordSearch clusters={clusters} personalized_model={personalized_model} cur_user={cur_user} bind:evidence={evidence} use_model={use_model} on:change/>
	{/key}
	</div>
	</div>

	<!-- 4: Test hunch -->
	<div class="audit_section">
	<div class="head_5">Finalize your current report</div>
	<p>Finally, review the report you've generated on the side panel and provide a brief summary of the problem you see. You may also list suggestions or insights into addressing this problem if you have ideas. This report will be directly used by the model developers to address the issue you've raised</p>
	</div>
	{/if}
	</div>

	<style>
	</style>