Spaces:

avanigupta
/

dataqa-env

Running

avanigupta Claude Opus 4.6 (1M context) committed 17 days ago

Commit

8560706

1 Parent(s): 887c1aa

fix moderation issue row collisions and verify all data

- Move out_of_range issue from row 11 (hate) to row 13 (violence) (was colliding with row 29 duplicate)
- Move duplicate from row 29 to row 30 (clean separation)
- Full audit: 46 issues across 5 tasks all verified correct
- All moderation label flips are deterministic
- 128 tests passing

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

Files changed (2) hide show

dataqa_env/server/gradio_ui.py +5 -5
dataqa_env/server/tasks.py +9 -10

dataqa_env/server/gradio_ui.py CHANGED Viewed

@@ -168,16 +168,16 @@ AGENT_TRAJECTORIES = {
                 "row:16,col:hate,issue:inconsistent_value",
                 "row:17,col:harassment,issue:inconsistent_value",
                 "row:20,col:violence,issue:inconsistent_value",
-                "row:11,col:hate,issue:out_of_range",
                 "row:15,col:text,issue:missing_value",
-                "row:29,col:text,issue:duplicate_row",
             ],
             "fixes": [],
         },
         {
             "issues": [
                 "row:5,col:hate,issue:inconsistent_value",
-                "row:11,col:hate,issue:out_of_range",
                 "row:15,col:text,issue:missing_value",
                 "row:16,col:hate,issue:inconsistent_value",
                 "row:17,col:harassment,issue:inconsistent_value",
@@ -185,7 +185,7 @@ AGENT_TRAJECTORIES = {
                 "row:22,col:self_harm,issue:inconsistent_value",
                 "row:24,col:hate,issue:inconsistent_value",
                 "row:26,col:harassment,issue:inconsistent_value",
-                "row:29,col:text,issue:duplicate_row",
             ],
             "fixes": [
                 # All deterministic label flips:
@@ -196,7 +196,7 @@ AGENT_TRAJECTORIES = {
                 "row:5,col:hate,fix:0",             # false positive on idiom → unflag
                 "row:24,col:hate,fix:1",            # subset rule: hate_threatening needs hate
                 "row:26,col:harassment,fix:0",      # false positive on moral judgment → unflag
-                "row:11,col:hate,fix:0",            # out of range 2 → 0
             ],
         },
     ],

                 "row:16,col:hate,issue:inconsistent_value",
                 "row:17,col:harassment,issue:inconsistent_value",
                 "row:20,col:violence,issue:inconsistent_value",
+                "row:13,col:violence,issue:out_of_range",
                 "row:15,col:text,issue:missing_value",
+                "row:30,col:text,issue:duplicate_row",
             ],
             "fixes": [],
         },
         {
             "issues": [
                 "row:5,col:hate,issue:inconsistent_value",
+                "row:13,col:violence,issue:out_of_range",
                 "row:15,col:text,issue:missing_value",
                 "row:16,col:hate,issue:inconsistent_value",
                 "row:17,col:harassment,issue:inconsistent_value",
                 "row:22,col:self_harm,issue:inconsistent_value",
                 "row:24,col:hate,issue:inconsistent_value",
                 "row:26,col:harassment,issue:inconsistent_value",
+                "row:30,col:text,issue:duplicate_row",
             ],
             "fixes": [
                 # All deterministic label flips:
                 "row:5,col:hate,fix:0",             # false positive on idiom → unflag
                 "row:24,col:hate,fix:1",            # subset rule: hate_threatening needs hate
                 "row:26,col:harassment,fix:0",      # false positive on moral judgment → unflag
+                "row:13,col:violence,fix:0",         # out of range 3 → 0
             ],
         },
     ],

dataqa_env/server/tasks.py CHANGED Viewed

@@ -929,10 +929,10 @@ def create_task_moderation(seed: int = 42) -> Task:
                                difficulty=1.5))
     # Issue 7: Label value out of range (deterministic: must be 0 or 1)
-    r = 10  # row 11
-    data[r][3] = "2"  # hate=2 — invalid, must be 0 or 1
-    issues.append(PlantedIssue(row=r + 1, col="hate", issue_type="out_of_range",
-                               description="hate label is 2 but must be 0 or 1 — should be 0 (text is about immigration policy not hate speech)",
                                difficulty=1.0))
     # Issue 8: Empty text field (data pipeline artifact)
@@ -943,16 +943,15 @@ def create_task_moderation(seed: int = 42) -> Task:
                                difficulty=1.5))
     # Issue 9: Duplicate text (dedup failure)
-    r = 28  # row 29, copy text from row 4
-    data[r][1] = data[3][1]  # copy from row 4
     issues.append(PlantedIssue(row=r + 1, col="text", issue_type="duplicate_row",
                                description="Text is identical to row 4 — duplicate moderation example",
                                difficulty=1.5))
-    # Issue 10: Restaurant review falsely flagged as harassment
-    r = 28  # already changed text above, use different row
-    r = 25  # row 26, "ashamed of themselves" — strong language but not harassment
-    data[r][5] = "1"  # harassment=1 but it's moral judgment, not harassment
     issues.append(PlantedIssue(row=r + 1, col="harassment", issue_type="inconsistent_value",
                                description="Text expresses moral judgment ('should be ashamed') but is not harassment — harassment should be 0",
                                difficulty=2.5))

                                difficulty=1.5))
     # Issue 7: Label value out of range (deterministic: must be 0 or 1)
+    r = 12  # row 13, neutral text
+    data[r][4] = "3"  # violence=3 — invalid, must be 0 or 1
+    issues.append(PlantedIssue(row=r + 1, col="violence", issue_type="out_of_range",
+                               description="violence label is 3 but must be 0 or 1 — should be 0 (text is about adjusting strategy not violence)",
                                difficulty=1.0))
     # Issue 8: Empty text field (data pipeline artifact)
                                difficulty=1.5))
     # Issue 9: Duplicate text (dedup failure)
+    r = 29  # row 30, copy text from row 4
+    data[r][1] = data[3][1]  # copy from row 4 ("respectful of other people")
     issues.append(PlantedIssue(row=r + 1, col="text", issue_type="duplicate_row",
                                description="Text is identical to row 4 — duplicate moderation example",
                                difficulty=1.5))
+    # Issue 10: Moral judgment falsely flagged as harassment
+    r = 25  # row 26, "ashamed of themselves" — strong but not harassment
+    data[r][5] = "1"  # harassment=1 but it's moral judgment
     issues.append(PlantedIssue(row=r + 1, col="harassment", issue_type="inconsistent_value",
                                description="Text expresses moral judgment ('should be ashamed') but is not harassment — harassment should be 0",
                                difficulty=2.5))