model update

Browse files

Files changed (2) hide show

README.md +29 -30
relation_mapping.json +1 -0

README.md CHANGED Viewed

@@ -14,7 +14,7 @@ model-index:
     metrics:
     - name: Accuracy
       type: accuracy
-      value: None
   - task:
       name: Analogy Questions (SAT full)
       type: multiple-choice-qa
@@ -25,7 +25,7 @@ model-index:
     metrics:
     - name: Accuracy
       type: accuracy
-      value: None
   - task:
       name: Analogy Questions (SAT)
       type: multiple-choice-qa
@@ -36,7 +36,7 @@ model-index:
     metrics:
     - name: Accuracy
       type: accuracy
-      value: None
   - task:
       name: Analogy Questions (BATS)
       type: multiple-choice-qa
@@ -47,7 +47,7 @@ model-index:
     metrics:
     - name: Accuracy
       type: accuracy
-      value: None
   - task:
       name: Analogy Questions (Google)
       type: multiple-choice-qa
@@ -58,7 +58,7 @@ model-index:
     metrics:
     - name: Accuracy
       type: accuracy
-      value: None
   - task:
       name: Analogy Questions (U2)
       type: multiple-choice-qa
@@ -69,7 +69,7 @@ model-index:
     metrics:
     - name: Accuracy
       type: accuracy
-      value: None
   - task:
       name: Analogy Questions (U4)
       type: multiple-choice-qa
@@ -80,7 +80,7 @@ model-index:
     metrics:
     - name: Accuracy
       type: accuracy
-      value: None
   - task:
       name: Lexical Relation Classification (BLESS)
       type: classification
@@ -91,10 +91,10 @@ model-index:
     metrics:
     - name: F1
       type: f1
-      value: None
     - name: F1 (macro)
       type: f1_macro
-      value: None
   - task:
       name: Lexical Relation Classification (CogALexV)
       type: classification
@@ -105,10 +105,10 @@ model-index:
     metrics:
     - name: F1
       type: f1
-      value: None
     - name: F1 (macro)
       type: f1_macro
-      value: None
   - task:
       name: Lexical Relation Classification (EVALution)
       type: classification
@@ -119,10 +119,10 @@ model-index:
     metrics:
     - name: F1
       type: f1
-      value: None
     - name: F1 (macro)
       type: f1_macro
-      value: None
   - task:
       name: Lexical Relation Classification (K&H+N)
       type: classification
@@ -133,10 +133,10 @@ model-index:
     metrics:
     - name: F1
       type: f1
-      value: None
     - name: F1 (macro)
       type: f1_macro
-      value: None
   - task:
       name: Lexical Relation Classification (ROOT09)
       type: classification
@@ -147,10 +147,10 @@ model-index:
     metrics:
     - name: F1
       type: f1
-      value: None
     - name: F1 (macro)
       type: f1_macro
-      value: None
 ---
 # relbert/relbert-roberta-base-semeval2012-v6-average-prompt-b-triplet-1
@@ -160,20 +160,20 @@ RelBERT fine-tuned from [roberta-base](https://huggingface.co/roberta-base) on
 Fine-tuning is done via the [RelBERT](https://github.com/asahi417/relbert) library (see the repository for more details).
 It achieves the following results on the relation understanding tasks:
 - Analogy Question ([dataset](https://huggingface.co/datasets/relbert/analogy_questions), [full result](https://huggingface.co/relbert/relbert-roberta-base-semeval2012-v6-average-prompt-b-triplet-1/raw/main/analogy.json)):
-    - Accuracy on SAT (full): None
-    - Accuracy on SAT: None
-    - Accuracy on BATS: None
-    - Accuracy on U2: None
-    - Accuracy on U4: None
-    - Accuracy on Google: None
 - Lexical Relation Classification ([dataset](https://huggingface.co/datasets/relbert/lexical_relation_classification), [full result](https://huggingface.co/relbert/relbert-roberta-base-semeval2012-v6-average-prompt-b-triplet-1/raw/main/classification.json)):
-    - Micro F1 score on BLESS: None
-    - Micro F1 score on CogALexV: None
-    - Micro F1 score on EVALution: None
-    - Micro F1 score on K&H+N: None
-    - Micro F1 score on ROOT09: None
 - Relation Mapping ([dataset](https://huggingface.co/datasets/relbert/relation_mapping), [full result](https://huggingface.co/relbert/relbert-roberta-base-semeval2012-v6-average-prompt-b-triplet-1/raw/main/relation_mapping.json)):
-    - Accuracy on Relation Mapping: None
 ### Usage
@@ -198,7 +198,6 @@ The following hyperparameters were used during training:
  - split: train
  - split_eval: validation
  - template_mode: manual
- - template: Today, I finally discovered the relation between <subj> and <obj> : <obj>  is <subj>'s <mask>
  - loss_function: triplet
  - classification_loss: False
  - temperature_nce_constant: 0.05

     metrics:
     - name: Accuracy
       type: accuracy
+      value: 0.7449603174603174
   - task:
       name: Analogy Questions (SAT full)
       type: multiple-choice-qa
     metrics:
     - name: Accuracy
       type: accuracy
+      value: 0.3502673796791444
   - task:
       name: Analogy Questions (SAT)
       type: multiple-choice-qa
     metrics:
     - name: Accuracy
       type: accuracy
+      value: 0.3560830860534125
   - task:
       name: Analogy Questions (BATS)
       type: multiple-choice-qa
     metrics:
     - name: Accuracy
       type: accuracy
+      value: 0.3468593663146192
   - task:
       name: Analogy Questions (Google)
       type: multiple-choice-qa
     metrics:
     - name: Accuracy
       type: accuracy
+      value: 0.432
   - task:
       name: Analogy Questions (U2)
       type: multiple-choice-qa
     metrics:
     - name: Accuracy
       type: accuracy
+      value: 0.37719298245614036
   - task:
       name: Analogy Questions (U4)
       type: multiple-choice-qa
     metrics:
     - name: Accuracy
       type: accuracy
+      value: 0.38425925925925924
   - task:
       name: Lexical Relation Classification (BLESS)
       type: classification
     metrics:
     - name: F1
       type: f1
+      value: 0.8523429260207925
     - name: F1 (macro)
       type: f1_macro
+      value: 0.8411456349485952
   - task:
       name: Lexical Relation Classification (CogALexV)
       type: classification
     metrics:
     - name: F1
       type: f1
+      value: 0.8157276995305164
     - name: F1 (macro)
       type: f1_macro
+      value: 0.5982289168562968
   - task:
       name: Lexical Relation Classification (EVALution)
       type: classification
     metrics:
     - name: F1
       type: f1
+      value: 0.6386782231852655
     - name: F1 (macro)
       type: f1_macro
+      value: 0.6034154846314037
   - task:
       name: Lexical Relation Classification (K&H+N)
       type: classification
     metrics:
     - name: F1
       type: f1
+      value: 0.95875356472143
     - name: F1 (macro)
       type: f1_macro
+      value: 0.8723815565345302
   - task:
       name: Lexical Relation Classification (ROOT09)
       type: classification
     metrics:
     - name: F1
       type: f1
+      value: 0.846443121278596
     - name: F1 (macro)
       type: f1_macro
+      value: 0.8238870756074439
 ---
 # relbert/relbert-roberta-base-semeval2012-v6-average-prompt-b-triplet-1
 Fine-tuning is done via the [RelBERT](https://github.com/asahi417/relbert) library (see the repository for more details).
 It achieves the following results on the relation understanding tasks:
 - Analogy Question ([dataset](https://huggingface.co/datasets/relbert/analogy_questions), [full result](https://huggingface.co/relbert/relbert-roberta-base-semeval2012-v6-average-prompt-b-triplet-1/raw/main/analogy.json)):
+    - Accuracy on SAT (full): 0.3502673796791444
+    - Accuracy on SAT: 0.3560830860534125
+    - Accuracy on BATS: 0.3468593663146192
+    - Accuracy on U2: 0.37719298245614036
+    - Accuracy on U4: 0.38425925925925924
+    - Accuracy on Google: 0.432
 - Lexical Relation Classification ([dataset](https://huggingface.co/datasets/relbert/lexical_relation_classification), [full result](https://huggingface.co/relbert/relbert-roberta-base-semeval2012-v6-average-prompt-b-triplet-1/raw/main/classification.json)):
+    - Micro F1 score on BLESS: 0.8523429260207925
+    - Micro F1 score on CogALexV: 0.8157276995305164
+    - Micro F1 score on EVALution: 0.6386782231852655
+    - Micro F1 score on K&H+N: 0.95875356472143
+    - Micro F1 score on ROOT09: 0.846443121278596
 - Relation Mapping ([dataset](https://huggingface.co/datasets/relbert/relation_mapping), [full result](https://huggingface.co/relbert/relbert-roberta-base-semeval2012-v6-average-prompt-b-triplet-1/raw/main/relation_mapping.json)):
+    - Accuracy on Relation Mapping: 0.7449603174603174
 ### Usage
  - split: train
  - split_eval: validation
  - template_mode: manual
  - loss_function: triplet
  - classification_loss: False
  - temperature_nce_constant: 0.05

relation_mapping.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"accuracy": 0.7449603174603174, "prediction": [{"source": ["solar system", "sun", "planet", "mass", "attracts", "revolves", "gravity"], "true": ["atom", "nucleus", "electron", "charge", "attracts", "revolves", "electromagnetism"], "pred": ["electromagnetism", "atom", "nucleus", "charge", "attracts", "revolves", "electron"], "alignment_match": false, "accuracy": 0.42857142857142855, "similarity": 0.9978007003830888, "similarity_true": 0.9975875796811317}, {"source": ["water", "flows", "pressure", "water tower", "bucket", "filling", "emptying", "hydrodynamics"], "true": ["heat", "transfers", "temperature", "burner", "kettle", "heating", "cooling", "thermodynamics"], "pred": ["kettle", "transfers", "heat", "temperature", "burner", "cooling", "heating", "thermodynamics"], "alignment_match": false, "accuracy": 0.25, "similarity": 0.9949383115958428, "similarity_true": 0.9947620909443101}, {"source": ["waves", "shore", "reflects", "water", "breakwater", "rough", "calm", "crashing"], "true": ["sounds", "wall", "echoes", "air", "insulation", "loud", "quiet", "vibrating"], "pred": ["sounds", "wall", "echoes", "air", "vibrating", "loud", "quiet", "insulation"], "alignment_match": false, "accuracy": 0.75, "similarity": 0.9968483759183417, "similarity_true": 0.9967963112911737}, {"source": ["combustion", "fire", "fuel", "burning", "hot", "intense", "oxygen", "carbon dioxide"], "true": ["respiration", "animal", "food", "breathing", "living", "vigorous", "oxygen", "carbon dioxide"], "pred": ["respiration", "animal", "food", "breathing", "living", "vigorous", "oxygen", "carbon dioxide"], "alignment_match": true, "accuracy": 1, "similarity": 0.9981043172055925, "similarity_true": 0.9981043172055925}, {"source": ["sound", "low", "high", "echoes", "loud", "quiet", "horn"], "true": ["light", "red", "violet", "reflects", "bright", "dim", "lens"], "pred": ["light", "red", "bright", "reflects", "dim", "violet", "lens"], "alignment_match": false, "accuracy": 0.5714285714285714, 
"similarity": 0.9970595350651401, "similarity_true": 0.9969368095324194}, {"source": ["projectile", "trajectory", "earth", "parabolic", "air", "gravity", "attracts"], "true": ["planet", "orbit", "sun", "elliptical", "space", "gravity", "attracts"], "pred": ["sun", "orbit", "planet", "elliptical", "space", "gravity", "attracts"], "alignment_match": false, "accuracy": 0.7142857142857143, "similarity": 0.9983016817773436, "similarity_true": 0.9983015096314236}, {"source": ["breeds", "selection", "conformance", "artificial", "popularity", "breeding", "domesticated"], "true": ["species", "competition", "adaptation", "natural", "fitness", "mating", "wild"], "pred": ["species", "adaptation", "competition", "natural", "fitness", "mating", "wild"], "alignment_match": false, "accuracy": 0.7142857142857143, "similarity": 0.9964612059134946, "similarity_true": 0.9964290024743016}, {"source": ["ball", "billiards", "speed", "table", "bouncing", "moving", "slow", "fast"], "true": ["molecules", "gas", "temperature", "container", "pressing", "moving", "cold", "hot"], "pred": ["molecules", "gas", "temperature", "container", "pressing", "moving", "cold", "hot"], "alignment_match": true, "accuracy": 1, "similarity": 0.9975199728114164, "similarity_true": 0.9975199728114164}, {"source": ["computer", "processing", "erasing", "write", "read", "memory", "outputs", "inputs", "bug"], "true": ["mind", "thinking", "forgetting", "memorize", "remember", "memory", "muscles", "senses", "mistake"], "pred": ["mind", "thinking", "memorize", "forgetting", "remember", "memory", "muscles", "senses", "mistake"], "alignment_match": false, "accuracy": 0.7777777777777778, "similarity": 0.9965320817380313, "similarity_true": 0.9964552173386212}, {"source": ["slot machines", "reels", "spinning", "winning", "losing"], "true": ["bacteria", "genes", "mutating", "reproducing", "dying"], "pred": ["mutating", "genes", "bacteria", "reproducing", "dying"], "alignment_match": false, "accuracy": 0.6, "similarity": 
0.9945571008641886, "similarity_true": 0.9945563331831058}, {"source": ["war", "soldier", "destroy", "fighting", "defeat", "attacks", "weapon"], "true": ["argument", "debater", "refute", "arguing", "acceptance", "criticizes", "logic"], "pred": ["argument", "debater", "refute", "arguing", "acceptance", "criticizes", "logic"], "alignment_match": true, "accuracy": 1, "similarity": 0.9945850218735248, "similarity_true": 0.9945850218735248}, {"source": ["buyer", "merchandise", "buying", "selling", "returning", "valuable", "worthless"], "true": ["believer", "belief", "accepting", "advocating", "rejecting", "true", "false"], "pred": ["believer", "belief", "rejecting", "advocating", "accepting", "true", "false"], "alignment_match": false, "accuracy": 0.7142857142857143, "similarity": 0.9957467710289237, "similarity_true": 0.995739333833242}, {"source": ["foundations", "buildings", "supporting", "solid", "weak", "crack"], "true": ["reasons", "theories", "confirming", "rational", "dubious", "flaw"], "pred": ["reasons", "theories", "confirming", "rational", "dubious", "flaw"], "alignment_match": true, "accuracy": 1, "similarity": 0.996877981935695, "similarity_true": 0.996877981935695}, {"source": ["obstructions", "destination", "route", "traveller", "traveling", "companion", "arriving"], "true": ["difficulties", "goal", "plan", "person", "problem solving", "partner", "succeeding"], "pred": ["problem solving", "goal", "plan", "person", "difficulties", "partner", "succeeding"], "alignment_match": false, "accuracy": 0.7142857142857143, "similarity": 0.9947483897730063, "similarity_true": 0.9947357996316091}, {"source": ["money", "allocate", "budget", "effective", "cheap", "expansive"], "true": ["time", "invest", "schedule", "efficient", "quick", "slow"], "pred": ["time", "invest", "schedule", "efficient", "quick", "slow"], "alignment_match": true, "accuracy": 1, "similarity": 0.997373157147748, "similarity_true": 0.997373157147748}, {"source": ["seeds", "planted", "fruitful", 
"fruit", "grow", "wither", "blossom"], "true": ["ideas", "inspired", "productive", "product", "develop", "fail", "succeed"], "pred": ["ideas", "inspired", "productive", "product", "develop", "fail", "succeed"], "alignment_match": true, "accuracy": 1, "similarity": 0.9964193622914028, "similarity_true": 0.9964193622914028}, {"source": ["machine", "working", "turned on", "turned off", "broken", "power", "repair"], "true": ["mind", "thinking", "awake", "asleep", "confused", "intelligence", "therapy"], "pred": ["mind", "asleep", "awake", "thinking", "confused", "intelligence", "therapy"], "alignment_match": false, "accuracy": 0.7142857142857143, "similarity": 0.9956977474695079, "similarity_true": 0.9956832817196968}, {"source": ["object", "hold", "weight", "heavy", "light"], "true": ["idea", "understand", "analyze", "important", "trivial"], "pred": ["idea", "analyze", "understand", "trivial", "important"], "alignment_match": false, "accuracy": 0.2, "similarity": 0.9954065370534377, "similarity_true": 0.9947540103505097}, {"source": ["follow", "leader", "path", "follower", "lost", "wanders", "twisted", "straight"], "true": ["understand", "speaker", "argument", "listener", "misunderstood", "digresses", "complicated", "simple"], "pred": ["understand", "speaker", "argument", "listener", "complicated", "digresses", "misunderstood", "simple"], "alignment_match": false, "accuracy": 0.75, "similarity": 0.9958884956064967, "similarity_true": 0.9958305143006762}, {"source": ["seeing", "light", "illuminating", "darkness", "view", "hidden"], "true": ["understanding", "knowledge", "explaining", "confusion", "interpretation", "secret"], "pred": ["understanding", "knowledge", "explaining", "confusion", "interpretation", "secret"], "alignment_match": true, "accuracy": 1, "similarity": 0.9966974449211523, "similarity_true": 0.9966974449211523}]}