manishiitg committed on
Commit
6980b87
1 Parent(s): 6e7d32a

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +53 -3
README.md CHANGED
@@ -10,6 +10,58 @@ model-index:
10
  results: []
11
  ---
12
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  DHARMA TINY EVAL
14
  ============
15
 
@@ -27,8 +79,6 @@ DHARMA TINY EVAL
27
  | OpenHathi-7B-Hi-v0.1-Base | 0.2862 | 0.3333 | 0.5130 | 0.6077 | 0.4907 | 0.2301 | 0.3017 | 0.2677 | 0.1933 |
28
  | Airavata | 0.2751 | 0.1274 | 0.2268 | 0.0615 | 0.3866 | 0.1104 | 0.2845 | 0.1450 | 0.3383 |
29
  | gemma-7b-it | 0.1227 | 0.0786 | 0.0743 | 0.1808 | 0.1561 | 0.0491 | 0.1078 | 0.0818 | 0.0855 |
30
- | Qwen1.5-72B-Chat-AWQ | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 |
31
- | Qwen1.5-7B-Chat | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 |
32
 
33
  #### Language En
34
 
@@ -44,7 +94,7 @@ DHARMA TINY EVAL
44
  | open-aditi-hi-v1 | 0.8104 | 0.3902 | 0.2491 | 0.6962 | 0.5539 | 0.3681 | 0.6379 | 0.5056 | 0.5911 |
45
  | Airavata | 0.7026 | 0.4282 | 0.3123 | 0.7192 | 0.5651 | 0.3313 | 0.5172 | 0.3792 | 0.5093 |
46
  | OpenHathi-7B-Hi-v0.1-Base | 0.4684 | 0.3062 | 0.4758 | 0.6346 | 0.5167 | 0.2577 | 0.3017 | 0.2788 | 0.2714 |
47
- | gemma-7b-it | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 |
48
 
49
  Task: BoolQ Metric: score
50
 
 
10
  results: []
11
  ---
12
 
13
+ Preview of dataset trained on: https://huggingface.co/datasets/manishiitg/aditi-syn-v2
14
+
15
+ The synthetic dataset (https://huggingface.co/datasets/manishiitg/aditi-syn-v2) and the full data creation pipeline (https://github.com/manishiitg/aditi_dataset) have been open-sourced to provide transparency and support further research. The dataset contains Hinglish (a blend of Hindi and English) data, as well as a diverse set of tasks spanning tools, retrieval-augmented generation (RAG), mathematics, and reasoning, all in Hindi.
16
+
17
+ LMJudge Eval
18
+ ============
19
+
20
+ https://github.com/manishiitg/IndicLMJudge
21
+
22
+
23
+ #### LLM Judge Language: hi
24
+ | Model | Language | Score | No. of Questions |
25
+ | --- | --- | --- | --- |
26
+ | mistralai/Mixtral-8x7B-Instruct-v0.1 | hi | 8.7148 | 554 |
27
+ | Qwen/Qwen1.5-72B-Chat-AWQ | hi | 8.3695 | 554 |
28
+ | manishiitg/open-aditi-v6-llama3 | hi | 8.2659 | 551 |
29
+ | Qwen/Qwen1.5-14B-Chat | hi | 8.2404 | 554 |
30
+ | google/gemma-7b-it | hi | 7.9152 | 554 |
31
+ | manishiitg/open-aditi-v6-gemma | hi | 7.8634 | 549 |
32
+ | Qwen/Qwen1.5-7B-Chat | hi | 7.8587 | 554 |
33
+ | manishiitg/open-aditi-hi-v3 | hi | 7.7644 | 554 |
34
+ | manishiitg/open-aditi-hi-v4 | hi | 7.6150 | 554 |
35
+ | manishiitg/open-aditi-hi-v2 | hi | 7.2518 | 554 |
36
+ | teknium/OpenHermes-2.5-Mistral-7B | hi | 7.2489 | 554 |
37
+ | ai4bharat/Airavata | hi | 6.9468 | 554 |
38
+ | 01-ai/Yi-34B-Chat | hi | 6.5801 | 554 |
39
+ | manishiitg/open-aditi-hi-v1 | hi | 4.7022 | 554 |
40
+ | sarvamai/OpenHathi-7B-Hi-v0.1-Base | hi | 4.2834 | 598 |
41
+ | Qwen/Qwen1.5-4B-Chat | hi | 4.1101 | 554 |
42
+
43
+
44
+ #### LLM Judge Language: en
45
+ | Model | Language | Score | No. of Questions |
46
+ | --- | --- | --- | --- |
47
+ | Qwen/Qwen1.5-14B-Chat | en | 9.1947 | 356 |
48
+ | Qwen/Qwen1.5-72B-Chat-AWQ | en | 9.1618 | 356 |
49
+ | Qwen/Qwen1.5-7B-Chat | en | 9.1570 | 356 |
50
+ | 01-ai/Yi-34B-Chat | en | 9.1368 | 356 |
51
+ | mistralai/Mixtral-8x7B-Instruct-v0.1 | en | 9.1306 | 356 |
52
+ | manishiitg/open-aditi-v6-gemma | en | 9.1003 | 356 |
53
+ | teknium/OpenHermes-2.5-Mistral-7B | en | 9.0230 | 356 |
54
+ | manishiitg/open-aditi-v6-llama3 | en | 9.0197 | 356 |
55
+ | manishiitg/open-aditi-hi-v3 | en | 8.9615 | 356 |
56
+ | manishiitg/open-aditi-hi-v4 | en | 8.9188 | 356 |
57
+ | google/gemma-7b-it | en | 8.8191 | 356 |
58
+ | Qwen/Qwen1.5-4B-Chat | en | 8.7500 | 356 |
59
+ | google/gemma-2b-it | en | 8.4671 | 356 |
60
+ | manishiitg/open-aditi-hi-v2 | en | 8.4584 | 356 |
61
+ | ai4bharat/Airavata | en | 7.3834 | 356 |
62
+ | manishiitg/open-aditi-hi-v1 | en | 6.6559 | 356 |
63
+ | sarvamai/OpenHathi-7B-Hi-v0.1-Base | en | 5.9567 | 312 |
64
+
65
  DHARMA TINY EVAL
66
  ============
67
 
 
79
  | OpenHathi-7B-Hi-v0.1-Base | 0.2862 | 0.3333 | 0.5130 | 0.6077 | 0.4907 | 0.2301 | 0.3017 | 0.2677 | 0.1933 |
80
  | Airavata | 0.2751 | 0.1274 | 0.2268 | 0.0615 | 0.3866 | 0.1104 | 0.2845 | 0.1450 | 0.3383 |
81
  | gemma-7b-it | 0.1227 | 0.0786 | 0.0743 | 0.1808 | 0.1561 | 0.0491 | 0.1078 | 0.0818 | 0.0855 |
 
 
82
 
83
  #### Language En
84
 
 
94
  | open-aditi-hi-v1 | 0.8104 | 0.3902 | 0.2491 | 0.6962 | 0.5539 | 0.3681 | 0.6379 | 0.5056 | 0.5911 |
95
  | Airavata | 0.7026 | 0.4282 | 0.3123 | 0.7192 | 0.5651 | 0.3313 | 0.5172 | 0.3792 | 0.5093 |
96
  | OpenHathi-7B-Hi-v0.1-Base | 0.4684 | 0.3062 | 0.4758 | 0.6346 | 0.5167 | 0.2577 | 0.3017 | 0.2788 | 0.2714 |
97
+
98
 
99
  Task: BoolQ Metric: score
100