manishiitg
committed on
Commit
•
cefe1b9
1
Parent(s):
714cebb
Update README.md
Browse files
README.md
CHANGED
@@ -11,6 +11,58 @@ model-index:
|
|
11 |
---
|
12 |
|
13 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
14 |
DHARMA TINY EVAL
|
15 |
============
|
16 |
|
@@ -28,8 +80,6 @@ DHARMA TINY EVAL
|
|
28 |
| OpenHathi-7B-Hi-v0.1-Base | 0.2862 | 0.3333 | 0.5130 | 0.6077 | 0.4907 | 0.2301 | 0.3017 | 0.2677 | 0.1933 |
|
29 |
| Airavata | 0.2751 | 0.1274 | 0.2268 | 0.0615 | 0.3866 | 0.1104 | 0.2845 | 0.1450 | 0.3383 |
|
30 |
| gemma-7b-it | 0.1227 | 0.0786 | 0.0743 | 0.1808 | 0.1561 | 0.0491 | 0.1078 | 0.0818 | 0.0855 |
|
31 |
-
| Qwen1.5-72B-Chat-AWQ | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 |
|
32 |
-
| Qwen1.5-7B-Chat | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 |
|
33 |
|
34 |
#### Language En
|
35 |
|
@@ -45,7 +95,6 @@ DHARMA TINY EVAL
|
|
45 |
| open-aditi-hi-v1 | 0.8104 | 0.3902 | 0.2491 | 0.6962 | 0.5539 | 0.3681 | 0.6379 | 0.5056 | 0.5911 |
|
46 |
| Airavata | 0.7026 | 0.4282 | 0.3123 | 0.7192 | 0.5651 | 0.3313 | 0.5172 | 0.3792 | 0.5093 |
|
47 |
| OpenHathi-7B-Hi-v0.1-Base | 0.4684 | 0.3062 | 0.4758 | 0.6346 | 0.5167 | 0.2577 | 0.3017 | 0.2788 | 0.2714 |
|
48 |
-
| gemma-7b-it | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 | 0.0000 |
|
49 |
|
50 |
Task: BoolQ Metric: score
|
51 |
|
|
|
11 |
---
|
12 |
|
13 |
|
14 |
+
Preview of the dataset the model was trained on: https://huggingface.co/datasets/manishiitg/aditi-syn-v2
|
15 |
+
|
16 |
+
The synthetic dataset (https://huggingface.co/datasets/manishiitg/aditi-syn-v2) and the full data creation pipeline (https://github.com/manishiitg/aditi_dataset) have been open-sourced to provide transparency and foster further research in this domain. The dataset contains Hinglish (a blend of Hindi and English) data, as well as a diverse set of tasks spanning tool use, retrieval-augmented generation (RAG), mathematics, and reasoning – all in the Hindi language.
|
17 |
+
|
18 |
+
LMJudge Eval
|
19 |
+
============
|
20 |
+
|
21 |
+
https://github.com/manishiitg/IndicLMJudge
|
22 |
+
|
23 |
+
|
24 |
+
#### LLM Judge Language: hi
|
25 |
+
| Model | Language | Score | No. of Questions |
|
26 |
+
| --- | --- | --- | --- |
|
27 |
+
| mistralai/Mixtral-8x7B-Instruct-v0.1 | hi | 8.7148 | 554 |
|
28 |
+
| Qwen/Qwen1.5-72B-Chat-AWQ | hi | 8.3695 | 554 |
|
29 |
+
| manishiitg/open-aditi-v6-llama3 | hi | 8.2659 | 551 |
|
30 |
+
| Qwen/Qwen1.5-14B-Chat | hi | 8.2404 | 554 |
|
31 |
+
| google/gemma-7b-it | hi | 7.9152 | 554 |
|
32 |
+
| manishiitg/open-aditi-v6-gemma | hi | 7.8634 | 549 |
|
33 |
+
| Qwen/Qwen1.5-7B-Chat | hi | 7.8587 | 554 |
|
34 |
+
| manishiitg/open-aditi-hi-v3 | hi | 7.7644 | 554 |
|
35 |
+
| manishiitg/open-aditi-hi-v4 | hi | 7.6150 | 554 |
|
36 |
+
| manishiitg/open-aditi-hi-v2 | hi | 7.2518 | 554 |
|
37 |
+
| teknium/OpenHermes-2.5-Mistral-7B | hi | 7.2489 | 554 |
|
38 |
+
| ai4bharat/Airavata | hi | 6.9468 | 554 |
|
39 |
+
| 01-ai/Yi-34B-Chat | hi | 6.5801 | 554 |
|
40 |
+
| manishiitg/open-aditi-hi-v1 | hi | 4.7022 | 554 |
|
41 |
+
| sarvamai/OpenHathi-7B-Hi-v0.1-Base | hi | 4.2834 | 598 |
|
42 |
+
| Qwen/Qwen1.5-4B-Chat | hi | 4.1101 | 554 |
|
43 |
+
|
44 |
+
|
45 |
+
#### LLM Judge Language: en
|
46 |
+
| Model | Language | Score | No. of Questions |
|
47 |
+
| --- | --- | --- | --- |
|
48 |
+
| Qwen/Qwen1.5-14B-Chat | en | 9.1947 | 356 |
|
49 |
+
| Qwen/Qwen1.5-72B-Chat-AWQ | en | 9.1618 | 356 |
|
50 |
+
| Qwen/Qwen1.5-7B-Chat | en | 9.1570 | 356 |
|
51 |
+
| 01-ai/Yi-34B-Chat | en | 9.1368 | 356 |
|
52 |
+
| mistralai/Mixtral-8x7B-Instruct-v0.1 | en | 9.1306 | 356 |
|
53 |
+
| manishiitg/open-aditi-v6-gemma | en | 9.1003 | 356 |
|
54 |
+
| teknium/OpenHermes-2.5-Mistral-7B | en | 9.0230 | 356 |
|
55 |
+
| manishiitg/open-aditi-v6-llama3 | en | 9.0197 | 356 |
|
56 |
+
| manishiitg/open-aditi-hi-v3 | en | 8.9615 | 356 |
|
57 |
+
| manishiitg/open-aditi-hi-v4 | en | 8.9188 | 356 |
|
58 |
+
| google/gemma-7b-it | en | 8.8191 | 356 |
|
59 |
+
| Qwen/Qwen1.5-4B-Chat | en | 8.7500 | 356 |
|
60 |
+
| google/gemma-2b-it | en | 8.4671 | 356 |
|
61 |
+
| manishiitg/open-aditi-hi-v2 | en | 8.4584 | 356 |
|
62 |
+
| ai4bharat/Airavata | en | 7.3834 | 356 |
|
63 |
+
| manishiitg/open-aditi-hi-v1 | en | 6.6559 | 356 |
|
64 |
+
| sarvamai/OpenHathi-7B-Hi-v0.1-Base | en | 5.9567 | 312 |
|
65 |
+
|
66 |
DHARMA TINY EVAL
|
67 |
============
|
68 |
|
|
|
80 |
| OpenHathi-7B-Hi-v0.1-Base | 0.2862 | 0.3333 | 0.5130 | 0.6077 | 0.4907 | 0.2301 | 0.3017 | 0.2677 | 0.1933 |
|
81 |
| Airavata | 0.2751 | 0.1274 | 0.2268 | 0.0615 | 0.3866 | 0.1104 | 0.2845 | 0.1450 | 0.3383 |
|
82 |
| gemma-7b-it | 0.1227 | 0.0786 | 0.0743 | 0.1808 | 0.1561 | 0.0491 | 0.1078 | 0.0818 | 0.0855 |
|
|
|
|
|
83 |
|
84 |
#### Language En
|
85 |
|
|
|
95 |
| open-aditi-hi-v1 | 0.8104 | 0.3902 | 0.2491 | 0.6962 | 0.5539 | 0.3681 | 0.6379 | 0.5056 | 0.5911 |
|
96 |
| Airavata | 0.7026 | 0.4282 | 0.3123 | 0.7192 | 0.5651 | 0.3313 | 0.5172 | 0.3792 | 0.5093 |
|
97 |
| OpenHathi-7B-Hi-v0.1-Base | 0.4684 | 0.3062 | 0.4758 | 0.6346 | 0.5167 | 0.2577 | 0.3017 | 0.2788 | 0.2714 |
|
|
|
98 |
|
99 |
Task: BoolQ Metric: score
|
100 |
|