huseinzol05 committed on
Commit
5f16d53
•
1 Parent(s): aaab57e

improve score

Browse files
Files changed (1) hide show
  1. app.py +9 -8
app.py CHANGED
@@ -15,9 +15,7 @@ INTRODUCTION_TEXT = """
15
  - This test is for 15 years old Malaysia student, it is about reading comprehension and general knowledge for malay language.
16
  2. Tatabahasa, contains 349 questions, https://github.com/mesolitica/malaysian-dataset/tree/master/llm-benchmark/tatabahasabm.tripod.com
17
  - This test is general test for malay grammar.
18
- 3. Translated IndoNLI to Malay, tested on `test_expert` dataset, https://huggingface.co/datasets/mesolitica/translated-indonli
19
- - This test is general test to language reasoning.
20
- 4. HumanEval, https://github.com/openai/human-eval
21
  - This test is for programming language understanding.
22
  """
23
 
@@ -71,10 +69,13 @@ open_source = [
71
  'Tatabahasa 3-shots': 27.507163323782237,
72
  },
73
  {
74
- 'model': '[malaysian-llama2-7b-32k-instructions](https://huggingface.co/mesolitica/malaysian-llama2-7b-32k-instructions)',
75
- 'BM-PT3 0-shot': 35.294117647058826,
76
- 'BM-PT3 1-shot': 21.153846153846153,
77
- 'BM-PT3 3-shots': 28.30188679245283,
 
 
 
78
  },
79
  {
80
  'model': '[malaysian-llama2-13b-32k](https://huggingface.co/mesolitica/llama-13b-hf-32768-fpf)',
@@ -120,7 +121,7 @@ open_source = [
120
  'BM-PT3 0-shot': 40.74074074074074,
121
  'BM-PT3 1-shot': 31.48148148148148,
122
  'BM-PT3 3-shots': 24.074074074074073,
123
- 'Tatabahasa 0-shot': 56.446991404011456,
124
  'Tatabahasa 1-shot': 49.28366762177651,
125
  'Tatabahasa 3-shots': 53.86819484240688
126
  },
 
15
  - This test is for 15 years old Malaysia student, it is about reading comprehension and general knowledge for malay language.
16
  2. Tatabahasa, contains 349 questions, https://github.com/mesolitica/malaysian-dataset/tree/master/llm-benchmark/tatabahasabm.tripod.com
17
  - This test is general test for malay grammar.
18
+ 3. HumanEval, https://github.com/openai/human-eval
 
 
19
  - This test is for programming language understanding.
20
  """
21
 
 
69
  'Tatabahasa 3-shots': 27.507163323782237,
70
  },
71
  {
72
+ 'model': '[malaysian-llama2-7b-32k-instructions](https://huggingface.co/mesolitica/malaysian-llama2-7b-32k-instructions-v2)',
73
+ 'BM-PT3 0-shot': 33.33333333333333,
74
+ 'BM-PT3 1-shot': 37.03703703703704,
75
+ 'BM-PT3 3-shots': 35.18518518518518,
76
+ 'Tatabahasa 0-shot': 54.72779369627507,
77
+ 'Tatabahasa 1-shot': 48.42406876790831,
78
+ 'Tatabahasa 3-shots': 41.833810888252145,
79
  },
80
  {
81
  'model': '[malaysian-llama2-13b-32k](https://huggingface.co/mesolitica/llama-13b-hf-32768-fpf)',
 
121
  'BM-PT3 0-shot': 40.74074074074074,
122
  'BM-PT3 1-shot': 31.48148148148148,
123
  'BM-PT3 3-shots': 24.074074074074073,
124
+ 'Tatabahasa 0-shot': 57.879656160458445,
125
  'Tatabahasa 1-shot': 49.28366762177651,
126
  'Tatabahasa 3-shots': 53.86819484240688
127
  },