huseinzol05 committed on
Commit
c4e2aeb
‒
1 Parent(s): 3607302

initial app

Browse files
Files changed (2) hide show
  1. .gitignore +1 -0
  2. app.py +39 -2
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ __pycache__
app.py CHANGED
@@ -11,15 +11,52 @@ INTRODUCTION_TEXT = """
11
 
12
  📈 We evaluate models based on 4 datasets,
13
 
14
- 1. CrossRef Melayu related DOI, https://huggingface.co/datasets/mesolitica/malaysian-ultrachat/resolve/main/ultrachat-crossref-melayu-malay.jsonl
15
  2. Epenerbitan, https://huggingface.co/datasets/mesolitica/malaysian-ultrachat/resolve/main/ultrachat-epenerbitan-malay.jsonl
16
  3. gov.my PDF files, https://huggingface.co/datasets/mesolitica/malaysian-ultrachat/resolve/main/ultrachat-gov.my.jsonl
17
- 4. lom.agc.gov.my PDF files, https://huggingface.co/datasets/mesolitica/malaysian-ultrachat/resolve/main/ultrachat-lom-agc.jsonl
18
  """
19
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
20
  demo = gr.Blocks(css=custom_css)
21
  with demo:
22
  gr.HTML(TITLE)
23
  gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
 
24
 
25
  demo.launch()
 
11
 
12
  📈 We evaluate models based on 4 datasets,
13
 
14
+ 1. Research paper keyword `melayu` using Crossref, https://huggingface.co/datasets/mesolitica/malaysian-ultrachat/resolve/main/ultrachat-crossref-melayu-malay.jsonl
15
  2. Epenerbitan, https://huggingface.co/datasets/mesolitica/malaysian-ultrachat/resolve/main/ultrachat-epenerbitan-malay.jsonl
16
  3. gov.my PDF files, https://huggingface.co/datasets/mesolitica/malaysian-ultrachat/resolve/main/ultrachat-gov.my.jsonl
 
17
  """
18
 
19
+ close_source = [
20
+ {
21
+ 'model': 'OpenAI ADA-002',
22
+ 'Crossref Melayu top-1': 0.3155939351340496,
23
+ 'Crossref Melayu top-3': 0.5120996083944171,
24
+ 'Crossref Melayu top-5': 0.5878100210864544,
25
+ 'Crossref Melayu top-10': 0.6721558389396526,
26
+ }
27
+ ]
28
+
29
+ open_source = [
30
+ {
31
+ 'model': '[llama2-embedding-600m-8k](https://huggingface.co/mesolitica/llama2-embedding-600m-8k)',
32
+ 'Crossref Melayu top-1': 0.09549151521237072,
33
+ 'Crossref Melayu top-3': 0.1834521538307059,
34
+ 'Crossref Melayu top-5': 0.23375840947886334,
35
+ 'Crossref Melayu top-10': 0.3098704689225826,
36
+ 'lom.agc.gov.my top-1': 0.05215334826985312,
37
+ 'lom.agc.gov.my top-3': 0.09932785660941,
38
+ 'lom.agc.gov.my top-5': 0.12969878018421707,
39
+ 'lom.agc.gov.my top-10': 0.1797361214836943,
40
+ },
41
+ {
42
+ 'model': '[llama2-embedding-1b-8k](https://huggingface.co/mesolitica/llama2-embedding-1b-8k)',
43
+ 'Crossref Melayu top-1': 0.06777788934631991,
44
+ 'Crossref Melayu top-3': 0.142584596847073,
45
+ 'Crossref Melayu top-5': 0.18817150316296816,
46
+ 'Crossref Melayu top-10': 0.25715433276433375,
47
+ 'lom.agc.gov.my top-1': 0.06870799103808813,
48
+ 'lom.agc.gov.my top-3': 0.1343042071197411,
49
+ 'lom.agc.gov.my top-5': 0.1717699775952203,
50
+ 'lom.agc.gov.my top-10': 0.23089370176748816,
51
+ },
52
+ ]
53
+
54
+ data = pd.DataFrame(close_source + open_source)
55
+
56
  demo = gr.Blocks(css=custom_css)
57
  with demo:
58
  gr.HTML(TITLE)
59
  gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
60
+ gr.DataFrame(data, datatype = 'markdown')
61
 
62
  demo.launch()