huseinzol05
committed on
Commit
•
c4e2aeb
1
Parent(s):
3607302
initial app
Browse files
- .gitignore +1 -0
- app.py +39 -2
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
__pycache__
|
app.py
CHANGED
@@ -11,15 +11,52 @@ INTRODUCTION_TEXT = """
|
|
11 |
|
12 |
π We evaluate models based on 4 datasets,
|
13 |
|
14 |
-
1.
|
15 |
2. Epenerbitan, https://huggingface.co/datasets/mesolitica/malaysian-ultrachat/resolve/main/ultrachat-epenerbitan-malay.jsonl
|
16 |
3. gov.my PDF files, https://huggingface.co/datasets/mesolitica/malaysian-ultrachat/resolve/main/ultrachat-gov.my.jsonl
|
17 |
-
4. lom.agc.gov.my PDF files, https://huggingface.co/datasets/mesolitica/malaysian-ultrachat/resolve/main/ultrachat-lom-agc.jsonl
|
18 |
"""
|
19 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
20 |
demo = gr.Blocks(css=custom_css)
|
21 |
with demo:
|
22 |
gr.HTML(TITLE)
|
23 |
gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
|
|
|
24 |
|
25 |
demo.launch()
|
|
|
11 |
|
12 |
π We evaluate models based on 4 datasets,
|
13 |
|
14 |
+
1. Research paper keyword `melayu` using Crossref, https://huggingface.co/datasets/mesolitica/malaysian-ultrachat/resolve/main/ultrachat-crossref-melayu-malay.jsonl
|
15 |
2. Epenerbitan, https://huggingface.co/datasets/mesolitica/malaysian-ultrachat/resolve/main/ultrachat-epenerbitan-malay.jsonl
|
16 |
3. gov.my PDF files, https://huggingface.co/datasets/mesolitica/malaysian-ultrachat/resolve/main/ultrachat-gov.my.jsonl
|
|
|
17 |
"""
|
18 |
|
19 |
+
close_source = [
|
20 |
+
{
|
21 |
+
'model': 'OpenAI ADA-002',
|
22 |
+
'Crossref Melayu top-1': 0.3155939351340496,
|
23 |
+
'Crossref Melayu top-3': 0.5120996083944171,
|
24 |
+
'Crossref Melayu top-5': 0.5878100210864544,
|
25 |
+
'Crossref Melayu top-10': 0.6721558389396526,
|
26 |
+
}
|
27 |
+
]
|
28 |
+
|
29 |
+
open_source = [
|
30 |
+
{
|
31 |
+
'model': '[llama2-embedding-600m-8k](https://huggingface.co/mesolitica/llama2-embedding-600m-8k)',
|
32 |
+
'Crossref Melayu top-1': 0.09549151521237072,
|
33 |
+
'Crossref Melayu top-3': 0.1834521538307059,
|
34 |
+
'Crossref Melayu top-5': 0.23375840947886334,
|
35 |
+
'Crossref Melayu top-10': 0.3098704689225826,
|
36 |
+
'lom.agc.gov.my top-1': 0.05215334826985312,
|
37 |
+
'lom.agc.gov.my top-3': 0.09932785660941,
|
38 |
+
'lom.agc.gov.my top-5': 0.12969878018421707,
|
39 |
+
'lom.agc.gov.my top-10': 0.1797361214836943,
|
40 |
+
},
|
41 |
+
{
|
42 |
+
'model': '[llama2-embedding-1b-8k](https://huggingface.co/mesolitica/llama2-embedding-1b-8k)',
|
43 |
+
'Crossref Melayu top-1': 0.06777788934631991,
|
44 |
+
'Crossref Melayu top-3': 0.142584596847073,
|
45 |
+
'Crossref Melayu top-5': 0.18817150316296816,
|
46 |
+
'Crossref Melayu top-10': 0.25715433276433375,
|
47 |
+
'lom.agc.gov.my top-1': 0.06870799103808813,
|
48 |
+
'lom.agc.gov.my top-3': 0.1343042071197411,
|
49 |
+
'lom.agc.gov.my top-5': 0.1717699775952203,
|
50 |
+
'lom.agc.gov.my top-10': 0.23089370176748816,
|
51 |
+
},
|
52 |
+
]
|
53 |
+
|
54 |
+
data = pd.DataFrame(close_source + open_source)
|
55 |
+
|
56 |
demo = gr.Blocks(css=custom_css)
|
57 |
with demo:
|
58 |
gr.HTML(TITLE)
|
59 |
gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
|
60 |
+
gr.DataFrame(data, datatype = 'markdown')
|
61 |
|
62 |
demo.launch()
|