magilogi
committed on
Commit
·
49b4a14
1
Parent(s):
3fd0dba
explanation
Browse files
- app.py +2 -2
- src/models_info.py +3 -3
app.py
CHANGED
@@ -17,7 +17,7 @@ explanation_data = {
|
|
17 |
"Description": [
|
18 |
"Model accuracy on the [Come up with a fitting name] task.",
|
19 |
"[How do we best explain this?]",
|
20 |
-
"
|
21 |
"Model accuracy on MedMCQA task with original data. (Only includes questions that overlap with the g2b dataset)",
|
22 |
"Difference in MedMCQA accuracy for swapped and non-swapped datasets, highlighting the impact of G2B drug name substitution on performance.",
|
23 |
"Model accuracy on MedQA (4 options) task where generic drug names are substituted with brand names.",
|
@@ -75,7 +75,7 @@ def create_bar_plot(df, col, title):
|
|
75 |
with gr.Blocks(css="custom.css") as demo:
|
76 |
with gr.Column():
|
77 |
gr.Markdown(
|
78 |
-
"""<div style="text-align: center;"><h1> <span style='color: #E6B800;'>🐰 RABBITS
|
79 |
<span style='color: #E6B800;'>T</span>erm <span style='color: #E6B800;'>S</span>ubstitutions for Language Models <span style='color: #E6B800;'></span></h1></div>"""
|
80 |
)
|
81 |
with gr.Row():
|
|
|
17 |
"Description": [
|
18 |
"Model accuracy on the [Come up with a fitting name] task.",
|
19 |
"[How do we best explain this?]",
|
20 |
+
"G2B Refers to the 'Generic' to 'Brand' name swap. This is model accuracy on MedMCQA task where generic drug names are substituted with brand names.",
|
21 |
"Model accuracy on MedMCQA task with original data. (Only includes questions that overlap with the g2b dataset)",
|
22 |
"Difference in MedMCQA accuracy for swapped and non-swapped datasets, highlighting the impact of G2B drug name substitution on performance.",
|
23 |
"Model accuracy on MedQA (4 options) task where generic drug names are substituted with brand names.",
|
|
|
75 |
with gr.Blocks(css="custom.css") as demo:
|
76 |
with gr.Column():
|
77 |
gr.Markdown(
|
78 |
+
"""<div style="text-align: center;"><h1> <span style='color: #E6B800;'>🐰 RABBITS</span>:<span style='color: #E6B800;'>R</span>obust <span style='color: #E6B800;'>A</span>ssessment of <span style='color: #E6B800;'>B</span>iomedical <span style='color: #E6B800;'>B</span>enchmarks <span style='color: #E6B800;'>I</span>nvolving drug
|
79 |
<span style='color: #E6B800;'>T</span>erm <span style='color: #E6B800;'>S</span>ubstitutions for Language Models <span style='color: #E6B800;'></span></h1></div>"""
|
80 |
)
|
81 |
with gr.Row():
|
src/models_info.py
CHANGED
@@ -54,15 +54,15 @@ model_info = {
|
|
54 |
},
|
55 |
"mistralai-Mistral-7B-v0.3": {
|
56 |
"link": "https://huggingface.co/mistralai/Mistral-7B-v0.3",
|
57 |
-
"tuning": "🟢" #
|
58 |
},
|
59 |
"mistralai-Mixtral-8x22B-v0.1": {
|
60 |
"link": "https://huggingface.co/mistralai/Mixtral-8x22B-v0.1",
|
61 |
-
"tuning": "🟢" #
|
62 |
},
|
63 |
"mistralai-Mixtral-8x7B-v0.1": {
|
64 |
"link": "https://huggingface.co/mistralai/Mixtral-8x7B-v0.1",
|
65 |
-
"tuning": "🟢" #
|
66 |
},
|
67 |
"ProbeMedicalYonseiMAILab-medllama3-v20": {
|
68 |
"link": "https://huggingface.co/ProbeMedicalYonseiMAILab/medllama3-v20",
|
|
|
54 |
},
|
55 |
"mistralai-Mistral-7B-v0.3": {
|
56 |
"link": "https://huggingface.co/mistralai/Mistral-7B-v0.3",
|
57 |
+
"tuning": "🟢" # pre-trained
|
58 |
},
|
59 |
"mistralai-Mixtral-8x22B-v0.1": {
|
60 |
"link": "https://huggingface.co/mistralai/Mixtral-8x22B-v0.1",
|
61 |
+
"tuning": "🟢" # pre-trained
|
62 |
},
|
63 |
"mistralai-Mixtral-8x7B-v0.1": {
|
64 |
"link": "https://huggingface.co/mistralai/Mixtral-8x7B-v0.1",
|
65 |
+
"tuning": "🟢" # pre-trained
|
66 |
},
|
67 |
"ProbeMedicalYonseiMAILab-medllama3-v20": {
|
68 |
"link": "https://huggingface.co/ProbeMedicalYonseiMAILab/medllama3-v20",
|