Spaces:

AIM-Harvard
/

rabbits-leaderboard

Running

magilogi committed on Jun 12, 2024

Commit

49b4a14

1 Parent(s): 3fd0dba

explanation

Files changed (2) hide show

app.py CHANGED Viewed

@@ -17,7 +17,7 @@ explanation_data = {
     "Description": [
         "Model accuracy on the [Come up with a fitting name] task.",
         "[How do we best explain this?]",
-        "Model accuracy on MedMCQA task where generic drug names are substituted with brand names.",
         "Model accuracy on MedMCQA task with original data. (Only includes questions that overlap with the g2b dataset)",
         "Difference in MedMCQA accuracy for swapped and non-swapped datasets, highlighting the impact of G2B drug name substitution on performance.",
         "Model accuracy on MedQA (4 options) task where generic drug names are substituted with brand names.",
@@ -75,7 +75,7 @@ def create_bar_plot(df, col, title):
 with gr.Blocks(css="custom.css") as demo:
     with gr.Column():
         gr.Markdown(
-            """<div style="text-align: center;"><h1> <span style='color: #E6B800;'>🐰 RABBITS:</span> <span style='color: #E6B800;'>R</span>obust <span style='color: #E6B800;'>A</span>ssessment of <span style='color: #E6B800;'>B</span>iomedical <span style='color: #E6B800;'>B</span>enchmarks <span style='color: #E6B800;'>I</span>nvolving drug
 <span style='color: #E6B800;'>T</span>erm <span style='color: #E6B800;'>S</span>ubstitutions for Language Models <span style='color: #E6B800;'></span></h1></div>"""
         )
     with gr.Row():

     "Description": [
         "Model accuracy on the [Come up with a fitting name] task.",
         "[How do we best explain this?]",
+        "G2B Refers to the 'Generic' to 'Brand' name swap. This is model accuracy on MedMCQA task where generic drug names are substituted with brand names.",
         "Model accuracy on MedMCQA task with original data. (Only includes questions that overlap with the g2b dataset)",
         "Difference in MedMCQA accuracy for swapped and non-swapped datasets, highlighting the impact of G2B drug name substitution on performance.",
         "Model accuracy on MedQA (4 options) task where generic drug names are substituted with brand names.",
 with gr.Blocks(css="custom.css") as demo:
     with gr.Column():
         gr.Markdown(
+            """<div style="text-align: center;"><h1> <span style='color: #E6B800;'>🐰 RABBITS</span>:<span style='color: #E6B800;'>R</span>obust <span style='color: #E6B800;'>A</span>ssessment of <span style='color: #E6B800;'>B</span>iomedical <span style='color: #E6B800;'>B</span>enchmarks <span style='color: #E6B800;'>I</span>nvolving drug
 <span style='color: #E6B800;'>T</span>erm <span style='color: #E6B800;'>S</span>ubstitutions for Language Models <span style='color: #E6B800;'></span></h1></div>"""
         )
     with gr.Row():

src/models_info.py CHANGED Viewed

@@ -54,15 +54,15 @@ model_info = {
     },
     "mistralai-Mistral-7B-v0.3": {
         "link": "https://huggingface.co/mistralai/Mistral-7B-v0.3",
-        "tuning": "🟢"  # Continuously pre-trained
     },
     "mistralai-Mixtral-8x22B-v0.1": {
         "link": "https://huggingface.co/mistralai/Mixtral-8x22B-v0.1",
-        "tuning": "🟢"  # Continuously pre-trained
     },
     "mistralai-Mixtral-8x7B-v0.1": {
         "link": "https://huggingface.co/mistralai/Mixtral-8x7B-v0.1",
-        "tuning": "🟢"  # Continuously pre-trained
     },
     "ProbeMedicalYonseiMAILab-medllama3-v20": {
         "link": "https://huggingface.co/ProbeMedicalYonseiMAILab/medllama3-v20",

     },
     "mistralai-Mistral-7B-v0.3": {
         "link": "https://huggingface.co/mistralai/Mistral-7B-v0.3",
+        "tuning": "🟢"  # pre-trained
     },
     "mistralai-Mixtral-8x22B-v0.1": {
         "link": "https://huggingface.co/mistralai/Mixtral-8x22B-v0.1",
+        "tuning": "🟢"  #  pre-trained
     },
     "mistralai-Mixtral-8x7B-v0.1": {
         "link": "https://huggingface.co/mistralai/Mixtral-8x7B-v0.1",
+        "tuning": "🟢"  #  pre-trained
     },
     "ProbeMedicalYonseiMAILab-medllama3-v20": {
         "link": "https://huggingface.co/ProbeMedicalYonseiMAILab/medllama3-v20",