Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Clémentine
committed on
Commit
·
06fe586
1
Parent(s):
676e2ea
added debug mode locally, fixed a couple typos
Browse files
app.py
CHANGED
@@ -33,6 +33,8 @@ ref_level_len = {"validation": {1: 53, 2: 86, 3: 26}, "test": {1: 93, 2: 159, 3:
|
|
33 |
|
34 |
os.makedirs("scored", exist_ok=True)
|
35 |
|
|
|
|
|
36 |
# Display the results
|
37 |
eval_results = load_dataset(RESULTS_DATASET, YEAR_VERSION, token=TOKEN, download_mode="force_redownload", verification_mode=VerificationMode.NO_CHECKS, trust_remote_code=True)
|
38 |
contact_infos = load_dataset(CONTACT_DATASET, YEAR_VERSION, token=TOKEN, download_mode="force_redownload", verification_mode=VerificationMode.NO_CHECKS, trust_remote_code=True)
|
@@ -81,8 +83,8 @@ def add_new_eval(
|
|
81 |
profile: gr.OAuthProfile,
|
82 |
):
|
83 |
contact_infos = load_dataset(CONTACT_DATASET, YEAR_VERSION, token=TOKEN, download_mode="force_redownload", verification_mode=VerificationMode.NO_CHECKS, trust_remote_code=True)
|
84 |
-
user_submission_dates = sorted(row["date"] for row in
|
85 |
-
if user_submission_dates[-1] == datetime.datetime.today().strftime('%Y-%m-%d'):
|
86 |
return format_error("You already submitted once today, please try again tomorrow.")
|
87 |
|
88 |
|
@@ -102,13 +104,16 @@ def add_new_eval(
|
|
102 |
return format_warning("Please attach a file.")
|
103 |
|
104 |
# Save submitted file
|
105 |
-
|
106 |
-
|
107 |
-
|
108 |
-
|
109 |
-
|
110 |
-
|
111 |
-
|
|
|
|
|
|
|
112 |
|
113 |
# Compute score
|
114 |
file_path = path_to_file.name
|
@@ -157,24 +162,27 @@ def add_new_eval(
|
|
157 |
return format_error(f"Your submission has {num_questions[1]} questions for level 1, {num_questions[2]} for level 2, and {num_questions[3]} for level 3, but it should have {ref_level_len[val_or_test][1]}, {ref_level_len[val_or_test][2]}, and {ref_level_len[val_or_test][3]} respectively. Please check your submission.")
|
158 |
|
159 |
# Save scored file
|
160 |
-
|
161 |
-
|
162 |
-
|
163 |
-
path_in_repo=f"{organisation}/{model}/{YEAR_VERSION}_{val_or_test}_scored_{datetime.datetime.today()}.jsonl",
|
164 |
-
repo_type="dataset",
|
165 |
-
token=TOKEN
|
166 |
-
)
|
167 |
-
|
168 |
-
# Save scored file
|
169 |
-
if is_validation:
|
170 |
api.upload_file(
|
171 |
-
repo_id=
|
172 |
path_or_fileobj=f"scored/{organisation}_{model}.jsonl",
|
173 |
path_in_repo=f"{organisation}/{model}/{YEAR_VERSION}_{val_or_test}_scored_{datetime.datetime.today()}.jsonl",
|
174 |
repo_type="dataset",
|
175 |
token=TOKEN
|
176 |
)
|
177 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
178 |
# Actual submission
|
179 |
eval_entry = {
|
180 |
"model": model,
|
@@ -193,7 +201,10 @@ def add_new_eval(
|
|
193 |
|
194 |
eval_results[val_or_test] = eval_results[val_or_test].add_item(eval_entry)
|
195 |
print(eval_results)
|
196 |
-
|
|
|
|
|
|
|
197 |
|
198 |
contact_info = {
|
199 |
"model": model,
|
@@ -205,7 +216,10 @@ def add_new_eval(
|
|
205 |
"date": datetime.datetime.today().strftime('%Y-%m-%d')
|
206 |
}
|
207 |
contact_infos[val_or_test]= contact_infos[val_or_test].add_item(contact_info)
|
208 |
-
|
|
|
|
|
|
|
209 |
|
210 |
return format_log(f"Model {model} submitted by {organisation} successfully.\nPlease wait a few hours and refresh the leaderboard to see your score displayed.")
|
211 |
|
|
|
33 |
|
34 |
os.makedirs("scored", exist_ok=True)
|
35 |
|
36 |
+
LOCAL_DEBUG = False
|
37 |
+
|
38 |
# Display the results
|
39 |
eval_results = load_dataset(RESULTS_DATASET, YEAR_VERSION, token=TOKEN, download_mode="force_redownload", verification_mode=VerificationMode.NO_CHECKS, trust_remote_code=True)
|
40 |
contact_infos = load_dataset(CONTACT_DATASET, YEAR_VERSION, token=TOKEN, download_mode="force_redownload", verification_mode=VerificationMode.NO_CHECKS, trust_remote_code=True)
|
|
|
83 |
profile: gr.OAuthProfile,
|
84 |
):
|
85 |
contact_infos = load_dataset(CONTACT_DATASET, YEAR_VERSION, token=TOKEN, download_mode="force_redownload", verification_mode=VerificationMode.NO_CHECKS, trust_remote_code=True)
|
86 |
+
user_submission_dates = sorted(row["date"] for row in contact_infos[val_or_test] if row["username"] == profile.username)
|
87 |
+
if len(user_submission_dates) > 0 and user_submission_dates[-1] == datetime.datetime.today().strftime('%Y-%m-%d'):
|
88 |
return format_error("You already submitted once today, please try again tomorrow.")
|
89 |
|
90 |
|
|
|
104 |
return format_warning("Please attach a file.")
|
105 |
|
106 |
# Save submitted file
|
107 |
+
if LOCAL_DEBUG:
|
108 |
+
print("mock uploaded submission")
|
109 |
+
else:
|
110 |
+
api.upload_file(
|
111 |
+
repo_id=SUBMISSION_DATASET,
|
112 |
+
path_or_fileobj=path_to_file.name,
|
113 |
+
path_in_repo=f"{organisation}/{model}/{YEAR_VERSION}_{val_or_test}_raw_{datetime.datetime.today()}.jsonl",
|
114 |
+
repo_type="dataset",
|
115 |
+
token=TOKEN
|
116 |
+
)
|
117 |
|
118 |
# Compute score
|
119 |
file_path = path_to_file.name
|
|
|
162 |
return format_error(f"Your submission has {num_questions[1]} questions for level 1, {num_questions[2]} for level 2, and {num_questions[3]} for level 3, but it should have {ref_level_len[val_or_test][1]}, {ref_level_len[val_or_test][2]}, and {ref_level_len[val_or_test][3]} respectively. Please check your submission.")
|
163 |
|
164 |
# Save scored file
|
165 |
+
if LOCAL_DEBUG:
|
166 |
+
print("mock uploaded scored submission")
|
167 |
+
else:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
168 |
api.upload_file(
|
169 |
+
repo_id=SUBMISSION_DATASET,
|
170 |
path_or_fileobj=f"scored/{organisation}_{model}.jsonl",
|
171 |
path_in_repo=f"{organisation}/{model}/{YEAR_VERSION}_{val_or_test}_scored_{datetime.datetime.today()}.jsonl",
|
172 |
repo_type="dataset",
|
173 |
token=TOKEN
|
174 |
)
|
175 |
|
176 |
+
# Save scored file
|
177 |
+
if is_validation:
|
178 |
+
api.upload_file(
|
179 |
+
repo_id=SUBMISSION_DATASET_PUBLIC,
|
180 |
+
path_or_fileobj=f"scored/{organisation}_{model}.jsonl",
|
181 |
+
path_in_repo=f"{organisation}/{model}/{YEAR_VERSION}_{val_or_test}_scored_{datetime.datetime.today()}.jsonl",
|
182 |
+
repo_type="dataset",
|
183 |
+
token=TOKEN
|
184 |
+
)
|
185 |
+
|
186 |
# Actual submission
|
187 |
eval_entry = {
|
188 |
"model": model,
|
|
|
201 |
|
202 |
eval_results[val_or_test] = eval_results[val_or_test].add_item(eval_entry)
|
203 |
print(eval_results)
|
204 |
+
if LOCAL_DEBUG:
|
205 |
+
print("mock uploaded results to lb")
|
206 |
+
else:
|
207 |
+
eval_results.push_to_hub(RESULTS_DATASET, config_name = YEAR_VERSION, token=TOKEN)
|
208 |
|
209 |
contact_info = {
|
210 |
"model": model,
|
|
|
216 |
"date": datetime.datetime.today().strftime('%Y-%m-%d')
|
217 |
}
|
218 |
contact_infos[val_or_test]= contact_infos[val_or_test].add_item(contact_info)
|
219 |
+
if LOCAL_DEBUG:
|
220 |
+
print("mock uploaded contact info")
|
221 |
+
else:
|
222 |
+
contact_infos.push_to_hub(CONTACT_DATASET, config_name = YEAR_VERSION, token=TOKEN)
|
223 |
|
224 |
return format_log(f"Model {model} submitted by {organisation} successfully.\nPlease wait a few hours and refresh the leaderboard to see your score displayed.")
|
225 |
|