Spaces:

gaia-benchmark
/

leaderboard

Running on CPU Upgrade

Clémentine committed 14 days ago

Commit

ce98da8

1 Parent(s): f278160

forbid duplicates

Files changed (1) hide show

app.py CHANGED Viewed

@@ -106,6 +106,7 @@ def add_new_eval(
     file_path = path_to_file.name
     scores = {"all": 0, 1: 0, 2: 0, 3: 0}
     num_questions = {"all": 0, 1: 0, 2: 0, 3: 0}
     with open(f"scored/{organisation}_{model}.jsonl", "w") as scored_file:
         with open(file_path, 'r') as f:
             for ix, line in enumerate(f):
@@ -133,12 +134,17 @@ def add_new_eval(
                         "level": level
                     }) + "\n"
                 )
                 scores["all"] += score
                 scores[level] += score
                 num_questions["all"] += 1
                 num_questions[level] += 1
     # Save scored file
     api.upload_file(
         repo_id=SUBMISSION_DATASET,
@@ -165,7 +171,7 @@ def add_new_eval(
         "system_prompt": system_prompt,
         "url": url,
         "organisation": organisation,
-        "score": scores["all"]/num_questions["all"],
         "score_level1": scores[1]/num_questions[1],
         "score_level2": scores[2]/num_questions[2],
         "score_level3": scores[3]/num_questions[3],

     file_path = path_to_file.name
     scores = {"all": 0, 1: 0, 2: 0, 3: 0}
     num_questions = {"all": 0, 1: 0, 2: 0, 3: 0}
+    task_ids = []
     with open(f"scored/{organisation}_{model}.jsonl", "w") as scored_file:
         with open(file_path, 'r') as f:
             for ix, line in enumerate(f):
                         "level": level
                     }) + "\n"
                 )
+                task_ids.append(task_id)
                 scores["all"] += score
                 scores[level] += score
                 num_questions["all"] += 1
                 num_questions[level] += 1
+    # Check if there's any duplicate in the submission
+    if len(task_ids) != len(set(task_ids)):
+        return format_error("There are duplicates in your submission. Please check your file and resubmit it.")
     # Save scored file
     api.upload_file(
         repo_id=SUBMISSION_DATASET,
         "system_prompt": system_prompt,
         "url": url,
         "organisation": organisation,
+        "score": scores["all"]/ref_scores_len,
         "score_level1": scores[1]/num_questions[1],
         "score_level2": scores[2]/num_questions[2],
         "score_level3": scores[3]/num_questions[3],