Spaces:

snap-stanford
/

stark-leaderboard

Running

App Files Community

Shiyu Zhao committed on Oct 24, 2024

Commit

be954af

1 Parent(s): 86d5a63

Update space

Browse files

Files changed (12) hide show

app.py +12 -11
submissions/ance_test2_tester2/latest.json +0 -6
submissions/ance_test2_tester2/metadata_20241024_043111.json +0 -21
submissions/ance_test2_tester2/metadata_20241024_044359.json +0 -21
submissions/ance_test2_tester2/predictions_20241024_043111.csv +0 -0
submissions/ance_test2_tester2/predictions_20241024_044359.csv +0 -0
submissions/ance_test3_tester3/latest.json +0 -6
submissions/ance_test3_tester3/metadata_20241024_051521.json +0 -21
submissions/ance_test3_tester3/predictions_20241024_051521.csv +0 -0
submissions/ance_test_tester1/latest.json +0 -6
submissions/ance_test_tester1/metadata_20241024_004918.json +0 -20
submissions/ance_test_tester1/predictions_20241024_004918.csv +0 -0

app.py CHANGED Viewed

@@ -876,7 +876,7 @@ with gr.Blocks(css=css) as demo:
     gr.Markdown("## Submit Your Results")
     gr.Markdown("""
     Submit your results to be included in the leaderboard. Please ensure your submission meets all requirements.
-    For questions, contact stark-qa@cs.stanford.edu
     """)
     with gr.Row():
@@ -885,10 +885,6 @@ with gr.Blocks(css=css) as demo:
                 label="Method Name (max 25 chars)*",
                 placeholder="e.g., MyRetrievalModel-v1"
             )
-            team_name = gr.Textbox(
-                label="Team Name (max 25 chars)*",
-                placeholder="e.g., Stanford NLP"
-            )
             dataset = gr.Dropdown(
                 choices=["amazon", "mag", "prime"],
                 label="Dataset*",
@@ -899,6 +895,10 @@ with gr.Blocks(css=css) as demo:
                 label="Split*",
                 value="test"
             )
             contact_email = gr.Textbox(
                 label="Contact Email(s)*",
                 placeholder="email@example.com; another@example.com"
@@ -909,6 +909,9 @@ with gr.Blocks(css=css) as demo:
                 value="Others",
                 info="Select the appropriate category for your model"
             )
             model_description = gr.Textbox(
                 label="Model Description*",
                 lines=3,
@@ -918,17 +921,15 @@ with gr.Blocks(css=css) as demo:
                 label="Code Repository*",
                 placeholder="https://github.com/snap-stanford/stark-leaderboard"
             )
-        with gr.Column():
             csv_file = gr.File(
                 label="Prediction CSV*",
                 file_types=[".csv"],
                 type="filepath"
             )
-            hardware = gr.Textbox(
-                label="Hardware Specifications*",
-                placeholder="e.g., 4x NVIDIA A100 80GB"
-            )
             paper_link = gr.Textbox(
                 label="Paper Link (Optional)",
                 placeholder="https://arxiv.org/abs/..."

     gr.Markdown("## Submit Your Results")
     gr.Markdown("""
     Submit your results to be included in the leaderboard. Please ensure your submission meets all requirements.
+    For questions, contact stark-qa@cs.stanford.edu. Detailed instructions can be found in the [submission instructions](https://docs.google.com/document/d/11coGjTmOEi9p9-PUq1oy0eTOj8f_8CVQhDl5_0FKT14/edit?usp=sharing).
     """)
     with gr.Row():
                 label="Method Name (max 25 chars)*",
                 placeholder="e.g., MyRetrievalModel-v1"
             )
             dataset = gr.Dropdown(
                 choices=["amazon", "mag", "prime"],
                 label="Dataset*",
                 label="Split*",
                 value="test"
             )
+            team_name = gr.Textbox(
+                label="Team Name (max 25 chars)*",
+                placeholder="e.g., Stanford NLP"
+            )
             contact_email = gr.Textbox(
                 label="Contact Email(s)*",
                 placeholder="email@example.com; another@example.com"
                 value="Others",
                 info="Select the appropriate category for your model"
             )
+        with gr.Column():
             model_description = gr.Textbox(
                 label="Model Description*",
                 lines=3,
                 label="Code Repository*",
                 placeholder="https://github.com/snap-stanford/stark-leaderboard"
             )
+            hardware = gr.Textbox(
+                label="Hardware Specifications*",
+                placeholder="e.g., 4x NVIDIA A100 80GB"
+            )
             csv_file = gr.File(
                 label="Prediction CSV*",
                 file_types=[".csv"],
                 type="filepath"
             )
             paper_link = gr.Textbox(
                 label="Paper Link (Optional)",
                 placeholder="https://arxiv.org/abs/..."

submissions/ance_test2_tester2/latest.json DELETED Viewed

@@ -1,6 +0,0 @@
-{
-    "latest_submission": "20241024_044359",
-    "status": "approved",
-    "method_name": "ance-test2",
-    "team_name": "tester2"
-}

submissions/ance_test2_tester2/metadata_20241024_043111.json DELETED Viewed

@@ -1,21 +0,0 @@
-{
-    "Method Name": "ance_test2",
-    "Team Name": "tester2",
-    "Dataset": "amazon",
-    "Split": "human_generated_eval",
-    "Contact Email(s)": "shiyuz@stanford.edu",
-    "Code Repository": "https://github.com/snap-stanford/stark",
-    "Model Description": "test",
-    "Hardware": "a100",
-    "(Optional) Paper link": "",
-    "Model Type": "Others",
-    "results": {
-        "hit@1": 25.93,
-        "hit@5": 54.32,
-        "recall@20": 23.69,
-        "mrr": 37.08
-    },
-    "status": "approved",
-    "submission_date": "2024-10-24 04:32:14",
-    "csv_path": "submissions/ance_test2_tester2/predictions_20241024_043111.csv"
-}

submissions/ance_test2_tester2/metadata_20241024_044359.json DELETED Viewed

@@ -1,21 +0,0 @@
-{
-    "Method Name": "ance-test2",
-    "Team Name": "tester2",
-    "Dataset": "amazon",
-    "Split": "human_generated_eval",
-    "Contact Email(s)": "shiyuz@stanford.edu",
-    "Code Repository": "https://github.com/snap-stanford/stark",
-    "Model Description": "tester2",
-    "Hardware": "a100",
-    "(Optional) Paper link": "",
-    "Model Type": "Others",
-    "results": {
-        "hit@1": 25.93,
-        "hit@5": 54.32,
-        "recall@20": 23.69,
-        "mrr": 37.08
-    },
-    "status": "approved",
-    "submission_date": "2024-10-24 04:44:32",
-    "csv_path": "submissions/ance_test2_tester2/predictions_20241024_044359.csv"
-}

submissions/ance_test2_tester2/predictions_20241024_043111.csv DELETED Viewed

The diff for this file is too large to render. See raw diff

submissions/ance_test2_tester2/predictions_20241024_044359.csv DELETED Viewed

The diff for this file is too large to render. See raw diff

submissions/ance_test3_tester3/latest.json DELETED Viewed

@@ -1,6 +0,0 @@
-{
-    "latest_submission": "20241024_051521",
-    "status": "approved",
-    "method_name": "ance-test3",
-    "team_name": "tester3"
-}

submissions/ance_test3_tester3/metadata_20241024_051521.json DELETED Viewed

@@ -1,21 +0,0 @@
-{
-    "Method Name": "ance-test3",
-    "Team Name": "tester3",
-    "Dataset": "amazon",
-    "Split": "human_generated_eval",
-    "Contact Email(s)": "shiyuz@stanford.edu",
-    "Code Repository": "https://huggingface.co/spaces/snap-stanford/stark-leaderboard",
-    "Model Description": "tester3",
-    "Hardware": "tester3",
-    "(Optional) Paper link": "",
-    "Model Type": "Small Dense Retrievers",
-    "results": {
-        "hit@1": 25.93,
-        "hit@5": 54.32,
-        "recall@20": 23.69,
-        "mrr": 37.08
-    },
-    "status": "approved",
-    "submission_date": "2024-10-24 05:15:52",
-    "csv_path": "submissions/ance_test3_tester3/predictions_20241024_051521.csv"
-}

submissions/ance_test3_tester3/predictions_20241024_051521.csv DELETED Viewed

The diff for this file is too large to render. See raw diff

submissions/ance_test_tester1/latest.json DELETED Viewed

@@ -1,6 +0,0 @@
-{
-    "latest_submission": "20241024_004918",
-    "status": "approved",
-    "method_name": "ance-test",
-    "team_name": "tester1"
-}

submissions/ance_test_tester1/metadata_20241024_004918.json DELETED Viewed

@@ -1,20 +0,0 @@
-{
-    "Method Name": "ance-test",
-    "Team Name": "tester1",
-    "Dataset": "amazon",
-    "Split": "human_generated_eval",
-    "Contact Email(s)": "shiyuz@stanford.edu",
-    "Code Repository": "https://github.com/snap-stanford/stark",
-    "Model Description": "tester1",
-    "Hardware": "a100",
-    "(Optional) Paper link": "",
-    "results": {
-        "hit@1": 25.93,
-        "hit@5": 54.32,
-        "recall@20": 23.69,
-        "mrr": 37.08
-    },
-    "status": "approved",
-    "submission_date": "2024-10-24 00:49:49",
-    "csv_path": "submissions/ance_test_tester1/predictions_20241024_004918.csv"
-}

submissions/ance_test_tester1/predictions_20241024_004918.csv DELETED Viewed

The diff for this file is too large to render. See raw diff