Spaces:

valbuc
/

GenCeption

Sleeping

Valentin Buchner committed on Mar 15, 2024

Commit

968c326

1 Parent(s): c951815

adjusted column width and sorting

Files changed (3) hide show

README.md CHANGED Viewed

@@ -1,5 +1,5 @@
 ---
-title: Genception Leaderboard
 emoji: 🔥
 colorFrom: red
 colorTo: green
@@ -7,6 +7,8 @@ sdk: gradio
 sdk_version: 4.19.2
 app_file: leaderboard/app.py
 pinned: true
 ---
 # GenCeption: Evaluate Multimodal LLMs with Unlabeled Unimodal Data

 ---
+title: GenCeption Leaderboard
 emoji: 🔥
 colorFrom: red
 colorTo: green
 sdk_version: 4.19.2
 app_file: leaderboard/app.py
 pinned: true
+short_description: The annotation-free MLLM evaluation benchmark.
+license: mit
 ---
 # GenCeption: Evaluate Multimodal LLMs with Unlabeled Unimodal Data

leaderboard/app.py CHANGED Viewed

@@ -39,6 +39,7 @@ def create_dataframe(data):
         rows.append(row)
     df = pd.DataFrame(rows)
     for col in df.columns:
         if "Mean" in col:
@@ -52,6 +53,7 @@ def update_display(show_all, df):
     legend_visibility = gr.update(visible=show_all)
     return filtered_df, legend_visibility
 update_data()
 demo = gr.Blocks()
 with demo:
@@ -60,7 +62,8 @@ with demo:
     gr.Markdown(INTRO, elem_classes="markdown-text")
     gr.Markdown(INTRO2, elem_classes="markdown-text")
     show_all_columns = gr.Checkbox(label="Show all datasets", value=True)
-    data_display = gr.Dataframe(df, datatype="markdown")
     legend_accordion = gr.Accordion("Legend:", open=False, visible=True)
     with legend_accordion:

         rows.append(row)
     df = pd.DataFrame(rows)
+    df = df.sort_values(by="Mean", ascending=False)
     for col in df.columns:
         if "Mean" in col:
     legend_visibility = gr.update(visible=show_all)
     return filtered_df, legend_visibility
 update_data()
 demo = gr.Blocks()
 with demo:
     gr.Markdown(INTRO, elem_classes="markdown-text")
     gr.Markdown(INTRO2, elem_classes="markdown-text")
     show_all_columns = gr.Checkbox(label="Show all datasets", value=True)
+    column_widths = ["125px"] + [None] * (len(df.columns) - 1)
+    data_display = gr.Dataframe(df, datatype="markdown", column_widths=column_widths)
     legend_accordion = gr.Accordion("Legend:", open=False, visible=True)
     with legend_accordion:

leaderboard/leaderboard.json CHANGED Viewed

@@ -1,5 +1,28 @@
 {
     "models": [
       {
         "name": "ChatGPT-4V",
         "url": "https://cdn.openai.com/papers/GPTV_System_Card.pdf",

 {
     "models": [
+      {
+        "name": "Claude3-Opus",
+        "url": "https://www.anthropic.com/news/claude-3-family",
+        "scores": {
+          "Mean": 0.340,
+          "Exist": 0.382,
+          "Count": 0.348,
+          "Posi": 0.357,
+          "Col": 0.385,
+          "Post": 0.360,
+          "Cel": 0.317,
+          "Sce": 0.374,
+          "Lan": 0.344,
+          "Art": 0.385,
+          "Comm": 0.432,
+          "VisMean": 0.368,
+          "Code": 0.245,
+          "Num": 0.229,
+          "Tran": 0.236,
+          "OCR": 0.362,
+          "TextMean": 0.268
+        }
+      },
       {
         "name": "ChatGPT-4V",
         "url": "https://cdn.openai.com/papers/GPTV_System_Card.pdf",