gremlin97 committed on
Commit
f5ff4ae
·
1 Parent(s): b7e427f

Update to new Mars-Bench dataset structure with Author field

Browse files
Files changed (4) hide show
  1. app.py +19 -19
  2. data/classification.csv +10 -16
  3. data/detection.csv +4 -16
  4. data/segmentation.csv +9 -16
app.py CHANGED
@@ -49,7 +49,7 @@ def build_tab(df, name):
49
  datasets = sorted(df["Dataset"].unique().tolist())
50
  models = sorted(df["Model"].unique().tolist())
51
  organizations = sorted(df["Organization"].unique().tolist())
52
- metric_cols = [col for col in df.columns if col not in ["Model", "Organization", "Dataset", "First Author", "Author Link"]]
53
 
54
  # Create pivoted dataframe
55
  pivoted_data = []
@@ -57,17 +57,17 @@ def build_tab(df, name):
57
  for org in organizations:
58
  model_org_data = df[(df["Model"] == model) & (df["Organization"] == org)]
59
  if not model_org_data.empty:
60
- # Get First Author and Author Link from the first entry (they should be the same for model+org)
61
- first_author = model_org_data["First Author"].values[0]
62
  author_link = model_org_data["Author Link"].values[0]
63
 
64
  # Format as markdown link if author_link exists
65
  if pd.notna(author_link) and author_link.strip():
66
- author_display = f"[{first_author}]({author_link})"
67
  else:
68
- author_display = first_author
69
 
70
- row = {"Model": model, "Organization": org, "First Author": author_display}
71
  for dataset in datasets:
72
  dataset_data = model_org_data[model_org_data["Dataset"] == dataset]
73
  if not dataset_data.empty:
@@ -88,7 +88,7 @@ def build_tab(df, name):
88
  for metric in metric_cols:
89
  metric_combo_cols.append(f"{dataset} ({metric})")
90
 
91
- all_cols = ["Model", "Organization", "First Author"] + metric_combo_cols
92
 
93
  with gr.TabItem(name, elem_id="llm-benchmark-tab-table"):
94
  with gr.Row():
@@ -100,7 +100,7 @@ def build_tab(df, name):
100
  )
101
 
102
  # Column selector for base columns only (not dataset+metric combos)
103
- base_cols = ["Model", "Organization", "First Author"]
104
  col_selector = gr.CheckboxGroup(
105
  choices=base_cols,
106
  value=base_cols,
@@ -108,10 +108,10 @@ def build_tab(df, name):
108
  elem_classes="column-select"
109
  )
110
 
111
- # Set datatype to 'markdown' for First Author column to enable clickable links
112
  datatypes = []
113
  for col in pivoted_df.columns:
114
- if col == "First Author":
115
  datatypes.append("markdown")
116
  else:
117
  datatypes.append("str")
@@ -246,7 +246,7 @@ custom_css = """
246
  min-width: 120px;
247
  }
248
 
249
- /* Style links in First Author column */
250
  #leaderboard-table a {
251
  color: #0066cc;
252
  text-decoration: none;
@@ -354,10 +354,10 @@ with demo:
354
  )
355
 
356
  with gr.Column():
357
- submit_first_author = gr.Textbox(
358
- label="First Author",
359
  placeholder="e.g., K. He",
360
- info="Name of the first author"
361
  )
362
  submit_author_link = gr.Textbox(
363
  label="Author Page Link (Optional)",
@@ -404,9 +404,9 @@ with demo:
404
  We'll review your submission and add it to the leaderboard if approved.
405
  """)
406
 
407
- def generate_submission_text(task, model, org, dataset, first_author, author_link, metrics, paper, code, email, notes):
408
- if not all([task, model, org, dataset, first_author, metrics, email]):
409
- return "❌ Error: Please fill in all required fields (Task Type, Model Name, Organization, Dataset, First Author, Metrics, Contact Email)"
410
 
411
  submission_text = f"""## New Model Submission
412
 
@@ -414,7 +414,7 @@ with demo:
414
  **Model Name:** {model}
415
  **Organization:** {org}
416
  **Dataset:** {dataset}
417
- **First Author:** {first_author}
418
  **Author Page Link:** {author_link if author_link else "N/A"}
419
 
420
  ### Metrics
@@ -439,7 +439,7 @@ with demo:
439
 
440
  generate_btn.click(
441
  generate_submission_text,
442
- inputs=[submit_task, submit_model, submit_org, submit_dataset, submit_first_author,
443
  submit_author_link, submit_metrics, submit_paper, submit_code, submit_email, submit_notes],
444
  outputs=submission_output
445
  )
 
49
  datasets = sorted(df["Dataset"].unique().tolist())
50
  models = sorted(df["Model"].unique().tolist())
51
  organizations = sorted(df["Organization"].unique().tolist())
52
+ metric_cols = [col for col in df.columns if col not in ["Model", "Organization", "Dataset", "Author", "Author Link"]]
53
 
54
  # Create pivoted dataframe
55
  pivoted_data = []
 
57
  for org in organizations:
58
  model_org_data = df[(df["Model"] == model) & (df["Organization"] == org)]
59
  if not model_org_data.empty:
60
+ # Get Author and Author Link from the first entry (they should be the same for model+org)
61
+ author = model_org_data["Author"].values[0]
62
  author_link = model_org_data["Author Link"].values[0]
63
 
64
  # Format as markdown link if author_link exists
65
  if pd.notna(author_link) and author_link.strip():
66
+ author_display = f"[{author}]({author_link})"
67
  else:
68
+ author_display = author
69
 
70
+ row = {"Model": model, "Organization": org, "Author": author_display}
71
  for dataset in datasets:
72
  dataset_data = model_org_data[model_org_data["Dataset"] == dataset]
73
  if not dataset_data.empty:
 
88
  for metric in metric_cols:
89
  metric_combo_cols.append(f"{dataset} ({metric})")
90
 
91
+ all_cols = ["Model", "Organization", "Author"] + metric_combo_cols
92
 
93
  with gr.TabItem(name, elem_id="llm-benchmark-tab-table"):
94
  with gr.Row():
 
100
  )
101
 
102
  # Column selector for base columns only (not dataset+metric combos)
103
+ base_cols = ["Model", "Organization", "Author"]
104
  col_selector = gr.CheckboxGroup(
105
  choices=base_cols,
106
  value=base_cols,
 
108
  elem_classes="column-select"
109
  )
110
 
111
+ # Set datatype to 'markdown' for Author column to enable clickable links
112
  datatypes = []
113
  for col in pivoted_df.columns:
114
+ if col == "Author":
115
  datatypes.append("markdown")
116
  else:
117
  datatypes.append("str")
 
246
  min-width: 120px;
247
  }
248
 
249
+ /* Style links in Author column */
250
  #leaderboard-table a {
251
  color: #0066cc;
252
  text-decoration: none;
 
354
  )
355
 
356
  with gr.Column():
357
+ submit_author = gr.Textbox(
358
+ label="Author",
359
  placeholder="e.g., K. He",
360
+ info="Name of the author"
361
  )
362
  submit_author_link = gr.Textbox(
363
  label="Author Page Link (Optional)",
 
404
  We'll review your submission and add it to the leaderboard if approved.
405
  """)
406
 
407
+ def generate_submission_text(task, model, org, dataset, author, author_link, metrics, paper, code, email, notes):
408
+ if not all([task, model, org, dataset, author, metrics, email]):
409
+ return "❌ Error: Please fill in all required fields (Task Type, Model Name, Organization, Dataset, Author, Metrics, Contact Email)"
410
 
411
  submission_text = f"""## New Model Submission
412
 
 
414
  **Model Name:** {model}
415
  **Organization:** {org}
416
  **Dataset:** {dataset}
417
+ **Author:** {author}
418
  **Author Page Link:** {author_link if author_link else "N/A"}
419
 
420
  ### Metrics
 
439
 
440
  generate_btn.click(
441
  generate_submission_text,
442
+ inputs=[submit_task, submit_model, submit_org, submit_dataset, submit_author,
443
  submit_author_link, submit_metrics, submit_paper, submit_code, submit_email, submit_notes],
444
  outputs=submission_output
445
  )
data/classification.csv CHANGED
@@ -1,16 +1,10 @@
1
- Model,Organization,Dataset,Accuracy,F1-Score,First Author,Author Link
2
- ResNet-50,Microsoft,DoMars16,92.5,91.8,K. He,https://kaiminghe.github.io/
3
- ViT-Base,Google,DoMars16,94.2,93.5,A. Dosovitskiy,https://scholar.google.com/citations?user=UfvnhKcAAAAJ
4
- Swin-T,Microsoft,DoMars16,95.8,94.9,Z. Liu,https://scholar.google.com/citations?user=nHh9PSsAAAAJ
5
- InceptionV3,Google,DoMars16,93.1,92.4,C. Szegedy,https://scholar.google.com/citations?user=3QeF7mAAAAAJ
6
- SqueezeNet,DeepMind,DoMars16,89.7,88.6,F. Iandola,https://scholar.google.com/citations?user=LvWAIwUAAAAJ
7
- ResNet-50,Microsoft,Atmospheric Dust,88.3,87.5,K. He,https://kaiminghe.github.io/
8
- ViT-Base,Google,Atmospheric Dust,90.1,89.2,A. Dosovitskiy,https://scholar.google.com/citations?user=UfvnhKcAAAAJ
9
- Swin-T,Microsoft,Atmospheric Dust,91.5,90.7,Z. Liu,https://scholar.google.com/citations?user=nHh9PSsAAAAJ
10
- InceptionV3,Google,Atmospheric Dust,89.8,88.9,C. Szegedy,https://scholar.google.com/citations?user=3QeF7mAAAAAJ
11
- SqueezeNet,DeepMind,Atmospheric Dust,87.2,86.3,F. Iandola,https://scholar.google.com/citations?user=LvWAIwUAAAAJ
12
- ResNet-50,Microsoft,Martian Frost,85.6,84.8,K. He,https://kaiminghe.github.io/
13
- ViT-Base,Google,Martian Frost,87.9,86.9,A. Dosovitskiy,https://scholar.google.com/citations?user=UfvnhKcAAAAJ
14
- Swin-T,Microsoft,Martian Frost,88.4,87.5,Z. Liu,https://scholar.google.com/citations?user=nHh9PSsAAAAJ
15
- InceptionV3,Google,Martian Frost,86.7,85.8,C. Szegedy,https://scholar.google.com/citations?user=3QeF7mAAAAAJ
16
- SqueezeNet,DeepMind,Martian Frost,84.3,83.4,F. Iandola,https://scholar.google.com/citations?user=LvWAIwUAAAAJ
 
1
+ Model,Organization,Dataset,Accuracy,F1-Score,Author,Author Link
2
+ Under Construction,Under Construction,atmospheric_dust_cls_edr,Under Construction,Under Construction,Under Construction,
3
+ Under Construction,Under Construction,atmospheric_dust_cls_rdr,Under Construction,Under Construction,Under Construction,
4
+ Under Construction,Under Construction,change_cls_ctx,Under Construction,Under Construction,Under Construction,
5
+ Under Construction,Under Construction,change_cls_hirise,Under Construction,Under Construction,Under Construction,
6
+ Under Construction,Under Construction,domars16k,Under Construction,Under Construction,Under Construction,
7
+ Under Construction,Under Construction,frost_cls,Under Construction,Under Construction,Under Construction,
8
+ Under Construction,Under Construction,landmark_cls,Under Construction,Under Construction,Under Construction,
9
+ Under Construction,Under Construction,surface_cls,Under Construction,Under Construction,Under Construction,
10
+ Under Construction,Under Construction,surface_multi_label_cls,Under Construction,Under Construction,Under Construction,
 
 
 
 
 
 
data/detection.csv CHANGED
@@ -1,16 +1,4 @@
1
- Model,Organization,Dataset,mAP,IoU,First Author,Author Link
2
- Faster R-CNN,Meta,Mars Crater,78.5,0.72,S. Ren,https://scholar.google.com/citations?user=L_hq4a0AAAAJ
3
- YOLOv5,Ultralytics,Mars Crater,80.2,0.74,G. Jocher,https://github.com/glenn-jocher
4
- DETR,Meta,Mars Crater,82.1,0.76,N. Carion,https://scholar.google.com/citations?user=p1wMCUUAAAAJ
5
- RetinaNet,Meta,Mars Crater,79.3,0.73,T. Lin,https://scholar.google.com/citations?user=7zQoaFkAAAAJ
6
- SSD,Google,Mars Crater,77.8,0.71,W. Liu,https://scholar.google.com/citations?user=PQ7QBjYAAAAJ
7
- Faster R-CNN,Meta,Rover Component,75.6,0.69,S. Ren,https://scholar.google.com/citations?user=L_hq4a0AAAAJ
8
- YOLOv5,Ultralytics,Rover Component,77.3,0.71,G. Jocher,https://github.com/glenn-jocher
9
- DETR,Meta,Rover Component,78.9,0.73,N. Carion,https://scholar.google.com/citations?user=p1wMCUUAAAAJ
10
- RetinaNet,Meta,Rover Component,76.7,0.70,T. Lin,https://scholar.google.com/citations?user=7zQoaFkAAAAJ
11
- SSD,Google,Rover Component,75.1,0.68,W. Liu,https://scholar.google.com/citations?user=PQ7QBjYAAAAJ
12
- Faster R-CNN,Meta,Geological Feature,73.4,0.67,S. Ren,https://scholar.google.com/citations?user=L_hq4a0AAAAJ
13
- YOLOv5,Ultralytics,Geological Feature,75.1,0.69,G. Jocher,https://github.com/glenn-jocher
14
- DETR,Meta,Geological Feature,76.7,0.71,N. Carion,https://scholar.google.com/citations?user=p1wMCUUAAAAJ
15
- RetinaNet,Meta,Geological Feature,74.5,0.68,T. Lin,https://scholar.google.com/citations?user=7zQoaFkAAAAJ
16
- SSD,Google,Geological Feature,73.0,0.67,W. Liu,https://scholar.google.com/citations?user=PQ7QBjYAAAAJ
 
1
+ Model,Organization,Dataset,mAP,IoU,Author,Author Link
2
+ Under Construction,Under Construction,boulder_det,Under Construction,Under Construction,Under Construction,
3
+ Under Construction,Under Construction,conequest_det,Under Construction,Under Construction,Under Construction,
4
+ Under Construction,Under Construction,dust_devil_det,Under Construction,Under Construction,Under Construction,
 
 
 
 
 
 
 
 
 
 
 
 
data/segmentation.csv CHANGED
@@ -1,16 +1,9 @@
1
- Model,Organization,Dataset,Dice Score,IoU,First Author,Author Link
2
- U-Net,OpenAI,Mars Terrain,0.85,0.74,O. Ronneberger,https://scholar.google.com/citations?user=MXXkjXkAAAAJ
3
- DeepLabV3+,Google,Mars Terrain,0.87,0.76,L. Chen,https://scholar.google.com/citations?user=WicCTRsAAAAJ
4
- Mask R-CNN,Meta,Mars Terrain,0.88,0.78,K. He,https://kaiminghe.github.io/
5
- SegFormer,NVIDIA,Mars Terrain,0.86,0.75,E. Xie,https://scholar.google.com/citations?user=txgkZ0kAAAAJ
6
- HRNet,Microsoft,Mars Terrain,0.84,0.73,J. Wang,https://scholar.google.com/citations?user=aYKQn88AAAAJ
7
- U-Net,OpenAI,Dust Storm,0.82,0.70,O. Ronneberger,https://scholar.google.com/citations?user=MXXkjXkAAAAJ
8
- DeepLabV3+,Google,Dust Storm,0.84,0.72,L. Chen,https://scholar.google.com/citations?user=WicCTRsAAAAJ
9
- Mask R-CNN,Meta,Dust Storm,0.85,0.74,K. He,https://kaiminghe.github.io/
10
- SegFormer,NVIDIA,Dust Storm,0.83,0.71,E. Xie,https://scholar.google.com/citations?user=txgkZ0kAAAAJ
11
- HRNet,Microsoft,Dust Storm,0.82,0.70,J. Wang,https://scholar.google.com/citations?user=aYKQn88AAAAJ
12
- U-Net,OpenAI,Geological Feature,0.81,0.68,O. Ronneberger,https://scholar.google.com/citations?user=MXXkjXkAAAAJ
13
- DeepLabV3+,Google,Geological Feature,0.83,0.70,L. Chen,https://scholar.google.com/citations?user=WicCTRsAAAAJ
14
- Mask R-CNN,Meta,Geological Feature,0.84,0.72,K. He,https://kaiminghe.github.io/
15
- SegFormer,NVIDIA,Geological Feature,0.82,0.69,E. Xie,https://scholar.google.com/citations?user=txgkZ0kAAAAJ
16
- HRNet,Microsoft,Geological Feature,0.81,0.68,J. Wang,https://scholar.google.com/citations?user=aYKQn88AAAAJ
 
1
+ Model,Organization,Dataset,Dice Score,IoU,Author,Author Link
2
+ Under Construction,Under Construction,boulder_seg,Under Construction,Under Construction,Under Construction,
3
+ Under Construction,Under Construction,conequest_seg,Under Construction,Under Construction,Under Construction,
4
+ Under Construction,Under Construction,crater_binary_seg,Under Construction,Under Construction,Under Construction,
5
+ Under Construction,Under Construction,crater_multi_seg,Under Construction,Under Construction,Under Construction,
6
+ Under Construction,Under Construction,mars_seg_mer,Under Construction,Under Construction,Under Construction,
7
+ Under Construction,Under Construction,mars_seg_msl,Under Construction,Under Construction,Under Construction,
8
+ Under Construction,Under Construction,mmls,Under Construction,Under Construction,Under Construction,
9
+ Under Construction,Under Construction,s5mars,Under Construction,Under Construction,Under Construction,