Skip to content

Commit b40b605

Browse files
authored
feat: add competition level filter and extract constants to utils (#869)
* feat: add competition level filter and extract constants to utils
* lint
1 parent c2c505f commit b40b605

File tree

2 files changed

+104
-28
lines changed

2 files changed

+104
-28
lines changed

rdagent/log/ui/ds_summary.py

Lines changed: 19 additions & 28 deletions
Original file line numberDiff line numberDiff line change
@@ -14,6 +14,7 @@
1414
from rdagent.log.mle_summary import extract_mle_json
1515
from rdagent.log.ui.conf import UI_SETTING
1616
from rdagent.log.ui.ds_trace import load_times
17+
from rdagent.log.ui.utils import ALL, HIGH, LITE, MEDIUM
1718
from rdagent.scenarios.kaggle.kaggle_crawler import leaderboard_scores
1819

1920

@@ -352,32 +353,6 @@ def mean_func(x: pd.DataFrame):
352353
st.dataframe(df)
353354

354355

355-
LITE = [
356-
"aerial-cactus-identification",
357-
"aptos2019-blindness-detection",
358-
"denoising-dirty-documents",
359-
"detecting-insults-in-social-commentary",
360-
"dog-breed-identification",
361-
"dogs-vs-cats-redux-kernels-edition",
362-
"histopathologic-cancer-detection",
363-
"jigsaw-toxic-comment-classification-challenge",
364-
"leaf-classification",
365-
"mlsp-2013-birds",
366-
"new-york-city-taxi-fare-prediction",
367-
"nomad2018-predict-transparent-conductors",
368-
"plant-pathology-2020-fgvc7",
369-
"random-acts-of-pizza",
370-
"ranzcr-clip-catheter-line-classification",
371-
"siim-isic-melanoma-classification",
372-
"spooky-author-identification",
373-
"tabular-playground-series-dec-2021",
374-
"tabular-playground-series-may-2022",
375-
"text-normalization-challenge-english-language",
376-
"text-normalization-challenge-russian-language",
377-
"the-icml-2013-whale-challenge-right-whale-redux",
378-
]
379-
380-
381356
def all_summarize_win():
382357
def shorten_folder_name(folder: str) -> str:
383358
if "amlt" in folder:
@@ -401,8 +376,24 @@ def shorten_folder_name(folder: str) -> str:
401376
base_df = percent_df(base_df)
402377
base_df.insert(0, "Select", True)
403378
bt1, bt2 = st.columns(2)
404-
if bt2.toggle("Select Lite Competitions", key="select_lite"):
405-
base_df["Select"] = base_df["Competition"].isin(LITE)
379+
select_lite_level = bt2.selectbox(
380+
"Select MLE-Bench Competitions Level",
381+
options=["ALL", "HIGH", "MEDIUM", "LITE"],
382+
index=0,
383+
key="select_lite_level",
384+
)
385+
if select_lite_level != "ALL":
386+
if select_lite_level == "HIGH":
387+
lite_set = set(HIGH)
388+
elif select_lite_level == "MEDIUM":
389+
lite_set = set(MEDIUM)
390+
elif select_lite_level == "LITE":
391+
lite_set = set(LITE)
392+
else:
393+
lite_set = set()
394+
base_df["Select"] = base_df["Competition"].isin(lite_set)
395+
else:
396+
base_df["Select"] = True # select all if ALL is chosen
406397

407398
if bt1.toggle("Select Best", key="select_best"):
408399

rdagent/log/ui/utils.py

Lines changed: 85 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,85 @@
"""Competition-name constants grouped by MLE-Bench level.

The summary UI offers the levels "ALL", "HIGH", "MEDIUM" and "LITE" and
selects the rows whose "Competition" value appears in the matching list.

Each constant is a plain ``list`` of ``str`` so callers can concatenate the
lists or wrap them in ``set(...)`` for membership tests.
"""

# Competitions in the LITE level (22 entries).
LITE = [
    "aerial-cactus-identification",
    "aptos2019-blindness-detection",
    "denoising-dirty-documents",
    "detecting-insults-in-social-commentary",
    "dog-breed-identification",
    "dogs-vs-cats-redux-kernels-edition",
    "histopathologic-cancer-detection",
    "jigsaw-toxic-comment-classification-challenge",
    "leaf-classification",
    "mlsp-2013-birds",
    "new-york-city-taxi-fare-prediction",
    "nomad2018-predict-transparent-conductors",
    "plant-pathology-2020-fgvc7",
    "random-acts-of-pizza",
    "ranzcr-clip-catheter-line-classification",
    "siim-isic-melanoma-classification",
    "spooky-author-identification",
    "tabular-playground-series-dec-2021",
    "tabular-playground-series-may-2022",
    "text-normalization-challenge-english-language",
    "text-normalization-challenge-russian-language",
    "the-icml-2013-whale-challenge-right-whale-redux",
]

# Competitions in the HIGH level (15 entries).
HIGH = [
    "3d-object-detection-for-autonomous-vehicles",
    "bms-molecular-translation",
    "google-research-identify-contrails-reduce-global-warming",
    "hms-harmful-brain-activity-classification",
    "iwildcam-2019-fgvc6",
    "nfl-player-contact-detection",
    "predict-volcanic-eruptions-ingv-oe",
    "rsna-2022-cervical-spine-fracture-detection",
    "rsna-breast-cancer-detection",
    "rsna-miccai-brain-tumor-radiogenomic-classification",
    "siim-covid19-detection",
    "smartphone-decimeter-2022",
    "stanford-covid-vaccine",
    "vesuvius-challenge-ink-detection",
    "vinbigdata-chest-xray-abnormalities-detection",
]

# Competitions in the MEDIUM level (38 entries).
MEDIUM = [
    "AI4Code",
    "alaska2-image-steganalysis",
    "billion-word-imputation",
    "cassava-leaf-disease-classification",
    "cdiscount-image-classification-challenge",
    "chaii-hindi-and-tamil-question-answering",
    "champs-scalar-coupling",
    "facebook-recruiting-iii-keyword-extraction",
    "freesound-audio-tagging-2019",
    "google-quest-challenge",
    "h-and-m-personalized-fashion-recommendations",
    "herbarium-2020-fgvc7",
    "herbarium-2021-fgvc8",
    "herbarium-2022-fgvc9",
    "hotel-id-2021-fgvc8",
    "hubmap-kidney-segmentation",
    "icecube-neutrinos-in-deep-ice",
    "imet-2020-fgvc7",
    "inaturalist-2019-fgvc6",
    "iwildcam-2020-fgvc7",
    "jigsaw-unintended-bias-in-toxicity-classification",
    "kuzushiji-recognition",
    "learning-agency-lab-automated-essay-scoring-2",
    "lmsys-chatbot-arena",
    "multi-modal-gesture-recognition",
    "osic-pulmonary-fibrosis-progression",
    "petfinder-pawpularity-score",
    "plant-pathology-2021-fgvc8",
    "seti-breakthrough-listen",
    "statoil-iceberg-classifier-challenge",
    "tensorflow-speech-recognition-challenge",
    "tensorflow2-question-answering",
    "tgs-salt-identification-challenge",
    "tweet-sentiment-extraction",
    "us-patent-phrase-to-phrase-matching",
    "uw-madison-gi-tract-image-segmentation",
    "ventilator-pressure-prediction",
    "whale-categorization-playground",
]

# Every competition across the three levels, ordered HIGH, then MEDIUM,
# then LITE. This is a new list; later mutation of a level list does not
# propagate here.
ALL = HIGH + MEDIUM + LITE

0 commit comments

Comments
 (0)