Spaces:
Running
Running
Commit
·
fc0a17a
1
Parent(s):
74cd82e
Please work!!
Browse files
- Assests/MLRC_Bench_overview.png +2 -2
- src/components/tasks.py +2 -1
- src/utils/config.py +3 -1
Assests/MLRC_Bench_overview.png
CHANGED
|
Git LFS Details
|
|
Git LFS Details
|
src/components/tasks.py
CHANGED
|
@@ -70,7 +70,8 @@ While current results suggest that LLM-based research agents still fall short of
|
|
| 70 |
"Perception Temporal Action Loc": "https://ptchallenge-workshop.github.io",
|
| 71 |
"Product Recommendation": "https://www.aicrowd.com/challenges/amazon-kdd-cup-23-multilingual-recommendation-challenge",
|
| 72 |
"Meta Learning": "https://metalearning.chalearn.org/",
|
| 73 |
-
"Llm Merging": "https://llm-merging.github.io"
|
|
|
|
| 74 |
}
|
| 75 |
|
| 76 |
# Update links mapping to use display names as keys
|
|
|
|
| 70 |
"Perception Temporal Action Loc": "https://ptchallenge-workshop.github.io",
|
| 71 |
"Product Recommendation": "https://www.aicrowd.com/challenges/amazon-kdd-cup-23-multilingual-recommendation-challenge",
|
| 72 |
"Meta Learning": "https://metalearning.chalearn.org/",
|
| 73 |
+
"Llm Merging": "https://llm-merging.github.io",
|
| 74 |
+
"Rainfall Prediction": "https://weather4cast.net/neurips-2023/"
|
| 75 |
}
|
| 76 |
|
| 77 |
# Update links mapping to use display names as keys
|
src/utils/config.py
CHANGED
|
@@ -100,5 +100,7 @@ tasks_info = {
|
|
| 100 |
task_display_names.get("Machine Unlearning", "Machine Unlearning"):
|
| 101 |
"Evaluating how well models can 'unlearn' specific information when required.",
|
| 102 |
task_display_names.get("Backdoor Trigger Recovery", "Backdoor Trigger Recovery"):
|
| 103 |
-
"Testing resilience against backdoor attacks and ability to recover from triggered behaviors."
|
|
|
|
|
|
|
| 104 |
}
|
|
|
|
| 100 |
task_display_names.get("Machine Unlearning", "Machine Unlearning"):
|
| 101 |
"Evaluating how well models can 'unlearn' specific information when required.",
|
| 102 |
task_display_names.get("Backdoor Trigger Recovery", "Backdoor Trigger Recovery"):
|
| 103 |
+
"Testing resilience against backdoor attacks and ability to recover from triggered behaviors.",
|
| 104 |
+
task_display_names.get("Rainfall Prediction", "Rainfall Prediction"):
|
| 105 |
+
"Testing the model's ability to predict rainfall based on historical data and weather patterns."
|
| 106 |
}
|