feat(bench): support zero-shot proposal writing (#910)

* update with zero-shot * update with zero-shot * update with zero-shot
ulab-uiuc · Nov 26, 2024 · 51fbad1 · 51fbad1
1 parent 5e7ac3c
commit 51fbad1
Show file tree

Hide file tree

Showing 3 changed files with 37 additions and 2 deletions.
diff --git a/research_bench/proposal_writing.py b/research_bench/proposal_writing.py
@@ -55,6 +55,38 @@ def write_proposal_researchtown(
         raise ValueError('Failed to generate proposal')
 
 
+def write_proposal_zero_shot(config: Config) -> str:
+    prompt = [
+        {
+            'role': 'user',
+            'content': (
+                'You are a AI researcher. Here is a high-level summarized insight of a research field Machine Learning.\n\n'
+                'Here are the five core questions:\n\n'
+                '[Question 1] - What is the problem?\n\n'
+                'Formulate the specific research question you aim to address. Only output one question and do not include any more information.\n\n'
+                '[Question 2] - Why is it interesting and important?\n\n'
+                'Explain the broader implications of solving this problem for the research community.\n'
+                'Discuss how such paper will affect the future research.\n'
+                'Discuss how addressing this question could advance knowledge or lead to practical applications.\n\n'
+                '[Question 3] - Why is it hard?\n\n'
+                'Discuss the challenges and complexities involved in solving this problem.\n'
+                'Explain why naive or straightforward approaches may fail.\n'
+                'Identify any technical, theoretical, or practical obstacles that need to be overcome. MAKE IT CLEAR.\n\n'
+                "[Question 4] - Why hasn't it been solved before?\n\n"
+                'Identify gaps or limitations in previous research or existing solutions.\n'
+                'Discuss any barriers that have prevented this problem from being solved until now.\n'
+                'Explain how your approach differs from or improves upon prior work. MAKE IT CLEAR.\n\n'
+                '[Question 5] - What are the key components of my approach and results?\n\n'
+                'Outline your proposed methodology in detail, including the method, dataset, metric that you plan to use.\n'
+                'Describe the expected outcomes. MAKE IT CLEAR.\n\n'
+                'Please provide the five core questions contents for a brand new future research that you think are the most promising one.'
+            ),
+        }
+    ]
+    response = model_prompting(config.param.base_llm, prompt)[0]
+    return response
+
+
 def write_proposal_with_only_profiles(profiles: List[Profile], config: Config) -> str:
     bio_strs = '\n'.join([profile.bio for profile in profiles])
 
@@ -291,7 +323,9 @@ def write_proposal(
     ref_contents: List[str],
     config: Config,
 ) -> str:
-    if mode == 'author_only':
+    if mode == 'zero_shot':
+        return write_proposal_zero_shot(config=config)
+    elif mode == 'author_only':
         return write_proposal_with_only_profiles(profiles=profiles, config=config)
     elif mode == 'citation_only':
         return write_proposal_with_only_citations(

diff --git a/research_bench/run_eval.py b/research_bench/run_eval.py
@@ -75,6 +75,7 @@ def main() -> None:
         type=str,
         required=True,
         choices=[
+            'zero_shot',
             'author_only',
             'citation_only',
             'author_citation',

diff --git a/research_bench/run_eval.sh b/research_bench/run_eval.sh
@@ -3,7 +3,7 @@
 # Define the input and output paths, along with the modes to test
 INPUT_PATH="./mlbench/mlbench.json"
 OUTPUT_DIR="./results"
-MODES=("sakana_ai_scientist") #("citation_only" "author_only" "author_citation")
+MODES=("citation_only")
 NUM_PROCESSES=4
 
 # Loop through each mode and run the evaluation