[Fix] use new prompt

open-compass · Nov 30, 2023 · b35d117 · b35d117
1 parent e51f46f
commit b35d117
Show file tree

Hide file tree

Showing 3 changed files with 72 additions and 110 deletions.
diff --git a/configs/datasets/gsm8k/gsm8k_gen_3ac57d.py b/configs/datasets/gsm8k/gsm8k_gen_3ac57d.py
@@ -0,0 +1,55 @@
+from opencompass.openicl.icl_prompt_template import PromptTemplate
+from opencompass.openicl.icl_retriever import ZeroRetriever
+from opencompass.openicl.icl_inferencer import AgentInferencer
+from opencompass.datasets import (
+    GSM8KDataset,
+    gsm8k_postprocess,
+    gsm8k_dataset_postprocess,
+    Gsm8kAgentEvaluator,
+)
+
+gsm8k_reader_cfg = dict(input_columns=["question"], output_column="answer")
+
+gsm8k_infer_cfg = dict(
+    prompt_template=dict(
+        type=PromptTemplate,
+        template=dict(
+            round=[
+                # # ################################### NEW SHOT ###################################
+                dict(role='HUMAN', prompt='Mark\'s basketball team scores 25 2 pointers, 8 3 pointers and 10 free throws.  Their opponents score double the 2 pointers but half the 3 pointers and free throws.  What\'s the total number of points scored by both teams added together?'),
+                dict(role='BOT', prompt='Tool:PythonInterpreter\nTool Input:def solution():\n    mark_pointers_2 = 25 * 2\n    mark_pointers_3 = 8 * 3\n    mark_free_throws = 10 * 1\n    mark_points_scored = mark_pointers_2 + mark_pointers_3 + mark_free_throws\n    opponents_pointers_2 = mark_pointers_2 * 2\n    opponents_pointers_3 = mark_pointers_3 / 2\n    opponents_free_throws = mark_free_throws / 2\n    opponents_points_scored = opponents_pointers_2 + opponents_pointers_3 + opponents_free_throws\n    total_points_scored = mark_points_scored + opponents_points_scored\n    result = total_points_scored\n    return result'),
+                dict(role='SYSTEM', prompt='Response:210'),
+                dict(role='BOT', prompt='Thought: According to the response, I got the answer\nFinalAnswer: 210'),
+
+                dict(role='HUMAN', prompt='Bella has two times as many marbles as frisbees. She also has 20 more frisbees than deck cards. If she buys 2/5 times more of each item, what would be the total number of the items she will have if she currently has 60 marbles?'),
+                dict(role='BOT', prompt='Tool:PythonInterpreter\nTool Input:def solution():\n    marbles = 60\n    num_increased_marbles = marbles * 2 / 5\n    num_total_marbles = marbles + num_increased_marbles\n    frisbees = marbles / 2\n    num_increased_frisbees = frisbees * 2 / 5\n    num_total_frisbees = frisbees + num_increased_frisbees\n    deck_cards = frisbees - 20\n    num_increased_deck_cards = deck_cards * 2 / 5\n    num_total_deck_cards = deck_cards + num_increased_deck_cards\n    num_total = num_total_marbles + num_total_frisbees + num_total_deck_cards\n    result = num_total\n    return result'),
+                dict(role='SYSTEM', prompt='Response:140'),
+                dict(role='BOT', prompt='Thought: According to the response, I got the answer\nFinalAnswer: 140'),
+
+                dict(role='HUMAN', prompt='A group of 4 fruit baskets contains 9 apples, 15 oranges, and 14 bananas in the first three baskets and 2 less of each fruit in the fourth basket. How many fruits are there?'),
+                dict(role='BOT', prompt="""Tool:PythonInterpreter\nTool Input:def solution():\n    num_fruits_per_first_three_basket = 9 + 15 + 14\n    num_fruits_first_three_basket = num_fruits_per_first_three_basket * 3\n    num_apple_fourth_basket = 9 - 2\n    num_orange_fourth_basket = 15 - 2\n    num_banana_fourth_basket = 14 - 2\n    num_fruits_fourth_basket = num_apple_fourth_basket + num_orange_fourth_basket + num_banana_fourth_basket\n    num_fruits_total = num_fruits_first_three_basket + num_fruits_fourth_basket\n    result = num_fruits_total\n    return result"""),
+                dict(role='SYSTEM', prompt='Response:146'),  
+                dict(role='BOT', prompt='Thought: According to the response, I got the answer\nFinalAnswer: 146'),
+
+                dict(role='HUMAN', prompt='{question}'),
+            ])),
+    retriever=dict(type=ZeroRetriever),
+    inferencer=dict(type=AgentInferencer),
+)
+
+gsm8k_eval_cfg = dict(
+    evaluator=dict(type=Gsm8kAgentEvaluator),
+    pred_postprocessor=dict(type=gsm8k_postprocess),
+    dataset_postprocessor=dict(type=gsm8k_dataset_postprocess),
+)
+
+gsm8k_datasets = [
+    dict(
+        abbr='gsm8k',
+        type=GSM8KDataset,
+        path='./data/gsm8k',
+        reader_cfg=gsm8k_reader_cfg,
+        infer_cfg=gsm8k_infer_cfg,
+        eval_cfg=gsm8k_eval_cfg,
+    )
+]
diff --git a/configs/eval_chat_agent.py b/configs/eval_chat_agent.py
@@ -3,109 +3,28 @@
 from opencompass.partitioners import SizePartitioner
 from opencompass.runners import LocalRunner
 from opencompass.tasks import OpenICLInferTask
-from opencompass.openicl import AgentInferencer
-
-with read_base():
-    from .datasets.gsm8k.gsm8k_gen import gsm8k_datasets as datasets
-
 from opencompass.models.lagent import LagentAgent
 from lagent import PythonInterpreter, ReAct
 from lagent.agents.react import ReActProtocol
 
-FORCE_STOP_PROMPT_EN = """You should directly give results based on history information."""
-
-FEWSHOT_INSTRUCTION = """\
-You are a assistant who can utilize external tools.
-{tool_description}
-To use a tool, please use the following format:
-```
-{thought} Think what you need to solve, do you need to use tools?
-{action} the tool name, should be one of [{action_names}]
-{action_input} the input to the action
-```
-I will give you response after utilizing tools should using the following format:
-```
-{response} the results after call the tool.
-``
-If you already know the answer, or you do not need to use tools,
-please using the following format to reply:
-```
-{thought} the thought process to get the final answer
-{finish} final answer
-```
-
-Examples:
-
-<HUMAN>A group of 4 fruit baskets contains 9 apples, 15 oranges, and 14 bananas in the first three baskets and 2 less of each fruit in the fourth basket. How many fruits are there?
-<ASSISTANT>{thought} We need to calculate the total number of fruits. The total number of fruits in the first three baskets is given, while for the fourth basket, we need to subtract 2 from each fruit category. We can solve this problem using simple arithmetic.
-{action} PythonInterpreter
-{action_input}
-```python
-def solution():
-    # Fruits in the first three baskets
-    apples_first_three = 9
-    oranges_first_three = 15
-    bananas_first_three = 14
-
-    # Fruits in the fourth basket
-    apples_fourth = apples_first_three - 2
-    oranges_fourth = oranges_first_three - 2
-    bananas_fourth = bananas_first_three - 2
-
-    # Total fruits
-    total_fruits = ((apples_first_three + oranges_first_three + bananas_first_three) * 3 +
-                    apples_fourth + oranges_fourth + bananas_fourth)
-
-    return {{"total_fruits": total_fruits}}
-```
-<SYSTEM>{response}{{'total_fruits': 146}}
-<ASSISTANT> {thought} By adding the given numbers of apples, oranges, and bananas in the first three baskets, then subtracting 2 from each category for the fourth basket, we have found the total number of fruits.
-{finish} 146
-
-<HUMAN>Bella has two times as many marbles as frisbees. She also has 20 more frisbees than deck cards. If she buys 2/5 times more of each item, what would be the total number of the items she will have if she currently has 60 marbles?
-<ASSISTANT>{thought} This is a problem that requires solving equations. We know the relationship between the number of marbles, frisbees, and deck cards. Bella has twice as many marbles as frisbees, and 20 more frisbees than deck cards. Finally, we are told Bella buys 2/5 times more of each item. This purchasing will increase the number of each type of item.
-{action} PythonInterpreter
-{action_input}
-```python
-def solution():
-    # Given number of marbles
-    marbles_now = 60
-
-    # Calculate number of frisbees and deck cards now
-    frisbees_now = marbles_now / 2
-    cards_now = frisbees_now - 20
-
-    # Calculate number of each item after buying more
-    marbles_then = marbles_now + (2/5) * marbles_now
-    frisbees_then = frisbees_now + (2/5) * frisbees_now
-    cards_then = cards_now + (2/5)*cards_now
+with read_base():
+    from .datasets.gsm8k.gsm8k_gen_3ac57d import gsm8k_datasets as datasets
 
-    # Total number of items then
-    total_items = marbles_then + frisbees_then + cards_then
 
-    return {{"total_items": total_items}}
+system_prompt = """You are a helpful assistant which use tools to solve mathematical reasoning questions. The code must be a function, and the function name must be 'solution'. For mathematics, please use code tool to calculate. The example format is as follows:
 ```
-<SYSTEM>{response}{{'total_items': 140.0}}
-<ASSISTANT>{thought} By establishing the relationships between the numbers of marbles, frisbees, and deck cards that Bella currently has, we can calculate how many of each item she will have after buying 2/5 more of each. Adding these quantities together gives us the total number of items.
-{finish} 140
-
-Begin!
-"""
-
-PYTHON_INTERPRETER_DESCRIPTION = '''\
-It can run a Python code. The code must be a valid code that contains only python method, and the method' name must be 'solution' and returns a dict, which key is variable name. The libraries I recommend are sympy and scipy. the format is:
-```python
-# import packages
-import xxx
 def solution():
-    # initialize some variables
-    variable_names_with_real_meaning = xxx
-    # middle steps
-    mid_variable = func(mid_variable)
-    # final answer
-    final_answer =  func(mid_variable)
-    return final_answer
-```'''
+    variable_names_with_real_meaning = func(variable)
+    return variable_names_with_real_meaning
+```"""
+
+protocol = dict(
+    type=ReActProtocol,
+    action=dict(role="ACTION", begin="Tool:", end="\n"),
+    action_input=dict(role="ARGS", begin="Tool Input:", end="\n"),
+    finish=dict(role="FINISH", begin="FinalAnswer:", end="\n"),
+    call_protocol=system_prompt,
+)
 
 models = [
     dict(
@@ -121,25 +40,13 @@ def solution():
             max_seq_len=4096,
         ),
         actions=[
-            dict(type=PythonInterpreter,
-                 description=PYTHON_INTERPRETER_DESCRIPTION),
+            dict(type=PythonInterpreter),
         ],
-        protocol=dict(
-            type=ReActProtocol,
-            call_protocol=FEWSHOT_INSTRUCTION,
-            force_stop=FORCE_STOP_PROMPT_EN,
-            finish=dict(role='FINISH', begin='Final Answer:', end='\n'),
-        ),
+        protocol=protocol,
         batch_size=1,
     ),
 ]
 
-for dataset in datasets:
-    # Use AgentInferencer instead of GenInferencer
-    dataset['infer_cfg']['inferencer'] = dict(type=AgentInferencer)
-    # Use the question as agent input directly.
-    dataset['infer_cfg']['prompt_template']['template'] = "{question}"
-
 infer = dict(
     partitioner=dict(type=SizePartitioner, max_task_size=1000),
     runner=dict(

diff --git a/opencompass/openicl/icl_inferencer/icl_chat_inferencer.py b/opencompass/openicl/icl_inferencer/icl_chat_inferencer.py
@@ -76,7 +76,7 @@ def parse_template(self, chat: List[dict], mode='gen') -> str:
         else:
             # in case the model does not have any meta template
             last_sep = ''
-            for item in dialog:
+            for item in chat:
                 prompt += last_sep + (item.get('content') or '')
                 last_sep = '\n'
         return prompt