Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

[Feature Request]: ReasoningAgent #114

Closed
BabyCNM opened this issue Nov 30, 2024 · 1 comment · Fixed by #115
Closed

[Feature Request]: ReasoningAgent #114

BabyCNM opened this issue Nov 30, 2024 · 1 comment · Fixed by #115
Assignees
Labels
enhancement New feature or request roadmap

Comments

@BabyCNM
Copy link
Collaborator

BabyCNM commented Nov 30, 2024

Is your feature request related to a problem? Please describe.

  1. Beam Search Agent
    a. Nested chat implementation @Hk669
    b. Readme @BabyCNM
    c. test case @Hk669
    d. Blog @BabyCNM
  2. MCTS Agent

Describe the solution you'd like

No response

Additional context

No response

@BabyCNM BabyCNM added the enhancement New feature or request label Nov 30, 2024
@BabyCNM
Copy link
Collaborator Author

BabyCNM commented Nov 30, 2024

`ThinkNode`: the node class used to build the reasoning search tree

class ThinkNode:
    """One node in a tree of reasoning steps.

    The root node holds the original question; every other node holds a
    single candidate step. A node links itself into its parent's
    ``children`` list on construction, and tracks a grader-assigned
    ``value`` plus a ``visits`` counter for search algorithms.
    """

    def __init__(self, content: str, parent: Optional['ThinkNode'] = None) -> None:
        """Create a node for ``content`` and attach it under ``parent``.

        Args:
            content: The question (for the root) or a reasoning step.
            parent: The node this step extends, or None for the root.
        """
        self.content = content
        self.value = None          # rating assigned later by a grader
        self.parent = parent
        self.children = []
        self.visits = 0
        self.depth = 0 if parent is None else parent.depth + 1
        if parent is not None:
            parent.children.append(self)

    @property
    def _trajectory_arr(self) -> List[str]:
        """Return the root-to-here contents, question first."""
        if self.parent is None:
            return ["# Question: " + self.content]
        return self.parent._trajectory_arr + [self.content]

    @property
    def trajectory(self) -> str:
        """Return the path from root to this node as numbered steps."""
        steps = self._trajectory_arr
        lines = [steps[0]]
        for idx, step in enumerate(steps[1:], start=1):
            lines.append(f"Step {idx}: {step}")
        return "\n".join(lines)

    def __str__(self) -> str:
        return f"{self.content} -> Depth: {self.depth} Value: {self.value} Visits: {self.visits}"

    def __repr__(self) -> str:
        return str(self)

    def to_dict(self) -> Dict:
        """Convert this subtree to a nested dictionary representation."""
        return {
            'content': self.content,
            'value': self.value,
            'depth': self.depth,
            'visits': self.visits,
            'children': [child.to_dict() for child in self.children]
        }

    @classmethod
    def from_dict(cls, data: Dict, parent: Optional['ThinkNode'] = None) -> 'ThinkNode':
        """Rebuild a subtree from a dictionary produced by ``to_dict``."""
        node = cls(content=data['content'], parent=parent)
        node.value = data['value']
        node.depth = data['depth']
        node.visits = data['visits']

        # Children re-attach themselves to ``node`` inside the constructor.
        for child_data in data['children']:
            cls.from_dict(child_data, parent=node)

        return node

Basic Beam Search Implementation

class BeamSearchAgent(autogen.AssistantAgent):
    """Tree-of-Thoughts assistant that answers a question via beam search.

    For each incoming question the agent grows a tree of candidate
    reasoning steps proposed by an inner "thinker" agent, prunes it to the
    top ``beam_size`` trajectories using scores from an inner "grader"
    agent, and finally synthesizes an answer from either the best
    completed trajectory or the pool of all completed trajectories.
    """

    def __init__(self,
                 name,
                 llm_config,
                 max_depth=4,
                 beam_size=3,
                 answer_approach="pool",
                 verbose=True) -> None:
        """Initialize the beam-search agent.

        Args:
            name: Agent name, forwarded to ``autogen.AssistantAgent``.
            llm_config: LLM configuration, shared with the inner agents.
            max_depth: Maximum number of reasoning steps per trajectory.
            beam_size: Number of trajectories kept after each expansion.
            answer_approach: ``"pool"`` to answer from all completed
                trajectories, ``"best"`` to answer from the top-rated one.
            verbose: Whether to show intermediate chatter and debug output.
        """
        super().__init__(name=name, llm_config=llm_config)
        self.max_depth = max_depth
        self.beam_size = beam_size
        self.verbose = verbose
        assert answer_approach in ["pool", "best"]
        self.answer_approach = answer_approach
        # Inner agent that proposes candidate next steps for a trajectory.
        self.thinker = autogen.AssistantAgent(
            name="tot_thinker",
            system_message=tot_msg,
            llm_config=llm_config)

        # Inner agent that scores partial trajectories on a 1-5 scale.
        self.grader = autogen.AssistantAgent(
            name="tot_grader",
            system_message=
            "Rate the thinking trajectories for score 1 - 5 (1: worst, 5: best).",
            llm_config=llm_config)
        self.register_reply([autogen.Agent, None],
                            BeamSearchAgent.generate_response)

    def rate_node(self, node: ThinkNode) -> float:
        """Ask the grader to score ``node``'s trajectory, scaled to [0, 1].

        Returns 0.0 when no numeric rating can be parsed from the reply.
        """
        self.send(
            message=f"Rate the trajectory:\n{node.trajectory}",
            recipient=self.grader,
            request_reply=True,
            silent=False)
        rating = self.grader.last_message()["content"].strip()
        try:
            # Scale the 1-5 rating to [0, 1]
            reward = (float(re.findall(r"[\d.]+", rating)[0]) - 1) / 4.0
        except (IndexError, ValueError):
            reward = 0.0  # Default reward if parsing fails
        return reward

    def generate_response(self, messages, sender, config=None):
        """Reply function: answer the last message via beam search.

        Returns an ``(is_final, reply)`` pair per the autogen
        reply-function protocol.
        """
        if sender == self:
            return False, ""  # Defer the LLM call to next reply functions.

        messages = self._oai_messages[sender] if messages is None else messages
        prompt = messages[-1]["content"].strip()
        if not prompt:
            return True, "TERMINATE"

        root = ThinkNode(content=prompt, parent=None)
        prev_leafs = [root]

        final_answers = set()  # completed (terminal) trajectories

        while prev_leafs and len(final_answers) < self.beam_size:
            new_leafs = []
            # Debug output, honoring the verbose flag (the original
            # printed unconditionally, ignoring verbose).
            if self.verbose:
                print("len(final_answers)", len(final_answers))
                print("len(prev_leafs)", len(prev_leafs))
            for node in prev_leafs:
                if (self.max_depth and node.depth >= self.max_depth) or "TERMINATE" in node.content:
                    # Reached max depth or an explicit stop; collect as a
                    # possible answer, rating it if not rated already.
                    if node.value is None:
                        node.value = self.rate_node(node)
                    final_answers.add(node)
                    continue

                # Fresh context per expansion so earlier turns don't leak in.
                self.thinker.clear_history()
                self.send(
                    message=
                    f"{node.trajectory}\n---\nWhat are the possible next steps?",
                    recipient=self.thinker,
                    request_reply=True,
                    silent=False)
                reply = self.thinker.last_message()["content"].strip()

                # The thinker lists each candidate step as "Option N: ...".
                options = re.findall(r"Option \d+:(.+?)(?=Option \d+:|$)", reply, re.DOTALL)
                if self.verbose:
                    print("Options:", options)
                for option in options:
                    new_leafs.append(ThinkNode(content=option.strip(), parent=node))

            prev_leafs = new_leafs

            if len(prev_leafs) + len(final_answers) > self.beam_size:
                if len(final_answers) >= self.beam_size:
                    prev_leafs = []  # stop searching, max beam size reached
                    break

                # Rate all candidates before pruning.
                for node in prev_leafs:
                    node.value = self.rate_node(node)
                # Beam search: keep top beam_size leaf nodes
                prev_leafs = sorted(prev_leafs,
                                    key=lambda x: x.value if x.value is not None else 0,
                                    reverse=True)[:self.beam_size - len(final_answers)]

        assert final_answers, "No final answers found."
        visualize_tree(root)
        final_answers = list(final_answers)

        if self.answer_approach == "best":
            # Answer from the single highest-rated trajectory.
            best_leaf = max(final_answers, key=lambda x: x.value)
            self.send(
                message=
                f"Answer the question {prompt}. Here is my thinking processes:\n{best_leaf.trajectory}",
                recipient=self,
                request_reply=True,
                silent=not self.verbose)
        elif self.answer_approach == "pool":
            # Answer by pooling all completed trajectories.
            all_thoughts = "\n\n".join([
                f"--- Possibility {i+1} ---\n{node.trajectory}\n"
                for i, node in enumerate(final_answers)
            ])
            self.send(
                message=
                f"Answer the question {prompt}. You can utilize these students' thinking processes.\n\n{all_thoughts}",
                recipient=self,
                request_reply=True,
                silent=not self.verbose)

        final_answer = self.chat_messages[self][-1]["content"].strip()
        return True, final_answer



def last_meaningful_msg(sender, recipient, summary_args):
    """Summary method: return the last non-blank message, minus "TERMINATE".

    Walks ``recipient``'s chat history with ``sender`` from newest to
    oldest and returns the first message whose content is non-blank after
    stripping the "TERMINATE" keyword. Malformed messages are skipped with
    a warning.

    Args:
        sender: The agent on the other side of the chat being summarized.
        recipient: The agent whose ``chat_messages`` history is inspected.
        summary_args: Unused; required by the summary-method protocol.

    Returns:
        The extracted summary string, "TERMINATE" for a self-chat, or ""
        when no meaningful message is found.
    """
    if sender == recipient:
        return "TERMINATE"

    summary = ""
    chat_messages = recipient.chat_messages[sender]

    for msg in reversed(chat_messages):
        try:
            content = msg["content"]
            if isinstance(content, str):
                summary = content.replace("TERMINATE", "")
            elif isinstance(content, list):
                # Remove the `TERMINATE` word in the content list.
                summary = "\n".join(
                    x["text"].replace("TERMINATE", "") for x in content if isinstance(x, dict) and "text" in x
                )
            # First message that is non-blank after cleanup wins.
            if summary.strip():
                return summary
        except (IndexError, AttributeError, KeyError) as e:
            # KeyError added: a msg dict without "content" should be
            # skipped like the other malformed shapes, not crash.
            warnings.warn(f"Cannot extract summary using last_msg: {e}. Using an empty str as summary.", UserWarning)
    return summary

def thought_reply(question: str,
                  config_list: list,
                  verbose: bool = False) -> str:
    """Answer ``question`` with a fresh BeamSearchAgent driven by a user proxy.

    Args:
        question: The question to reason about.
        config_list: LLM config list wrapped into the agent's ``llm_config``.
        verbose: Whether intermediate agent chatter is displayed.

    Returns:
        The chat summary produced by ``last_meaningful_msg``, i.e. the
        final answer with any "TERMINATE" marker stripped.
    """
    # Note: the original declared `global total_cost`, but no such global
    # is ever defined or used here; the dead statement is removed.
    thought_agent = BeamSearchAgent(name="thought_agent",
                                    llm_config={"config_list": config_list},
                                    verbose=verbose)
    user_proxy = autogen.UserProxyAgent(
        name="user_proxy",
        human_input_mode="NEVER",
        code_execution_config={"use_docker": False},
        max_consecutive_auto_reply=10)
    ans = user_proxy.initiate_chat(thought_agent,
                                   message=question,
                                   summary_method=last_meaningful_msg)
    return ans.summary

@Hk669 Hk669 added the roadmap label Nov 30, 2024
@Hk669 Hk669 linked a pull request Nov 30, 2024 that will close this issue
9 tasks
@Hk669 Hk669 mentioned this issue Nov 30, 2024
9 tasks
@Hk669 Hk669 changed the title [Feature Request]: Reason Agent [Feature Request]: ReasoningAgent Dec 3, 2024
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment
Labels
enhancement New feature or request roadmap
Projects
None yet
Development

Successfully merging a pull request may close this issue.

2 participants