# File size: 31,752 Bytes

from agent.utils import *
from agent.prompt import *
import anndata
import gradio as gr
from gradio import ChatMessage
import re
import pandas as pd
import pathlib
import numpy as np

class SigSpace(Basic_Agent):
    def __init__(self, config_path:str):
        """
        Create the agent and load every reference table used by its tools.

        All files are read from the relative ``data`` directory, so the process
        must be started from a working directory that contains it.

        Args:
            config_path (str): Configuration path forwarded unchanged to the
                parent class constructor.
        """
        super().__init__(config_path)
        self.system_prompt = Agent_Prompt
        # The running transcript always opens with the system prompt.
        self.conversation = [{"role": "system", "content": self.system_prompt}]

        path = pathlib.Path("data")

        # JUMP tables: drug metadata (with InChIKey) and compound-vs-genetic
        # perturbation cosine similarities.
        self.jump_tahoe_drug_metadata = pd.read_csv(path / "drug_metadata_inchikey.csv")
        self.jump_similarity_score = pd.read_csv(path / "compound_genetic_perturbation_cosine_similarity_inchikey.csv")

        # PRISM IC50 matrix. Column labels are lower-cased so that drug lookups
        # can be done case-insensitively (see get_ic50_prism).
        self.ic50 = pd.read_csv(path / "Tahoe_PRISM_cell_by_drug_ic50_matrix_named.csv", index_col=0)
        self.ic50.columns = self.ic50.columns.str.lower()

        # NCI-60 LC50 table; rows without a CELL value are unusable and dropped.
        self.lc50 = pd.read_csv(path / "filtered_results.csv")
        self.lc50 = self.lc50[self.lc50['CELL'].notna()]

        # Full Tahoe metadata and VISION scores.
        self.tahoe_cell_meta = pd.read_csv(path / "cell_line_metadata.csv")
        self.tahoe_drug_meta = pd.read_csv(path / "drug_metadata.csv")
        self.tahoe_vision_scores = anndata.read_h5ad(path / "tahoe_vision_scores.h5ad")

        # PRISM subset of the Tahoe metadata.
        self.prism_tahoe_cell_meta = pd.read_csv(path / "Tahoe_PRISM_matched_cell_metadata_final.csv")
        self.prism_tahoe_drug_meta = pd.read_csv(path / "Tahoe_PRISM_matched_drug_metadata_final.csv")

        # Cell-line common name (whitespace-stripped, case preserved) -> DepMap ID.
        # zip over the two columns avoids the per-row Series construction of
        # DataFrame.iterrows(); later duplicates still overwrite earlier ones.
        self.cell_name_to_depmap = {
            cell_name.strip(): depmap_id
            for cell_name, depmap_id in zip(
                self.prism_tahoe_cell_meta["cell_name"],
                self.prism_tahoe_cell_meta["Cell_ID_DepMap"],
            )
        }

        # Value of the "clean" column (whitespace-stripped) -> cell_line_name
        # for the NCI-60 table.
        self.cell_name_to_depmap_lc50 = {
            clean_name.strip(): cell_line_name
            for clean_name, cell_line_name in zip(
                self.lc50["clean"],
                self.lc50["cell_line_name"],
            )
        }

        # Pre-computed nearest-neighbour search results.
        self.tahoe_similarity_score = pd.read_csv(path / "in_tahoe_search_result_df.csv")
        self.tahoe_cxg_similarity_score = pd.read_csv(path / "cxg_search_result_df.csv")

    
    def initialize_conversation(self, message, conversation=None, history=None):
        """
        Assemble the message list for a new user turn.

        Args:
            message: Text of the new user message; always appended last.
            conversation: Existing message list to extend in place, or None to
                start from an empty list.
            history: Optional list of dicts with 'role' and 'content' keys.
                An empty list resets the conversation (the system prompt that
                was just appended is dropped as well); a non-empty list is
                replayed into the conversation.

        Returns:
            list: The resulting list of {"role", "content"} dicts.
        """
        transcript = [] if conversation is None else conversation
        transcript.append({"role": "system", "content" : Agent_Prompt})

        if history is not None:
            if len(history) == 0:
                # A cleared chat starts over from a brand-new list.
                transcript = []
                print("clear conversation successfully")
            else:
                final_index = len(history) - 1
                for idx, turn in enumerate(history):
                    role = turn['role']
                    if role == 'user':
                        # Replay the assistant turn that directly precedes this user turn.
                        if idx >= 1 and history[idx - 1]['role'] == 'assistant':
                            transcript.append(
                                {"role": "assistant", "content": history[idx - 1]['content']})
                        transcript.append(
                            {"role": "user", "content": turn['content']})
                    # A trailing assistant turn has no following user turn to pull it in.
                    if idx == final_index and role == 'assistant':
                        transcript.append(
                            {"role": "assistant", "content": turn['content']})

        transcript.append({"role": "user", "content": message})
        return transcript

    def get_similar_disease(self, disease_name, k_value):
        """
        Return the disease considered similar to ``disease_name``.

        Only "Alzheimer's" is recognised; any other name yields "FAIL".
        ``k_value`` is accepted but not used.
        """
        return 'Parkinsons Disease' if disease_name == "Alzheimer's" else "FAIL"

    def get_validated_target_jump(self, drug_name):
        print(drug_name)
        try:
            inchikey = self.jump_tahoe_drug_metadata[self.jump_tahoe_drug_metadata.drug.isin([drug_name])]["InChIKey"].values[0]
            similarity_scores = self.jump_similarity_score[self.jump_similarity_score.InChIKey.isin([inchikey])]

            # Count ORF entries with cosine_similarity > 0.2 and < -0.2
            orf_positive = similarity_scores[(similarity_scores.Genetic_Perturbation == 'ORF') & (similarity_scores.cosine_sim > 0.2)].shape[0]
            orf_negative = similarity_scores[(similarity_scores.Genetic_Perturbation == 'ORF') & (similarity_scores.cosine_sim < -0.2)].shape[0]

            # Count CRISPR entries with cosine_similarity > 0.2 and < -0.2
            crispr_positive = similarity_scores[(similarity_scores.Genetic_Perturbation == 'CRISPR') & (similarity_scores.cosine_sim > 0.2)].shape[0]
            crispr_negative = similarity_scores[(similarity_scores.Genetic_Perturbation == 'CRISPR') & (similarity_scores.cosine_sim < -0.2)].shape[0]

            orf_targets = f"ORF: {orf_positive} positive correlations (>0.2), {orf_negative} negative correlations (<-0.2)"
            crispr_targets = f"CRISPR: {crispr_positive} positive correlations (>0.2), {crispr_negative} negative correlations (<-0.2)"

            orf_crispr_targets = orf_targets + " " +crispr_targets

            known_targets_from_jump = self.jump_tahoe_drug_metadata[self.jump_tahoe_drug_metadata.drug.isin([drug_name])]["target_list"].values[0]
            known_targets_output = f"The known targets from the JUMP dataset are: {', '.join(known_targets_from_jump.split('|'))}"
        except Exception as e:
            print(e)
            return "For the drug {drug_name}, we were not able to find the target in the JUMP dataset."
        
        orf_crispr_targets = \
        f"""
        Preturbation description:

        ORF: The ORF perturbation consists of an overexpression of the target gene.
        CRISPR: The CRISPR perturbation consists of a knockout of the target gene.

        Considering the drug "{drug_name}", we expect positive correlations with shared CRISPR targets, 
        and negative correlations with shared ORF targets.
        
        But, the measured correlations are:

        {orf_crispr_targets}

        Furthermore, the JUMP dataset has the following known targets for the drug "{drug_name}":

        {known_targets_output}
        """ 
        return orf_crispr_targets
    
    def get_similar_drug_effect_in_tahoe(self, cell_line_name: str, drug_name: str):
        """
        Get similar effect drugs in tahoe based on the drug name and cell line name.
        
        Args:
            cell_line_name (str): The name of the cell line.
            drug_name (str): The name of the drug.
        """
        cell_line_names = self.tahoe_similarity_score["source_cell_line"].unique().tolist()
        drug_names = self.tahoe_similarity_score["source_drug_name"].unique().tolist()
        if cell_line_name not in cell_line_names:
            return "FAIL: Cell line name not found in the dataset. A example: CVCL_0218"
        if drug_name not in drug_names:
            return "FAIL: Drug name not found in the dataset. A example: Daptomycin"
        hits = self.tahoe_similarity_score[
            (self.tahoe_similarity_score["source_cell_line"] == cell_line_name) &
            (self.tahoe_similarity_score["source_drug_name"] == drug_name)
        ]
        # sort by distance
        hits = hits.sort_values(by="distance", ascending=True).reset_index(drop=True)
        hits = hits.head(10)
        # keep target_drug_name and target_cell_line
        hits = hits[["target_drug_name", "target_cell_line",]]
        outputs = f"""
        The following drugs have similar effects to the drug you provided:
        hits: 
        {hits}
        """
        return outputs
    
    def get_similar_drug_effects_in_cxg(self, cell_line_name: str, drug_name: str):
        """
        Get similar effect diseases in cxg based on the drug name and cell line name.
        
        Args:
            cell_line_name (str): The name of the cell line.
            drug_name (str): The name of the drug.
        """
        cell_line_names = self.tahoe_cxg_similarity_score["cell_line"].unique().tolist()
        drug_names = self.tahoe_cxg_similarity_score["perturbation_drug_name"].unique().tolist()
        if cell_line_name not in cell_line_names:
            return "FAIL: Cell line name not found in the dataset. A valid example: CVCL_0218"
        if drug_name not in drug_names:
            return "FAIL: Drug name not found in the dataset. A valid example:: Daptomycin"
        hits = self.tahoe_cxg_similarity_score[
            (self.tahoe_cxg_similarity_score["cell_line"] == cell_line_name) &
            (self.tahoe_cxg_similarity_score["perturbation_drug_name"] == drug_name)
        ]
        hits = hits.sort_values(by="distance", ascending=True).reset_index(drop=True)
        hits = hits.head(10)
        # keeps cell_type tissue_type and disease	
        hits = hits[["cell_type", "tissue_type", "disease"]]
        outputs = f"""
        The following diseases have similar effects to the drug you provided:
        hits: 
        {hits}
        """
        return outputs

    def get_ic50_prism(self, drug_name: str, cell_line_name: str):
        drug_name_lower = drug_name.strip().lower()
        cell_line_key = cell_line_name.strip()

        if cell_line_key not in self.cell_name_to_depmap:
            print(f"Cell line name '{cell_line_key}' not found for PRISM data")
            return f"FAIL: Cell line name '{cell_line_key}' not found for PRISM data"

        depmap_id = self.cell_name_to_depmap[cell_line_key]

        if drug_name_lower not in self.ic50.columns:
            print(f"Drug name '{drug_name}' not found in IC50 matrix columns.")
            return f"FAIL: Drug name '{drug_name}' not found in IC50 matrix columns."

        try:
            ic50_val = self.ic50.loc[depmap_id, drug_name_lower]
            if pd.isna(ic50_val):
                print(f"FAIL: IC50 value is missing for '{drug_name}' in cell line '{cell_line_name}' (DepMap ID: {depmap_id}).")
                return f"FAIL: IC50 value is missing for '{drug_name}' in cell line '{cell_line_name}' (DepMap ID: {depmap_id})."

            return (
                f"The IC50 value of {ic50_val:.4f} corresponds to the log10-transformed micromolar concentration "
                f"at which {drug_name} inhibits 50% of viability in the {cell_line_name} cell line "
                f"(DepMap ID: {depmap_id}).\n\n"
                "This value comes from the PRISM Repurposing Secondary Screen, which exposes pooled barcoded cell lines "
                "to drug treatment for 5 days and infers viability from barcode abundance using sequencing.\n\n"
                "The secondary screen includes higher-confidence compound–cell line pairs with improved replicability "
                "compared to the primary screen.\n\n"
                "Lower IC50 values indicate greater sensitivity of the cell line to the drug."
            )
        except KeyError as e:
            print(f"Combination not found: {e}")
            return None


    def clean_cell_line_name(self, name):
        """
        Normalise a cell-line name so that spelling variants compare equal.

        The value is converted to ``str``, upper-cased, and every character
        other than A-Z and 0-9 is dropped.

        Args:
            name: Cell line name (string or any other type).

        Returns:
            str: The name reduced to upper-case ASCII letters and digits.
        """
        uppercased = str(name).upper()
        non_alphanumeric = re.compile(r"[^A-Z0-9]")
        return non_alphanumeric.sub("", uppercased)

    def get_lc50_nci60(self, drug_name: str, cell_line_name: str):
        cell_line_name = cell_line_name.upper()
        cell_line_key = self.clean_cell_line_name(cell_line_name)

        if cell_line_key not in self.cell_name_to_depmap_lc50:
            print(f"Cell line name '{cell_line_key}' not found for NCI60 data")
            return None
        depmap_id = self.cell_name_to_depmap_lc50[cell_line_key]
        print ("Depmap_id", depmap_id)

        # Find the drug in NCI60 dataset
        # Since drugs are in uppercase in the list, convert search term to uppercase
        drug_name_upper = drug_name.strip().upper()

        # Filter rows where the drug name is in the drug column
        # This assumes drugs in each row are comma-separated or in a format that can be searched
        matching_row = self.lc50[self.lc50['drug'].str.contains(drug_name_upper, na=False)]
        print ("Matching row", matching_row)
        if matching_row.empty:
            print(f"Drug name '{drug_name}' not found in NCI60 dataset.")
            return None

        if matching_row.empty:
            raise ValueError(f"Multiple matches found for drug '{drug_name}' in NCI60 dataset.")

        print ("Matching row", matching_row)
        # Get the LC50 value from the matching row
        lc50_val = matching_row.iloc[0]['NLOGLC50']
        lconc_val = matching_row.iloc[0]['LCONC']

        if pd.isna(lc50_val):
            return "LC50 value is missing for '{drug_name}' in cell line '{cell_line_name}' (depmap_id: {depmap_id})."
        
        lc50_output = \
        f"""
        The LC50 value of {lc50_val} represents -log10(LC50), the negative base-10 logarithm of the molar concentration that inhibits 50% of cell growth. 

        Higher LC50 values therefore indicate greater drug potency. 

        The LCONC value of {lconc_val} denotes the maximum log10 molar concentration tested in the dilution series—for example, LCONC = -4 corresponds to 10^-4 M. 

        Both metrics come from the NCI-60 drug screen, which applies a standardized 48-hour exposure assay across all compound–cell-line pairs."
        """
        
        return lc50_output
    
    def load_gene_sets_file(self, file_path):
        """
        Load gene sets from a tab-delimited file where the first column is the
        gene set name and the remaining columns are gene symbols.

        Blank (or whitespace-only) lines are skipped, and empty fields inside a
        line are ignored. If a set name occurs more than once, the last
        occurrence wins.

        Parameters:
        -----------
        file_path : str
            Path to the gene sets file

        Returns:
        --------
        dict
            Dictionary mapping gene set names to lists of genes
        """
        gene_sets = {}
        with open(file_path, 'r') as file:
            for line in file:
                set_name, *members = line.strip().split('\t')
                if not set_name:
                    # str.split always returns at least one element, so a blank
                    # line shows up as an empty name rather than an empty list.
                    continue
                gene_sets[set_name] = [gene for gene in members if gene]
        return gene_sets

    def get_genes_for_set(self, set_name):
        """
        Get the list of genes for a specific gene set.
        
        Parameters:
        -----------
        set_name : str
            Name of the gene set to query
            
        Returns:
        --------
        list
            List of genes in the gene set, or empty list if set not found
        """
        if not hasattr(self, 'gene_sets'):
            # Load the gene sets file if it hasn't been loaded yet
            self.gene_sets = self.load_gene_sets_file('/home/ubuntu/ishita/msigdb_all_sigs_human_symbols.txt')
        
        return self.gene_sets.get(set_name, [])
            
    def rank_vision_scores(self, drug_name: str, cell_line_name: str, k_value: int):
        """
        Report the gene sets with the largest absolute VISION score for a
        drug / cell-line pair.

        The score matrix is standardised per column (mean subtracted, divided
        by the standard deviation) the first time this method runs. The
        observations are then filtered to the requested cell line
        (``Cell_Name_Vevo``) and drug, and further to the highest
        ``concentration`` present; the first remaining observation is ranked.

        Args:
            drug_name (str): Value to match in ``obs["drug"]``.
            cell_line_name (str): Value to match in ``obs["Cell_Name_Vevo"]``.
            k_value (int): Number of gene sets to report.

        Returns:
            str: A header followed by one line per selected gene set (name,
            member genes, direction and score), or a not-found message when no
            observation matches.
        """
        # Standardise once. Redoing it on every call recomputes statistics over
        # the whole matrix and rewrites the shared AnnData object each time.
        if not getattr(self, "_vision_scores_standardized", False):
            raw_scores = self.tahoe_vision_scores.X
            self.tahoe_vision_scores.X = (raw_scores - np.mean(raw_scores, axis = 0)) / np.std(raw_scores, axis = 0)
            self._vision_scores_standardized = True

        # subset to the drug / cell line at the highest tested concentration
        filt = (
            (self.tahoe_vision_scores.obs["Cell_Name_Vevo"] == cell_line_name)
            & (self.tahoe_vision_scores.obs["drug"] == drug_name)
        )
        filtered_scores = self.tahoe_vision_scores[filt]
        if filtered_scores.n_obs == 0:
            return "VISION scores not found for this drug–cell-line combination."

        filtered_scores = filtered_scores[
            filtered_scores.obs["concentration"] == filtered_scores.obs["concentration"].max()
        ]

        # pick top-|score| gene sets (descending absolute value) from the first observation
        top_idx = np.argsort(-np.abs(filtered_scores.X[0]))[:k_value]
        gene_sets = filtered_scores.var.index[top_idx].tolist()
        scores    = filtered_scores.X[0, top_idx].tolist()

        # build the narrative
        header = (
            "VISION scores are single-cell gene-set enrichment values computed by the "
            "VISION algorithm (DeTomaso & Yosef 2021). Positive scores indicate relative "
            "up-regulation of the gene set in the queried condition; negative scores indicate "
            "down-regulation.\n"
        )
        lines = []
        for gs, val in zip(gene_sets, scores):
            # Gene-set file keys are looked up without the "gs_" marker.
            gs_name = gs.replace("gs_", "")
            genes = self.get_genes_for_set(gs_name)
            direction = "up-regulated" if val > 0 else "down-regulated" if val < 0 else "not changed"
            lines.append(f"{gs} has gene set {genes} : {direction} (VISION score = {val:.3f})")

        return header + "\n".join(lines)
    
    def obtain_moa(self, drug_name: str):
        row = self.tahoe_drug_meta[self.tahoe_drug_meta["drug"] == drug_name]

        if row.empty:
            return "MOA annotation not found for this drug."
        
        moa_broad = row["moa-broad"].values[0]
        moa_fine  = row["moa-fine"].values[0]

        return (
            f"Broad MOA: {moa_broad}; "
            f"Fine MOA: {moa_fine}. "
            "Fine-grained mechanism of action (MOA) annotation for the drug, "
            "specifying the biological process or molecular target affected. "
            "Derived from MedChemExpress and curated with GPT-based annotations."
        )

    def obtain_gene_targets(self, drug_name: str):
        row = self.tahoe_drug_meta[self.tahoe_drug_meta["drug"] == drug_name]
        if row.empty:
            return "Gene targets not found for this drug."
        
        targets = row["targets"].values[0]

        # Convert a stringified list/dict to a Python object, if necessary.
        if isinstance(targets, str):
            try:
                targets = eval(targets)
            except Exception:  # fall back to treating it as a single ID
                targets = [targets]

        return (
            f"Gene target token IDs: {targets}. "
            "Gene identifiers (integer token IDs) corresponding to each gene with non-zero expression in the cell."
        )

    def obtain_cell_line_data(self, cell_line_name: str):
        row = self.tahoe_cell_meta[self.tahoe_cell_meta["cell_name"] == cell_line_name]

        if row.empty:
            return "Cell-line metadata not found for this cell line."
        
        organ                 = row["Organ"].values[0]
        driver_gene_symbol    = row["Driver_Gene_Symbol"].values[0]
        driver_varzyg         = row["Driver_VarZyg"].values[0]
        driver_vartype        = row["Driver_VarType"].values[0]
        driver_proteffect     = row["Driver_ProtEffect_or_CdnaEffect"].values[0]
        driver_mech_inferdm   = row["Driver_Mech_InferDM"].values[0]
        driver_genetype_dm    = row["Driver_GeneType_DM"].values[0]

        return (
            f"Organ: {organ}; "
            f"Driver_Gene_Symbol: {driver_gene_symbol}; "
            f"Driver_VarZyg: {driver_varzyg}; "
            f"Driver_VarType: {driver_vartype}; "
            f"Driver_ProtEffect_or_CdnaEffect: {driver_proteffect}; "
            f"Driver_Mech_InferDM: {driver_mech_inferdm}; "
            f"Driver_GeneType_DM: {driver_genetype_dm}. "
            "Organ = tissue or organ of origin for the cell line (e.g., Lung), used to interpret lineage-specific responses. "
            "Driver_Gene_Symbol = HGNC-approved symbol of a driver gene with functional alterations in this cell line. "
            "Driver_VarZyg = zygosity of the driver variant (Hom = homozygous, Het = heterozygous). "
            "Driver_VarType = type of genetic alteration (e.g., Missense, Frameshift, Stopgain). "
            "Driver_ProtEffect_or_CdnaEffect = precise protein or cDNA-level annotation of the mutation (e.g., p.G12S). "
            "Driver_Mech_InferDM = inferred functional mechanism (LoF = loss-of-function, GoF = gain-of-function). "
            "Driver_GeneType_DM = classification of the driver gene as an Oncogene or Suppressor."
        )   

    def run_gradio_chat(self, message: str,
                    history: list,
                    temperature: float,
                    max_new_tokens: int,
                    max_token: int,
                    call_agent: bool,
                    conversation: gr.State,
                    max_round: int = 20,
                    seed: int = None,
                    call_agent_level: int = 0,
                    sub_agent_task: str = None):
        """
        Drive one user turn of the chat, streaming updates to Gradio.

        The user message is appended to ``self.conversation`` and the LLM is
        queried for up to ``max_round`` rounds. Each reply is inspected for a
        ``Tool-call:`` section (tool expressions are executed and their output
        fed back into the conversation) or a ``Response:`` section (shown to
        the user). The loop stops once a reply contains ``FINISHED`` without a
        tool call, or when the tool-call text itself contains ``FAIL``.

        Args:
            message (str): User message; must be longer than 10 characters.
            history (list): Gradio chat history, only forwarded to
                ``initialize_conversation``.
            conversation (gr.State): Forwarded to ``initialize_conversation``.
            max_round (int): Maximum number of LLM rounds for this turn.
            temperature, max_new_tokens, max_token, call_agent, seed,
            call_agent_level, sub_agent_task: Accepted for interface
                compatibility; not used by this method.

        Yields:
            The growing list of ``ChatMessage`` objects for this turn, or a
            single plain string when ``message`` is too short.
        """
        print("\033[1;32;40mstart\033[0m")
        print("len(message)", len(message))

        if len(message) <= 10:
            yield "Hi, I am Agent, an assistant for answering biomedical questions. Please provide a valid message with a string longer than 10 characters."
            return "Please provide a valid message."

        # Kept for its effect on the caller-supplied ``conversation`` object.
        # NOTE(review): the LLM below is driven from ``self.conversation``, not
        # from this return value - confirm which of the two is intended.
        conversation = self.initialize_conversation(
            message,
            conversation=conversation,
            history=history)

        history = []
        next_round = True
        current_round = 0

        self.conversation.append({"role": "user", "content": message})
        while next_round and current_round < max_round:
            current_round += 1

            response = self.llm_infer(self.conversation)
            # NOTE(review): model output is stored under the "system" role;
            # left unchanged because the prompt format may depend on it.
            self.conversation.append({"role": "system", "content": response})
            tool_called = False
            print(response)

            if 'Tool-call:' in response:
                match = re.search(r"Tool-call:\s*(.*)", response, re.DOTALL)
                response_text = match.group(1).strip()
                if "None" not in response_text and response_text.replace('-', '').rstrip().replace('FINISHED', '').rstrip():
                    # Show the part after the reasoning block; fall back to the
                    # whole reply when the model emitted no </think> tag.
                    segments = response.replace('FINISHED', '').split('</think>')
                    visible_text = segments[1] if len(segments) > 1 else segments[0]
                    history.append(ChatMessage(
                        role="assistant", content=f"{visible_text}"))
                    yield history

                    tool_called = True
                    print(response_text)
                    if "FAIL" in response_text:
                        # No tool has run in this branch, so there is no tool
                        # output to record; log the failure notice itself.
                        failure_note = "Response from tool FAILED "
                        self.conversation.append({"role": "system", "content": failure_note})
                        history.append(
                            ChatMessage(role="assistant", content=failure_note)
                        )
                        next_round = False
                        yield history
                    else:
                        tool_call_text = response_text
                        # Several calls may be separated by ';' or by newlines.
                        if ';' in tool_call_text:
                            separator = ';'
                        elif '\n' in tool_call_text:
                            separator = '\n'
                        else:
                            separator = None

                        if separator is None:
                            tool_calls = [tool_call_text]
                        else:
                            tool_calls = [
                                i.replace('\n', '').rstrip('-').replace('FINISHED', '').replace('Response:', '')
                                for i in tool_call_text.split(separator) if i
                            ]

                        # Drop fragments that are empty or whitespace only.
                        tool_calls = [i.rstrip('-') for i in tool_calls if i.strip()]

                        for call in tool_calls:
                            print(f"\033[1;34;40mCalling this command now {call}\033[0m")
                            try:
                                # SECURITY: ``call`` is text produced by the LLM
                                # and is executed verbatim with eval(); it can
                                # run arbitrary Python. Restrict it to a
                                # whitelist of tool methods before exposing
                                # this agent to untrusted users.
                                tool_response = str(eval(call))
                            except Exception as exc:
                                # Report the failure to the model instead of
                                # aborting the whole chat stream.
                                tool_response = f"FAIL: could not execute tool call {call!r}: {exc}"
                            self.conversation.append({"role": "system", "content": tool_response})
                            history.append(
                                ChatMessage(role="assistant", content=f"Response from tool: {tool_response}")
                            )
                            print(f"\033[1;34;40mGot this response {tool_response}\033[0m")
                            yield history
                else:
                    history.append(
                                ChatMessage(role="assistant", content=f"{response}")
                            )
                    yield history

            else:
                # No tool-call section: show the text after "Response:", or the
                # whole reply when that marker is absent.
                match = re.search(r"Response:\s*(.*)", response, re.DOTALL)
                raw_text = match.group(1) if match else response
                response_text = raw_text.strip().replace('Tool-call: None', '')
                print(f"\033[1;33;40mresponse text: {response_text}\033[0m")
                history.append(
                    ChatMessage(
                        role="assistant", content=f"{response_text.replace('FINISHED', '')}")
                )
                yield history

            if 'FINISHED' in response and tool_called is False:
                next_round = False





      
        #         if len(last_outputs) > 0:
        #             function_call_messages, picked_tools_prompt, special_tool_call, current_gradio_history = yield from self.run_function_call_stream(
        #                 last_outputs, return_message=True,
        #                 existing_tools_prompt=picked_tools_prompt,
        #                 message_for_call_agent=message,
        #                 call_agent=call_agent,
        #                 call_agent_level=call_agent_level,
        #                 temperature=temperature)
        #             history.extend(current_gradio_history)
        #             if special_tool_call == 'Finish':
        #                 yield history
        #                 next_round = False
        #                 conversation.extend(function_call_messages)
        #                 return function_call_messages[0]['content']
        #             elif special_tool_call == 'RequireClarification' or special_tool_call == 'DirectResponse':
        #                 history.append(
        #                     ChatMessage(role="assistant", content=history[-1].content))
        #                 yield history
        #                 next_round = False
        #                 return history[-1].content
        #             if (self.enable_summary or token_overflow) and not call_agent:
        #                 if token_overflow:
        #                     print("token_overflow, using summary")
        #                 enable_summary = True
        #             last_status = self.function_result_summary(
        #                 conversation, status=last_status,
        #                 enable_summary=enable_summary)
        #             if function_call_messages is not None:
        #                 conversation.extend(function_call_messages)
        #                 formated_md_function_call_messages = tool_result_format(
        #                     function_call_messages)
        #                 yield history
        #             else:
        #                 next_round = False
        #                 conversation.extend(
        #                     [{"role": "assistant", "content": ''.join(last_outputs)}])
        #                 return ''.join(last_outputs).replace("</s>", "")
        #         # if self.enable_checker:
        #         #     good_status, wrong_info = checker.check_conversation()
        #         #     if not good_status:
        #         #         next_round = False
        #         #         print("Internal error in reasoning: " + wrong_info)
        #         #         break
        #         last_outputs = []
        #         last_outputs_str, token_overflow = self.llm_infer(
        #             messages=conversation,
        #             temperature=temperature,
        #             tools=picked_tools_prompt,
        #             skip_special_tokens=False,
        #             max_new_tokens=max_new_tokens,
        #             max_token=max_token,
        #             seed=seed,
        #             check_token_status=True)
        #         last_thought = last_outputs_str.split("[TOOL_CALLS]")[0]
        #         for each in history:
        #             if each.metadata is not None:
        #                 each.metadata['status'] = 'done'
        #         if '[FinalAnswer]' in last_thought:
        #             final_thought, final_answer = last_thought.split(
        #                 '[FinalAnswer]')
        #             history.append(
        #                 ChatMessage(role="assistant",
        #                             content=final_thought.strip())
        #             )
        #             yield history
        #             history.append(
        #                 ChatMessage(
        #                     role="assistant", content="**Answer**:\n"+final_answer.strip())
        #             )
        #             yield history
        #         else:
        #             history.append(ChatMessage(
        #                 role="assistant", content=last_thought))
        #             yield history

        #         last_outputs.append(last_outputs_str)

        #     if self.force_finish:
        #         last_outputs_str = self.get_answer_based_on_unfinished_reasoning(
        #             conversation, temperature, max_new_tokens, max_token, return_full_thought=True)
        #         for each in history:
        #             if each.metadata is not None:
        #                 each.metadata['status'] = 'done'

        #         final_thought, final_answer = last_outputs_str.split('[FinalAnswer]')
        #         history.append(
        #             ChatMessage(role="assistant",
        #                         content=final_thought.strip())
        #         )
        #         yield history
        #         history.append(
        #             ChatMessage(
        #                 role="assistant", content="**Answer**:\n"+final_answer.strip())
        #         )
        #         yield history
        #     else:
        #         yield "The number of rounds exceeds the maximum limit!"

        # except Exception as e:
        #     print(f"Error: {e}")
        #     if self.force_finish:
        #         last_outputs_str = self.get_answer_based_on_unfinished_reasoning(
        #             conversation,
        #             temperature,
        #             max_new_tokens,
        #             max_token,
        #             return_full_thought=True)
        #         for each in history:
        #             if each.metadata is not None:
        #                 each.metadata['status'] = 'done'

        #         final_thought, final_answer = last_outputs_str.split(
        #             '[FinalAnswer]')
        #         history.append(
        #             ChatMessage(role="assistant",
        #                         content=final_thought.strip())
        #         )
        #         yield history
        #         history.append(
        #             ChatMessage(
        #                 role="assistant", content="**Answer**:\n"+final_answer.strip())
        #         )
        #         yield history
        #     else:
        #         return None