ToolBrain/examples/06_tool_retrieval.py at main · ToolBrain/ToolBrain

125 lines (100 loc) · 2.93 KB
import os

from openai import OpenAI
from smolagents import tool, CodeAgent, TransformersModel

from toolbrain import Brain, create_agent
from toolbrain.rewards import reward_exact_match
from toolbrain.retriever import ToolRetriever
# Wrapped with smolagents' `tool` so it can be passed in CodeAgent(tools=[...]).
@tool
def add(a: int, b: int) -> int:
    """
    Add two integers.

    Args:
        a: First integer to add
        b: Second integer to add

    Returns:
        The sum of a and b
    """
    return a + b
# Wrapped with smolagents' `tool` so it can be passed in CodeAgent(tools=[...]).
@tool
def multiply(a: int, b: int) -> int:
    """
    Multiply two integers.

    Args:
        a: First integer to multiply
        b: Second integer to multiply

    Returns:
        The product of a and b
    """
    return a * b
# Wrapped with smolagents' `tool` so it can be passed in CodeAgent(tools=[...]).
@tool
def divide(a: int, b: int) -> int:
    """
    Divide two integers.

    Args:
        a: Dividend
        b: Divisor

    Returns:
        The quotient of a divided by b, rounded down to a whole number
    """
    # Floor division keeps the result an int, as the signature declares;
    # true division (`/`) would return a float such as 4.0 for 8 / 2.
    # A zero divisor raises ZeroDivisionError, which is left to propagate.
    return a // b
# Wrapped with smolagents' `tool` so it can be passed in CodeAgent(tools=[...]).
@tool
def subtract(a: int, b: int) -> int:
    """
    Subtract two integers.

    Args:
        a: First integer
        b: Second integer to subtract from a

    Returns:
        The difference of a minus b
    """
    return a - b
if __name__ == "__main__":
    # Step 1: load the local model the agent will run on.
    print("📥 Initializing TransformersModel...")
    trainable_model = TransformersModel(
        model_id="Qwen/Qwen2.5-0.5B-Instruct",
        max_new_tokens=128,
    )
    print("✅ TransformersModel initialized.")

    # Step 2: build the agent with all four arithmetic tools available.
    print("🔧 Creating CodeAgent...")
    agent = CodeAgent(
        tools=[add, multiply, divide, subtract],
        model=trainable_model,
        max_steps=1,
    )
    print("✅ Agent created.")

    # Initialize the tool retriever.
    # The retriever is handed the bound `chat.completions.create` method (not
    # the client object) together with the name of the model to call.
    # The API key is read from the OPENAI_API_KEY environment variable.
    retrieval_llm_instance = OpenAI(
        api_key=os.getenv("OPENAI_API_KEY")
    ).chat.completions.create
    retrieval_llm_model = "gpt-4o-mini"
    tool_retriever = ToolRetriever(
        llm_model=retrieval_llm_model,
        llm_instance=retrieval_llm_instance,
        retrieval_topic="mathematics",
        retrieval_guidelines="Select only tools needed for mathematical calculations",
    )

    # Initialize the training brain
    brain = Brain(
        agent=agent,
        reward_func=reward_exact_match,
        algorithm="GRPO",
        tool_retriever=tool_retriever,
    )

    # Prepare training dataset: one query / expected-answer pair per tool.
    training_dataset = [
        {
            "query": "Calculate 5 + 7",
            "gold_answer": "12",
        },
        {
            "query": "What is 8 multiplied by 6?",
            "gold_answer": "48",
        },
        {
            "query": "Calculate 8 divided by 2",
            "gold_answer": "4",
        },
        {
            # Worded so the query really evaluates to the gold answer:
            # "8 subtracted from 2" would be -6, not 6.
            "query": "Calculate 2 subtracted from 8",
            "gold_answer": "6",
        },
    ]

    # Run training
    brain.train(training_dataset, num_iterations=1)

    # Try the agent returned by the brain on two unseen queries.
    trained_agent = brain.get_agent()
    print(trained_agent.run("Calculate 6 + 9"))
    print(trained_agent.run("What is 4 multiplied by 2?"))
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

06_tool_retrieval.py

Latest commit

History

06_tool_retrieval.py

File metadata and controls