"""Local reasoning agent using TinyLlama."""

from transformers import AutoTokenizer, AutoModelForCausalLM
import torch

class ReasoningAgent:
    """Local reasoning agent using TinyLlama with chain of thought prompting."""
    
    def __init__(self, model_name: str = "TinyLlama/TinyLlama-1.1B-Chat-v1.0") -> None:
        """Load the tokenizer and causal language model used by the agent.

        Args:
            model_name: Model identifier (hub name or local path) passed to
                ``from_pretrained`` for both the tokenizer and the model.
        """
        # Request half precision only when a CUDA device is available. With
        # device_map="auto" and no GPU the weights land on the CPU, where
        # float16 kernels are missing or very slow in many PyTorch builds,
        # so fall back to float32 there.
        dtype = torch.float16 if torch.cuda.is_available() else torch.float32

        self.tokenizer = AutoTokenizer.from_pretrained(model_name)
        self.model = AutoModelForCausalLM.from_pretrained(
            model_name,
            torch_dtype=dtype,
            # Let the loader decide device placement for the weights.
            device_map="auto",
        )
        
    def get_response(self, message: str) -> str:
        """Generate response using local model with chain of thought prompting."""
        try:
            # Format prompt with chain of thought structure
            prompt = f"""<|system|>
You are a helpful AI assistant that uses chain of thought reasoning to answer questions.
For each response, break down your thinking into steps before giving the final answer.
</s>