Spaces:

Agents-MCP-Hackathon
/

Patent_Architect_AI

Running

Patent_Architect_AI / real_ai_agents_implementation.py

WHG2023

fix: Improve backend parsing and frontend stability

0f743a0 about 1 month ago

21 kB

	#!/usr/bin/env python3
	"""
	True Agentic Implementation for Patent Architect AI v2
	This version implements a genuine, stateful, multi-agent negotiation workflow
	where agent outputs dynamically influence subsequent agent actions.
	"""

	import os
	import json
	import re
	import base64
	import requests
	from typing import Dict, List, Optional, Tuple, Generator
	from dataclasses import dataclass, field
	import google.generativeai as genai
	from dotenv import load_dotenv

	# --- Tools ---
	def web_search(query: str, num_results: int = 5) -> List[Dict]:
	    """Run a live web search through the Serper.dev API.

	    Args:
	        query: Search string sent as the ``q`` field of the request body.
	        num_results: Number of results requested via the ``num`` field.

	    Returns:
	        A list of ``{"title", "link", "snippet"}`` dicts built from the
	        ``organic`` entries of the response. An empty list is returned when
	        the response carries no usable ``organic`` list. When the API key is
	        missing, the request fails, or the body is not valid JSON, a single
	        placeholder entry describing the problem is returned instead of
	        raising.
	    """
	    api_key = os.getenv("SERPER_API_KEY")

	    if not api_key:
	        print("⚠️ WARNING: SERPER_API_KEY not set. Web search is disabled.")
	        return [{"title": "Web Search Disabled", "link": "#", "snippet": "Please provide a Serper.dev API key to enable live web search."}]

	    url = "https://google.serper.dev/search"
	    payload = json.dumps({
	        "q": query,
	        "num": num_results,
	    })
	    headers = {
	        'X-API-KEY': api_key,
	        'Content-Type': 'application/json',
	    }

	    try:
	        print(f"Executing REAL web search for: {query} via Serper.dev")
	        response = requests.post(url, headers=headers, data=payload, timeout=10)
	        response.raise_for_status()
	        search_results = response.json()
	    except (requests.exceptions.RequestException, ValueError) as e:
	        # ValueError covers a body that is not valid JSON: depending on the
	        # installed ``requests`` version the decode error is not necessarily
	        # a RequestException subclass.
	        print(f"Error during web search with Serper.dev: {e}")
	        return [{"title": "Web Search Error", "link": "#", "snippet": f"An error occurred during the search: {e}"}]

	    # The key for organic results is 'organic'; anything else (missing key,
	    # null value, unexpected top-level type) is treated as "no results".
	    organic = search_results.get('organic') if isinstance(search_results, dict) else None
	    if not isinstance(organic, list):
	        return []

	    # Format the results to match the expected structure.
	    return [
	        {
	            "title": item.get('title'),
	            "link": item.get('link'),
	            "snippet": item.get('snippet'),
	        }
	        for item in organic
	        if isinstance(item, dict)
	    ]


	# --- Configuration ---
	load_dotenv()

	# Configure Gemini.
	# ``genai.configure`` does not validate the key: passing ``None`` is accepted
	# silently and the failure only surfaces on the first model call. The key's
	# presence is therefore checked explicitly so GEMINI_AVAILABLE reflects
	# reality. GOOGLE_API_KEY is honoured as well because the SDK documents it as
	# its own fallback when no key is passed.
	_gemini_api_key = os.getenv("GEMINI_API_KEY") or os.getenv("GOOGLE_API_KEY")
	GEMINI_AVAILABLE = False
	if _gemini_api_key:
	    try:
	        genai.configure(api_key=_gemini_api_key)
	        GEMINI_AVAILABLE = True
	    except (ValueError, TypeError) as e:
	        print(f"Gemini API key not found or invalid: {e}")
	else:
	    print("Gemini API key not found or invalid: GEMINI_API_KEY is not set")


	# --- Data Structures ---
	@dataclass
	class NegotiationState:
	    """Mutable record shared by all agents during one negotiation run.

	    Only ``invention_disclosure`` is required at construction time; every
	    other field starts out empty.
	    """

	    # Raw invention text supplied by the caller.
	    invention_disclosure: str

	    # Prior-art stage outputs.
	    key_concepts: List[str] = field(default_factory=list)
	    prior_art_analysis: Dict = field(default_factory=dict)

	    # Text artefacts produced by the drafting agents.
	    strategic_mandate: str = ""
	    technical_summary: str = ""
	    patent_claims: str = ""
	    figure_description: str = ""

	    # Base64-encoded conceptual image; empty when none was generated.
	    ideogram_image_b64: str = ""

	    # Chronological log of agent messages (one dict per entry).
	    negotiation_transcript: List[Dict] = field(default_factory=list)

	# --- Base Agent Class ---
	class BaseAgent:
	    """Common base for the text agents: owns the Gemini model handle."""

	    def __init__(self, model_name='gemini-1.5-flash'):
	        """Create the model handle, or leave it as ``None`` when Gemini is not configured."""
	        self.model = genai.GenerativeModel(model_name) if GEMINI_AVAILABLE else None

	    def _execute_prompt(self, prompt: str) -> str:
	        """Send ``prompt`` to the model and return the reply text.

	        Failures are reported in-band: when no model is available, or the
	        call raises, the returned string starts with ``"Error:"`` instead of
	        an exception being propagated.
	        """
	        if not self.model:
	            return f"Error: The '{self.__class__.__name__}' agent could not run because the Gemini API is not configured. Please set the GEMINI_API_KEY."

	        try:
	            # Reading ``.text`` stays inside the try so that a failure while
	            # accessing the reply is reported the same way as a failed call.
	            return self.model.generate_content(prompt).text
	        except Exception as e:
	            print(f"Error executing prompt for {self.__class__.__name__}: {e}")
	            return f"Error: Could not get a response from the model. Details: {e}"

	# --- Specialized Agents ---
	class PriorArtDetective(BaseAgent):
	    """Agent that extracts search concepts, runs web searches and summarizes the hits."""

	    @staticmethod
	    def _split_plain_list(text: str) -> List[str]:
	        """Parse a non-JSON reply as a comma-separated list, dropping quotes and brackets."""
	        cleaned = text.strip()
	        for junk in ('"', "'", '[', ']'):
	            cleaned = cleaned.replace(junk, '')
	        return [part.strip() for part in cleaned.split(',') if part.strip()]

	    @classmethod
	    def _parse_key_concepts(cls, response_text: str) -> List[str]:
	        """Turn the model's concept reply into a list of non-empty strings."""
	        # _execute_prompt reports failures as text starting with "Error:".
	        # Such a reply contains no concepts and must not be turned into
	        # search queries.
	        if response_text.lstrip().startswith("Error:"):
	            return []

	        match = re.search(r'\[(.*?)\]', response_text, re.DOTALL)
	        if not match:
	            # The model may return comma-separated strings without brackets.
	            return cls._split_plain_list(response_text)

	        try:
	            parsed = json.loads(match.group(0))
	        except json.JSONDecodeError:
	            # Bracketed but not valid JSON: fall back to a simple list parse.
	            return cls._split_plain_list(response_text)
	        # Keep only usable string entries; nested objects or numbers are not
	        # meaningful search phrases.
	        return [item.strip() for item in parsed if isinstance(item, str) and item.strip()]

	    @staticmethod
	    def _parse_summary(response_text: str) -> Optional[Dict]:
	        """Extract the JSON object from the summary reply, or ``None`` if unusable.

	        Handles replies wrapped in a markdown code fence (with or without a
	        ``json`` tag) as well as bare JSON.
	        """
	        fenced = re.search(r'```(?:json)?\s*([\s\S]*?)\s*```', response_text)
	        json_str = fenced.group(1) if fenced else response_text
	        try:
	            parsed = json.loads(json_str.strip())
	        except json.JSONDecodeError:
	            return None
	        # Callers treat the result as a dict; a JSON array or scalar is as
	        # unusable as malformed JSON.
	        return parsed if isinstance(parsed, dict) else None

	    def analyze(self, invention_disclosure: str) -> Dict:
	        """Identify key concepts, search the web for them and summarize the results.

	        Args:
	            invention_disclosure: Free-text description of the invention.

	        Returns:
	            A dict with the keys ``"key_concepts"``, ``"real_prior_art"`` and
	            ``"landscape_summary"``. When the model's summary cannot be
	            parsed, ``"real_prior_art"`` holds the raw search results and
	            ``"landscape_summary"`` holds an error message.
	        """
	        # Phase 1: Extract Key Concepts
	        concept_prompt = f"""
	Analyze the following invention disclosure. Your task is to extract the most important, specific, and searchable technical keywords or concepts.
	- If the disclosure is detailed, extract up to 3-5 key concepts.
	- If the disclosure is short or a single phrase, the main phrase itself may be the best concept.

	Return these concepts as a simple JSON array of strings. Do not add any other text or explanation. Your output MUST be only the JSON array.

	Invention: "{invention_disclosure}"

	Example for detailed input:
	Invention: "My invention is a smart coffee mug that uses a novel phase-change material to keep coffee at a perfect temperature. It also has a mobile app that connects via Bluetooth to let the user set their preferred temperature. The key innovation is a machine learning algorithm that learns the user's drinking habits to pre-warm or cool the mug, optimizing energy use."
	Output:
	["phase-change material thermal management", "predictive pre-warming algorithm for beverage container", "user habit machine learning for temperature control"]

	Example for short input:
	Invention: "Non-invasive glucose monitoring using Raman spectroscopy"
	Output:
	["non-invasive glucose monitoring", "Raman spectroscopy for glucose detection"]
	"""
	        key_concepts = self._parse_key_concepts(self._execute_prompt(concept_prompt))

	        # Fallback for very short disclosures if the LLM still fails: use the
	        # disclosure itself as the single concept (never an empty string).
	        if not key_concepts and len(invention_disclosure.split()) < 10:
	            # Also correct common typos as a courtesy
	            corrected_disclosure = invention_disclosure.replace("Non-invasice", "Non-invasive")
	            if corrected_disclosure.strip():
	                key_concepts = [corrected_disclosure]

	        if not key_concepts:
	            return {"key_concepts": [], "real_prior_art": [], "landscape_summary": "Could not identify key concepts to search for."}

	        # Phase 2: Perform Live Web Searches
	        search_findings = []
	        for concept in key_concepts:
	            # Search Google Patents
	            patent_query = f'"{concept}" site:patents.google.com'
	            search_findings.extend(web_search(patent_query))

	            # Search Wikipedia for general background
	            wiki_query = f'"{concept}" site:en.wikipedia.org'
	            search_findings.extend(web_search(wiki_query))

	        # Phase 3: Summarize Real Findings
	        if not search_findings:
	            return {"key_concepts": key_concepts, "real_prior_art": [], "landscape_summary": "No relevant prior art found in web search."}

	        summary_prompt = f"""
	You are a patent analyst. Below are raw web search results for an invention related to "{', '.join(key_concepts)}".
	Your job is to analyze these results and provide a concise summary.

	Search Results:
	{json.dumps(search_findings, indent=2)}

	Tasks:
	1. Create a brief, 2-3 sentence "landscape_summary" assessing how crowded the field appears to be based on these results.
	2. Extract the top 5 most relevant findings and list them in a "real_prior_art" array, including their "title" and "link".

	Return the response as a single JSON object with keys: "landscape_summary" and "real_prior_art".
	"""
	        summary_response_text = self._execute_prompt(summary_prompt)

	        summary_data = self._parse_summary(summary_response_text)
	        if summary_data is None:
	            print(f"Failed to parse JSON from LLM summary response: {summary_response_text}")
	            return {
	                "key_concepts": key_concepts,
	                "real_prior_art": search_findings, # Return the raw findings
	                "landscape_summary": "Error: The AI's analysis of the search results could not be parsed.",
	            }

	        summary_data["key_concepts"] = key_concepts # Add concepts for context
	        return summary_data

	class ChiefStrategistAgent(BaseAgent):
	    """Agent that turns the prior-art analysis into a one-sentence strategic mandate."""

	    def formulate_strategy(self, invention_disclosure: str, prior_art_analysis: Dict) -> str:
	        """Ask the model for a strategic mandate and return its reply text.

	        Args:
	            invention_disclosure: Free-text description of the invention.
	            prior_art_analysis: Dict read for the keys ``key_concepts``,
	                ``real_prior_art`` and ``landscape_summary``; missing keys
	                fall back to empty defaults in the prompt.
	        """
	        strategy_prompt = f"""
	You are a Chief Patent Strategist. Your job is to determine the strongest angle for a successful patent application.

	Invention Disclosure:
	"{invention_disclosure}"

	Prior Art Analysis:
	- Key Concepts: {prior_art_analysis.get('key_concepts', [])}
	- Real Prior Art Found: {prior_art_analysis.get('real_prior_art', [])}
	- Landscape Summary: {prior_art_analysis.get('landscape_summary', '')}

	Based on the REAL prior art found, formulate a clear, one-sentence "Strategic Mandate". This mandate must identify the single most patentable aspect of the invention that appears novel and non-obvious compared to the search results.

	Example Mandates:
	- "The strategic focus shall be on the novel method for data encryption, as the search results confirm existing hardware implementations."
	- "The patentability of this invention rests on the unique chemical composition of the coating, which appears distinct from the cited art."
	- "We will patent the specific algorithm for adaptive lighting control, as the general hardware is well-known according to the search."

	Formulate the Strategic Mandate for the provided invention.
	"""
	        reply = self._execute_prompt(strategy_prompt)
	        return reply

	class TechnicalWriterAgent(BaseAgent):
	    """Agent that drafts the "Summary of the Invention" section."""

	    def write_summary(self, invention_disclosure: str, strategic_mandate: str) -> str:
	        """Build the writer prompt from the disclosure and mandate and return the model's reply text."""
	        writer_prompt = f"""
	You are a professional patent writer. Your task is to write a "Summary of the Invention" section for a patent application.

	Invention Disclosure: "{invention_disclosure}"

	CRITICAL INSTRUCTION: You must follow this Strategic Mandate provided by the Chief Strategist:
	Strategic Mandate: "{strategic_mandate}"

	Write a concise, professional summary (2-3 paragraphs). Ensure that the summary heavily emphasizes the aspect highlighted in the Strategic Mandate as the core of the invention.
	"""
	        reply = self._execute_prompt(writer_prompt)
	        return reply

	class ClaimsDrafterAgent(BaseAgent):
	    """Agent that drafts the patent claim set."""

	    def draft_claims(self, invention_disclosure: str, strategic_mandate: str) -> str:
	        """Build the claim-drafting prompt from the disclosure and mandate and return the model's reply text."""
	        claims_prompt = f"""
	You are a patent attorney specializing in claim drafting.

	Invention Disclosure: "{invention_disclosure}"

	CRITICAL INSTRUCTION: Your claim set MUST be aligned with the following mandate:
	Strategic Mandate: "{strategic_mandate}"

	Draft a set of 5-7 patent claims.
	- The independent claim (Claim 1) must be directly focused on the feature identified in the Strategic Mandate.
	- Dependent claims should add further specifics and variations.
	- Ensure the claims are clear, concise, and properly formatted.
	"""
	        reply = self._execute_prompt(claims_prompt)
	        return reply

	class FigureDrafterAgent(BaseAgent):
	    """Agent that asks the model for LaTeX/TikZ code of a key technical figure."""

	    def describe_figure(self, invention_disclosure: str, strategic_mandate: str) -> str:
	        """Build the figure prompt from the disclosure and mandate and return the model's reply text.

	        The prompt requests raw LaTeX only; the reply is returned as-is.
	        """
	        # NOTE: literal braces inside an f-string must be doubled. Written as
	        # ``{document}`` the text would be evaluated as an expression and
	        # raise NameError before the prompt is ever sent.
	        prompt = f"""
	You are a patent illustrator's assistant. You need to generate the LaTeX/TikZ code for a key technical figure.

	Invention Disclosure: "{invention_disclosure}"

	CRITICAL INSTRUCTION: The figure must visually represent the core idea from the mandate:
	Strategic Mandate: "{strategic_mandate}"

	1. Decide on the best type of figure to illustrate the mandate (e.g., flowchart, system diagram, cross-section).
	2. Generate the complete LaTeX/TikZ code to create this figure.

	CRITICAL OUTPUT FORMAT:
	Return ONLY the raw LaTeX code, starting with `\\documentclass` and ending with `\\end{{document}}`.
	DO NOT include any description, explanation, or any text outside of the LaTeX code block.
	"""
	        return self._execute_prompt(prompt)

	class SegmindIdeogramAgent:
	    """Client for the Segmind Ideogram endpoint that renders a conceptual image."""

	    def __init__(self, timeout: float = 120.0):
	        """Read the API key from the environment and store the endpoint settings.

	        Args:
	            timeout: Seconds to wait for the HTTP request before giving up.
	                The default is deliberately generous; tune it to the
	                service's observed latency.
	        """
	        # Key comes from the SEGMIND_API_KEY environment variable; there is
	        # no built-in default key.
	        self.api_key = os.getenv("SEGMIND_API_KEY")
	        self.url = "https://api.segmind.com/v1/ideogram-3"
	        self.timeout = timeout

	    def generate_image(self, technical_summary: str, strategic_mandate: str) -> Optional[str]:
	        """Request an image for the invention and return it base64-encoded.

	        Returns:
	            The response body encoded as a base64 string on HTTP 200, or
	            ``None`` when no API key is set, the service answers with another
	            status, or the request fails or times out.
	        """
	        if not self.api_key:
	            return None

	        # Create a more cinematic prompt for image generation
	        image_prompt = f"""
	Create a photorealistic, cinematic photograph representing the following invention.
	The image should focus on the core concept defined by the strategic mandate.

	Invention Summary: "{technical_summary}"
	Core Concept (Strategic Mandate): "{strategic_mandate}"

	Translate this technical concept into a visually stunning and professional marketing image.
	Emphasize the most innovative aspect. For example, if it's an algorithm, show a sleek user interface or an abstract representation of data flow, not just the hardware.
	"""

	        data = {
	            "prompt": image_prompt,
	            "resolution": "1024x1024",
	            "style_type": "REALISTIC",
	        }
	        headers = {'x-api-key': self.api_key}

	        try:
	            # A timeout is mandatory here: without one a stalled connection
	            # would block the caller indefinitely.
	            response = requests.post(self.url, json=data, headers=headers, timeout=self.timeout)
	            if response.status_code == 200:
	                return base64.b64encode(response.content).decode('utf-8')
	            print(f"Segmind API Error: {response.status_code} - {response.text}")
	            return None
	        except Exception as e:
	            # Best-effort step: image generation must never abort the caller.
	            print(f"Error calling Segmind API: {e}")
	            return None


	# --- The Orchestrator ---
	class AgenticNegotiator:
	    """Runs the agents in a fixed order and records every step in a shared state."""

	    def __init__(self, invention_disclosure: str):
	        """Create a fresh state for ``invention_disclosure`` and instantiate all agents."""
	        self.state = NegotiationState(invention_disclosure=invention_disclosure)
	        self.agents = {
	            "Prior Art Detective": PriorArtDetective(),
	            "Chief Strategist": ChiefStrategistAgent(),
	            "Technical Writer": TechnicalWriterAgent(),
	            "Claims Drafter": ClaimsDrafterAgent(),
	            "Figure Drafter": FigureDrafterAgent(),
	            "Conceptual Artist": SegmindIdeogramAgent(),
	        }

	    def _update_transcript(self, agent_name: str, message: str, data: Optional[Dict] = None):
	        """Append one transcript entry; a missing or empty ``data`` is stored as ``{}``."""
	        self.state.negotiation_transcript.append(
	            {"agent": agent_name, "message": message, "data": data or {}}
	        )

	    def run_negotiation(self) -> Generator[NegotiationState, None, None]:
	        """Drive the workflow, yielding the (same, mutated) state after every transcript entry.

	        The state is yielded once after each agent announces its step and
	        once after the step's result has been stored, so a consumer can
	        render progress incrementally. If Gemini is unavailable a single
	        error entry is recorded, the state is yielded once, and the
	        generator ends.
	        """
	        # Step 0: Check for Gemini API Key
	        if not GEMINI_AVAILABLE:
	            self._update_transcript("System", "CRITICAL ERROR: `GEMINI_API_KEY` is not set. The agentic workflow cannot proceed. Please configure the environment variable.")
	            yield self.state
	            return

	        # Step 1: Prior Art Detective
	        agent_name = "Prior Art Detective"
	        self._update_transcript(agent_name, "Analyzing the invention to understand the technical landscape...")
	        yield self.state

	        prior_art_result = self.agents[agent_name].analyze(self.state.invention_disclosure)
	        self.state.prior_art_analysis = prior_art_result
	        self.state.key_concepts = prior_art_result.get("key_concepts", [])
	        self._update_transcript(agent_name, f"Analysis complete. The landscape appears to be: {prior_art_result.get('landscape_summary', 'N/A')}", prior_art_result)
	        yield self.state

	        # Step 2: Chief Strategist
	        agent_name = "Chief Strategist"
	        self._update_transcript(agent_name, "Reviewing prior art to determine the most defensible patenting strategy...")
	        yield self.state

	        mandate = self.agents[agent_name].formulate_strategy(self.state.invention_disclosure, self.state.prior_art_analysis)
	        self.state.strategic_mandate = mandate
	        self._update_transcript(agent_name, f"Strategy formulated. All agents will now adhere to the following mandate: {mandate}")
	        yield self.state

	        # Step 3: Guided Content Generation
	        # Each row: agent, opening message, agent method, state field that
	        # receives the result, closing message. All three methods take
	        # (invention_disclosure, strategic_mandate).
	        guided_steps = (
	            (
	                "Technical Writer",
	                "Acknowledged. Drafting the technical summary to align with the strategic mandate.",
	                "write_summary",
	                "technical_summary",
	                "Technical summary drafted.",
	            ),
	            (
	                "Claims Drafter",
	                "Understood. Drafting patent claims focused on the mandated novel aspect.",
	                "draft_claims",
	                "patent_claims",
	                "Patent claims drafted.",
	            ),
	            (
	                "Figure Drafter",
	                "Affirmative. Designing a technical figure that visually represents the core strategic mandate.",
	                "describe_figure",
	                "figure_description",
	                "Technical figure description and LaTeX code generated.",
	            ),
	        )
	        for agent_name, opening, method_name, target_field, closing in guided_steps:
	            self._update_transcript(agent_name, opening)
	            yield self.state
	            drafted = getattr(self.agents[agent_name], method_name)(
	                self.state.invention_disclosure, self.state.strategic_mandate
	            )
	            setattr(self.state, target_field, drafted)
	            self._update_transcript(agent_name, closing)
	            yield self.state

	        # Conceptual Image (Ideogram)
	        agent_name = "Conceptual Artist"
	        self._update_transcript(agent_name, "Now generating a high-fidelity conceptual image based on the strategy...")
	        yield self.state
	        image_b64 = self.agents[agent_name].generate_image(self.state.technical_summary, self.state.strategic_mandate)
	        if image_b64:
	            self.state.ideogram_image_b64 = image_b64
	            outcome = "Conceptual image generated successfully."
	        else:
	            outcome = "Failed to generate conceptual image. The API may be unavailable or the key may be invalid."
	        self._update_transcript(agent_name, outcome)
	        yield self.state

	        self._update_transcript("AgenticNegotiator", "All tasks complete. The patent application is ready for assembly.")
	        yield self.state

	def test_agentic_negotiation():
	    """Run the whole workflow on a sample disclosure and print a turn-by-turn report.

	    Prints a notice and returns early when Gemini is not configured.
	    """
	    banner = "=" * 60
	    print("🤖 Testing True Agentic Workflow")
	    print(banner)

	    if not GEMINI_AVAILABLE:
	        print("\n❌ Cannot run test: GEMINI_API_KEY is not configured.")
	        return

	    test_invention = """
	My invention is a smart coffee mug that uses a novel phase-change material to keep coffee at a perfect temperature. It also has a mobile app that connects via Bluetooth to let the user set their preferred temperature. The key innovation is a machine learning algorithm that learns the user's drinking habits to pre-warm or cool the mug, optimizing energy use.
	"""

	    negotiator = AgenticNegotiator(invention_disclosure=test_invention)

	    # The generator yields after every transcript entry, so the newest entry
	    # is always the last one in the list.
	    final_state = None
	    for i, state in enumerate(negotiator.run_negotiation()):
	        final_state = state
	        last_message = state.negotiation_transcript[-1]
	        print(f"\n--- Turn {i+1} ---")
	        print(f"{last_message['agent']}: {last_message['message']}")

	    print("\n\n✅ Negotiation Complete!")
	    print(banner)
	    print(f"\nFinal Strategic Mandate:\n{final_state.strategic_mandate}")
	    print(f"\nGenerated Claims Preview:\n{final_state.patent_claims[:300]}...")
	    print(f"\nGenerated Figure Description Preview:\n{final_state.figure_description[:300]}...")
	    image_report = (
	        f"\nIdeogram Image: Generated successfully (Base64 data)"
	        if final_state.ideogram_image_b64
	        else f"\nIdeogram Image: Failed to generate."
	    )
	    print(image_report)

	# Script entry point: run the demo workflow only when executed directly,
	# never as a side effect of importing this module.
	if __name__ == "__main__":
	    test_agentic_negotiation()