# services/agent_chat.py
import os
import re
import json
from typing import Dict, List, Any, Optional

import yaml
from smolagents import LiteLLMModel, tool, ToolCallingAgent
from smolagents.mcp_client import MCPClient as SmolMCPClient
from gradio_client import Client as GradioClient

from config.constants import AVAILABLE_MODELS_BY_PROVIDER
from services.db import save_analysis_report

MCP_SERVER_URL = os.getenv("MCP_SERVER_URL", "https://mcp-1st-birthday-gitrepo-inspector-mcp.hf.space/")
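# The Space URL above can be overridden via the MCP_SERVER_URL environment variable,
# e.g. to point the tools at a locally running MCP server (illustrative value only):
#   export MCP_SERVER_URL=http://127.0.0.1:7860/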
# ===================================================================
# TOOLS WITH CORRECT DOCSTRINGS
# ===================================================================
@tool
def get_issue_status(issue_number: int, repo_url: str) -> Dict[str, Any]:
    """
    Retrieves the latest AI analysis report for a specific GitHub issue from the database.

    Args:
        issue_number (int): The GitHub issue number (e.g. 12345).
        repo_url (str): Full repository URL (e.g. "https://github.com/gradio-app/gradio").

    Returns:
        dict: Structured report with keys:
            - issue_number (int)
            - title (str)
            - verdict (str)
            - report (str) – clean text without HTML
            - action (dict or None)
            - model_used (str)
            - has_report (bool)
            - error (str, optional)
    """
    try:
        client = GradioClient(MCP_SERVER_URL)
        result = client.predict(repo_url, issue_number, api_name="/get_issue_report")

        # Normalize MCP response
        if isinstance(result, str):
            data = json.loads(result) if "{" in result else {"error": result}
        else:
            data = result if isinstance(result, dict) else {"error": str(result)}

        if data.get("error"):
            return {"error": data["error"], "has_report": False}

        # Remove HTML tags for easy LLM reading
        raw_body = data.get("report", "")
        clean_body = re.sub(r'<[^>]+>', '', raw_body).strip()

        return {
            "issue_number": int(data.get("issue", issue_number)),
            "title": data.get("title", "No title"),
            "verdict": data.get("verdict", "Pending Analysis"),
            "report": clean_body,
            "action": data.get("action"),
            "model_used": data.get("llm_model", "unknown"),
            "has_report": True
        }
    except Exception as e:
        return {"error": str(e), "has_report": False}
@tool
def search_issues(
    repo_url: str,
    query: str = "",
    verdict: Optional[str] = None,
    author: Optional[str] = None,
    limit: int = 8
) -> List[Dict[str, Any]]:
    """
    Searches for GitHub issues matching the given criteria.

    Args:
        repo_url (str): Full repository URL.
        query (str, optional): Text to search in title/body.
        verdict (str, optional): AI verdict filter ("resolved", "duplicate", "unresolved", etc.).
        author (str, optional): GitHub username of the issue author.
        limit (int, optional): Maximum number of results (default: 8).

    Returns:
        list[dict]: List of issues, each containing:
            - issue_number (int)
            - title (str)
            - author (str)
            - verdict (str)
            - snippet (str)
    """
    try:
        client = GradioClient(MCP_SERVER_URL)
        result = client.predict(
            repo_url, query, None, "open", verdict, author, limit,
            api_name="/search_issues"
        )

        if isinstance(result, str):
            data = json.loads(result) if ("[" in result or "{" in result) else []
        else:
            data = result if isinstance(result, list) else []

        return [
            {
                "issue_number": item.get("id"),
                "title": item.get("title", "No title"),
                "author": item.get("author", "unknown"),
                "verdict": item.get("verdict", "pending"),
                "snippet": (item.get("snippet") or "")[:150].replace("\n", " ")
            }
            for item in data
        ]
    except Exception as e:
        return [{"error": str(e)}]
@tool
def trigger_live_analysis(
    issue_number: int,
    repo_url: str,
    provider: str = "gemini",
    model: Optional[str] = None,
    github_token: Optional[str] = None
) -> str:
    """
    Forces a brand-new AI analysis of an issue, ignoring any cached data.
    Use ONLY when the user explicitly asks to re-analyze (e.g. says "now", "again", etc.).

    Args:
        issue_number (int): The GitHub issue number.
        repo_url (str): Full repository URL.
        provider (str, optional): AI provider ("gemini", "openai", "nebius", "sambanova").
        model (str, optional): Specific model name. If None, uses the first model of the provider.
        github_token (str, optional): GitHub token for private repos.

    Returns:
        str: Confirmation message or error.
    """
    try:
        if not model:
            model = AVAILABLE_MODELS_BY_PROVIDER.get(provider.lower(), ["gemini-2.0-flash"])[0]

        client = GradioClient(MCP_SERVER_URL)
        result = client.predict(
            repo_url, int(issue_number), provider, model, github_token, None,
            api_name="/analyze_github_issue"
        )
        html_report, thought = result[0], result[1]

        # Detect the verdict to save in the database.
        # Check "Possibly Resolved" before "Resolved", since the latter is a substring of the former.
        verdict = "unresolved"
        if "Possibly Resolved" in html_report:
            verdict = "possibly_resolved"
        elif "Resolved" in html_report:
            verdict = "resolved"
        elif "Duplicate" in html_report:
            verdict = "duplicate"

        save_analysis_report(
            repo_url=repo_url,
            issue_number=issue_number,
            provider=provider,
            model=model,
            verdict=verdict,
            body=html_report,
            thought=thought
        )
        return f"Live analysis completed using {provider} ({model}). Report updated!"
    except Exception as e:
        return f"Live analysis failed: {str(e)}"
# ===================================================================
# AGENT FACTORY
# ===================================================================
def create_dashboard_agent(gemini_api_key: str) -> ToolCallingAgent:
    print("Initializing GitRepo Inspector Agent...")

    model = LiteLLMModel(
        model_id="gemini/gemini-2.5-flash",
        temperature=0.1,
        max_tokens=2048,
        api_key=gemini_api_key
    )

    # Load the agent prompt templates from the YAML config
    yaml_path = os.path.join(os.path.dirname(__file__), "../config/gitrepo_agent_prompt.yaml")
    with open(yaml_path, "r", encoding="utf-8") as f:
        prompt_templates = yaml.safe_load(f)

    # Automatically discovered MCP tools (keeps web_search, etc.), excluding the ones
    # re-implemented above with richer docstrings
    sse_url = f"{MCP_SERVER_URL.rstrip('/')}/gradio_api/mcp/sse"
    mcp_client = SmolMCPClient({"url": sse_url, "transport": "sse"})
    auto_tools = [
        t for t in mcp_client.get_tools()
        if t.name not in {"analyze_github_issue", "get_issue_report", "search_issues"}
    ]
    my_tools = [get_issue_status, search_issues, trigger_live_analysis]

    agent = ToolCallingAgent(
        tools=auto_tools + my_tools,
        model=model,
        prompt_templates=prompt_templates,
        max_steps=12,
        planning_interval=4
    )
    print("GitRepo Inspector Agent ready!")
    return agent
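
if __name__ == "__main__":
    # Minimal smoke test, a sketch only: it assumes a Gemini API key is available in the
    # GEMINI_API_KEY environment variable (the variable name is an assumption of this example)
    # and that the MCP Space is reachable. The question and issue number are hypothetical.
    demo_agent = create_dashboard_agent(os.getenv("GEMINI_API_KEY"))
    answer = demo_agent.run(
        "What is the latest analysis verdict for issue 12345 in "
        "https://github.com/gradio-app/gradio?"
    )
    print(answer)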