Spaces:

Ogero79
/

Threatscope_ai

Runtime error

App Files Files Community

Threatscope_ai / app.py

Ogero79

Update app.py

93c3afd verified 1 day ago

raw

history blame contribute delete

7.32 kB

	# app.py
	import gradio as gr
	import torch
	from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
	from peft import PeftModel
	import json
	import os

	# --- 1. Configuration ---
	# Hub repo id of the fine-tuned PEFT adapter; the tokenizer is loaded from this repo as well.
	adapter_model_name = "Ogero79/threatscope-cyberthreat-analyst"
	# Hub repo id of the base model that the adapter is applied to and merged into.
	base_model_name = "meta-llama/Meta-Llama-3-8B-Instruct"

	# --- 2. Model Loading ---
	print("--- Loading Model and Tokenizer ---")
	# Load the tokenizer from the adapter repo (not from the base model repo).
	tokenizer = AutoTokenizer.from_pretrained(adapter_model_name)

	# Load the base Llama 3 model.
	# float16 is used to reduce the memory footprint on the CPU Space.
	# device_map="auto" delegates device placement to accelerate; on a CPU-only
	# Space the whole model ends up on the CPU.
	base_model = AutoModelForCausalLM.from_pretrained(
	    base_model_name,
	    torch_dtype=torch.float16,
	    device_map="auto",
	    token=os.environ.get("HF_TOKEN"),  # Use the token from Space secrets
	)

	# Load the PEFT adapter and merge it into the base model for faster inference.
	model = PeftModel.from_pretrained(base_model, adapter_model_name)
	model = model.merge_and_unload()
	model.eval()

	# Create the text-generation pipeline.
	# Deliberately no `device` argument: the model was already placed by
	# accelerate through device_map="auto", and transformers refuses to build a
	# pipeline when an explicit device is combined with such a model. The
	# pipeline picks up the device the model already lives on.
	generator = pipeline(
	    "text-generation",
	    model=model,
	    tokenizer=tokenizer,
	    torch_dtype=torch.float16,
	)

	print("✅ Model and pipeline loaded successfully!")


	# --- 3. Inference Function (copied and adapted from your notebook) ---
	def generate_response(prompt_text, max_new_tokens=512, temperature=0.01):
	    """Analyze a free-text event description and return a structured threat report.

	    Args:
	        prompt_text: Text to analyze. ``None`` or whitespace-only input is
	            reported as a non-threat without invoking the model.
	        max_new_tokens: Maximum number of tokens the pipeline may generate.
	        temperature: Sampling temperature forwarded to the pipeline.

	    Returns:
	        A dict with the keys ``summary``, ``threat_type``, ``risk_score``,
	        ``risk_level``, ``suggested_defense``, ``iocs``, ``threat_actor`` and
	        ``geographical_scope``. Fields the model omitted or returned with the
	        wrong type are replaced by their safe default. Exceptions raised
	        during generation are caught and reported through ``summary``.
	    """
	    # Define the safe/default JSON structure for non-threats
	    safe_default_response = {
	        "summary": "No actionable cybersecurity threat detected",
	        "threat_type": "Non-Threat",
	        "risk_score": 0,
	        "risk_level": "None",
	        "suggested_defense": "No action required",
	        "iocs": [],
	        "threat_actor": "None",
	        "geographical_scope": "None"
	    }

	    # Nothing to analyze: answer right away instead of running the model.
	    if prompt_text is None or not str(prompt_text).strip():
	        return safe_default_response

	    messages = [
	        {
	            "role": "system",
	            "content": (
	                "You are an expert cybersecurity analyst. Analyze input and return JSON with these fields:\n"
	                "- summary: If input describes a threat, summarize it. Otherwise, state no threat detected\n"
	                "- threat_type: Threat category if valid, otherwise 'Non-Threat'\n"
	                "- risk_score: 0-100 (0 for non-threats)\n"
	                "- risk_level: Critical/High/Medium/Low/None\n"
	                "- suggested_defense: Recommendations or 'No action required'\n"
	                "- iocs: Empty list for non-threats\n"
	                "- threat_actor: 'None' for non-threats\n"
	                "- geographical_scope: 'None' for non-threats\n"
	                "For CLEAR non-threats (e.g., 'Hello', weather queries), return the safe default format immediately."
	            )
	        },
	        {
	            "role": "user",
	            "content": f"Analyze this input for cybersecurity threats: {prompt_text}\n"
	                       f"Return ONLY the JSON output with all fields populated."
	        }
	    ]

	    try:
	        prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
	        outputs = generator(
	            prompt,
	            max_new_tokens=max_new_tokens,
	            temperature=temperature,
	            top_p=0.9,
	            do_sample=True,
	            pad_token_id=tokenizer.eos_token_id,
	        )
	        generated_full_text = outputs[0]["generated_text"]
	        # Drop the leading prompt so only the model's completion remains.
	        response = generated_full_text[len(prompt):].strip()

	        # First try to find and parse JSON
	        try:
	            first_brace = response.find('{')
	            last_brace = response.rfind('}')
	            # Also covers "no closing brace" (-1) and a '}' that precedes the first '{'.
	            if first_brace == -1 or last_brace < first_brace:
	                raise ValueError("No JSON detected in response")

	            parsed_json = json.loads(response[first_brace:last_brace + 1])

	            # Validate required fields exist and carry the expected type
	            required_fields = {
	                'summary': str, 'threat_type': str, 'risk_score': int,
	                'risk_level': str, 'suggested_defense': str, 'iocs': list,
	                'threat_actor': str, 'geographical_scope': str
	            }

	            for field, field_type in required_fields.items():
	                value = parsed_json.get(field)
	                # A missing field yields None and fails the type check.
	                # bool is a subclass of int, so it is rejected explicitly
	                # to keep True/False out of risk_score.
	                if isinstance(value, bool) or not isinstance(value, field_type):
	                    parsed_json[field] = safe_default_response[field]

	            return parsed_json

	        except (json.JSONDecodeError, ValueError):
	            # If JSON parsing fails, analyze the raw response for threat indicators
	            threat_keywords = ["malware", "attack", "phishing", "breach", "exploit", "hack", "ransomware"]
	            lowered_response = response.lower()
	            if any(keyword in lowered_response for keyword in threat_keywords):
	                # If threat keywords found but JSON invalid, return error with the raw analysis
	                return {
	                    **safe_default_response,
	                    "summary": f"Potential threat detected but invalid format. Analyst review recommended. Raw response: {response[:200]}...",
	                    "threat_type": "Unknown (Format Error)",
	                    "risk_score": 50,
	                    "risk_level": "Medium"
	                }
	            # No threat keywords detected - return the default
	            return safe_default_response

	    except Exception as e:
	        # UI boundary: never let a failure escape to Gradio; report it in the
	        # safe format instead.
	        return {
	            **safe_default_response,
	            "summary": f"System error: {str(e)}. Default safe response returned",
	        }

	# --- 4. Gradio Interface ---
	# Centers the main column and caps its width.
	css = """
	#col-container {
	margin: 0 auto;
	max-width: 900px;
	}
	"""

	with gr.Blocks(css=css, theme=gr.themes.Soft()) as demo:
	    with gr.Column(elem_id="col-container"):
	        gr.Markdown(
	            """
	# 🤖 ThreatScope: AI Cybersecurity Analyst

	Enter a description of a potential security event below. The fine-tuned Llama 3 model will analyze it and return a structured JSON response with a risk assessment and suggested actions.

	Note: This is an 8B parameter model running on a CPU. The first inference may be slow, but subsequent ones will be faster.
	"""
	        )

	        with gr.Row():
	            prompt_input = gr.Textbox(
	                label="Enter Threat Description",
	                placeholder="e.g., Our DNS server is being flooded with requests from thousands of botnet IPs.",
	                lines=4
	            )

	        analyze_button = gr.Button("Analyze Threat")

	        output_json = gr.JSON(label="Analysis Result")

	        gr.Examples(
	            [
	                "A misconfigured cloud storage bucket exposed sensitive customer data online for months.",
	                "Urgent: Employee received a suspicious email with a malicious attachment claiming to be from HR.",
	                "An ex-employee's credentials were used to log into the main database at 2 AM.",
	                "What's the capital of France?",
	            ],
	            inputs=prompt_input,
	            outputs=output_json,
	            fn=generate_response,
	            # Gradio caches example outputs by default on Hugging Face Spaces
	            # when fn/outputs are supplied, which would run the CPU-bound
	            # model on every example during startup. Disable that explicitly;
	            # clicking an example only fills in the textbox.
	            cache_examples=False,
	        )

	        # Run the analysis when the button is pressed and show the result as JSON.
	        analyze_button.click(
	            fn=generate_response,
	            inputs=prompt_input,
	            outputs=output_json
	        )

	demo.launch()