Whshhs / app.py
Athspi's picture
Update app.py
3fd0067 verified
raw
history blame
5.82 kB
import base64
import os
import gradio as gr
import requests
import markdownify
from google import genai
from google.genai import types
from urllib.robotparser import RobotFileParser
from urllib.parse import urlparse
# Configure browser tools
def can_crawl_url(url: str, user_agent: str = "*") -> bool:
"""Check robots.txt permissions for a URL"""
try:
parsed_url = urlparse(url)
robots_url = f"{parsed_url.scheme}://{parsed_url.netloc}/robots.txt"
rp = RobotFileParser(robots_url)
rp.read()
return rp.can_fetch(user_agent, url)
except Exception as e:
print(f"Error checking robots.txt: {e}")
return False
def load_page(url: str) -> str:
"""Load webpage content as markdown"""
if not can_crawl_url(url):
return f"URL {url} failed robots.txt check"
try:
response = requests.get(url, timeout=10)
return markdownify.markdownify(response.text)
except Exception as e:
return f"Error loading page: {str(e)}"
# Configure Gemini client
client = genai.Client(api_key=os.environ.get("GEMINI_API_KEY"))
MODEL = "gemini-2.0-flash"
TOOLS = [
types.Tool(
function_declarations=[
types.FunctionDeclaration(
name="load_page",
description="Load webpage content as markdown",
parameters={
"type": "object",
"properties": {
"url": {"type": "string", "description": "Full URL to load"}
},
"required": ["url"]
}
)
]
),
types.Tool(google_search=types.GoogleSearch()),
types.Tool(code_execution=types.ToolCodeExecution())
]
SYSTEM_INSTRUCTION = """You are an AI assistant with multiple capabilities:
1. Web browsing through search and direct page access
2. Code execution for calculations, simulations, and data analysis
3. File I/O operations for data processing
Use this decision tree:
- For factual questions: Use search
- For time-sensitive data: Use browser tool
- For math/data processing: Generate and execute code
- Always explain your reasoning"""
def format_code_response(parts):
"""Format code execution parts for Markdown display"""
formatted = []
for part in parts:
if part.text:
formatted.append(part.text)
if part.executable_code:
formatted.append(f"```python\n{part.executable_code.code}\n```")
if part.code_execution_result:
formatted.append(f"**Result**:\n{part.code_execution_result.output}")
if part.inline_data:
formatted.append(f"![Generated Image](data:image/png;base64,{base64.b64encode(part.inline_data.data).decode()})")
return "\n\n".join(formatted)
def generate_response(user_input):
full_response = ""
chat = client.chats.create(
model=MODEL,
config=types.GenerateContentConfig(
temperature=0.7,
tools=TOOLS,
system_instruction=SYSTEM_INSTRUCTION
)
)
# Initial request
response = chat.send_message(user_input)
# Process all response parts
response_parts = []
for part in response.candidates[0].content.parts:
response_parts.append(part)
full_response = format_code_response(response_parts)
yield full_response
# Handle function calls
if part.function_call:
fn = part.function_call
if fn.name == "load_page":
result = load_page(**fn.args)
chat.send_message(
types.Content(
parts=[
types.Part(
function_response=types.FunctionResponse(
name=fn.name,
id=fn.id,
response={"result": result}
)
)
]
)
)
# Get final response after tool execution
final_response = chat.send_message("")
for final_part in final_response.candidates[0].content.parts:
response_parts.append(final_part)
full_response = format_code_response(response_parts)
yield full_response
# Gradio Interface
with gr.Blocks(title="Gemini 2.0 AI Assistant") as demo:
gr.Markdown("# πŸš€ Gemini 2.0 AI Assistant")
gr.Markdown("Web Access β€’ Code Execution β€’ Data Analysis")
with gr.Row():
input_box = gr.Textbox(
label="Your Query",
placeholder="Ask anything or request code execution...",
lines=3,
max_lines=10,
autofocus=True
)
output_box = gr.Markdown(
label="Assistant Response",
elem_classes="markdown-output"
)
with gr.Row():
submit_btn = gr.Button("Submit", variant="primary")
clear_btn = gr.Button("Clear")
def clear():
return ["", ""]
submit_btn.click(
fn=generate_response,
inputs=input_box,
outputs=output_box,
queue=True
)
clear_btn.click(
fn=clear,
inputs=[],
outputs=[input_box, output_box]
)
if __name__ == "__main__":
demo.launch(
server_name="0.0.0.0",
server_port=7860,
css="""
.markdown-output {
padding: 20px;
border-radius: 5px;
background: #f9f9f9;
}
.markdown-output code {
background: #f3f3f3;
padding: 2px 5px;
border-radius: 3px;
}
"""
)