First_agent / app.py
lchumaceiro's picture
Update app.py
303aa30 verified
from smolagents import CodeAgent, DuckDuckGoSearchTool, HfApiModel, load_tool, tool
import datetime
import requests
import pytz
import yaml
import time
from tools.final_answer import FinalAnswerTool
from huggingface_hub import InferenceClient
from pydub.generators import WhiteNoise
from pydub import AudioSegment
import gradio as gr
from Gradio_UI import GradioUI
import os
from huggingface_hub import login
hf_token = os.getenv("HF_TOKEN") # Fetch secret from Hugging Face Space
if hf_token:
login(hf_token)
else:
print("⚠️ Hugging Face API token is missing! Set HF_TOKEN in Space secrets.")
# Sound generation tool
@tool
def generate_sound(sound_type: str, duration: int) -> str:
"""Generates a simple sound based on the specified type and duration.
Args:
sound_type: Type of sound to generate (e.g., 'rain', 'car', 'white_noise').
duration: Duration of the sound in seconds.
Returns:
Path to the generated audio file.
"""
try:
duration_ms = duration * 1000 # Convert to milliseconds
if sound_type == "rain":
sound = WhiteNoise().to_audio_segment(duration=duration_ms).low_pass_filter(5000)
else:
return f"Unsupported sound type: {sound_type}"
output_path = f"/tmp/{sound_type}_{duration}s.wav"
sound.export(output_path, format="wav")
return output_path
except Exception as e:
return f"Error generating sound: {str(e)}"
# Time zone tool
@tool
def get_current_time_in_timezone(timezone: str) -> str:
"""A tool that fetches the current local time in a specified timezone.
Args:
timezone: A string representing a valid timezone (e.g., 'America/New_York').
"""
try:
tz = pytz.timezone(timezone)
local_time = datetime.datetime.now(tz).strftime("%Y-%m-%d %H:%M:%S")
return f"The current local time in {timezone} is: {local_time}"
except Exception as e:
return f"Error fetching time for timezone '{timezone}': {str(e)}"
final_answer = FinalAnswerTool()
model = HfApiModel(
max_tokens=2096,
temperature=0.5,
model_id='Qwen/Qwen2.5-Coder-32B-Instruct',
custom_role_conversions=None,
token= hf_token
)
image_generation_tool = load_tool("agents-course/text-to-image", trust_remote_code=True)
with open("prompts.yaml", 'r') as stream:
prompt_templates = yaml.safe_load(stream)
agent = CodeAgent(
model=model,
tools=[final_answer, generate_sound], # Add your tool
max_steps=6,
verbosity_level=1,
grammar=None,
planning_interval=None,
name=None,
description=None,
prompt_templates=prompt_templates
)
# Start the UI with processing time display
def launch_with_processing_time():
def wrapped_launch():
start_time = time.time()
print("Processing request...")
# Define a simple Gradio UI
def generate_and_return_file(sound_type, duration):
file_path = generate_sound(sound_type, duration)
return file_path # Return the file for download
interface = gr.Interface(
fn=generate_and_return_file,
inputs=[gr.Textbox(label="Sound Type"), gr.Number(label="Duration (seconds)")],
outputs=gr.File(label="Download Sound File"),
)
interface.launch()
end_time = time.time()
print(f"Processing completed in {end_time - start_time:.2f} seconds")
wrapped_launch()
launch_with_processing_time()