First_agent_template

Running

App Files Files Community

oort committed on Feb 13

Commit

65367f3

verified ·

1 Parent(s): 49f2138

Add Flux prompt generation tool

Browse files

Files changed (1) hide show

app.py +55 -1

app.py CHANGED Viewed

@@ -33,6 +33,60 @@ def get_current_time_in_timezone(timezone: str) -> str:
     except Exception as e:
         return f"Error fetching time for timezone '{timezone}': {str(e)}"
 final_answer = FinalAnswerTool()
@@ -55,7 +109,7 @@ with open("prompts.yaml", 'r') as stream:
 agent = CodeAgent(
     model=model,
-    tools=[final_answer, get_current_time_in_timezone], ## add your tools here (don't remove final answer)
     max_steps=6,
     verbosity_level=1,
     grammar=None,

     except Exception as e:
         return f"Error fetching time for timezone '{timezone}': {str(e)}"
+@tool
+def llm_tool(user_prompt: str) -> str:
+    """Executes a prompt using a language model to create a detaled prompt
+    for image generation based on user_prompt.
+    Returns prompt for image_generation_tool.
+    Args:
+        user_prompt: The user's text prompt to be processed by the language model.
+    """
+    # Prompt parts
+    prefix="Generate a detailed and structured FLUX-Schnell-compatible prompt based on the following short description of an image: "
+    postfix="""
+    The generated prompt should follow these guidelines:
+	1.	Foreground, Middle Ground, and Background: Clearly describe elements in each layer of the image in an organized manner.
+	2.	Tone and Style: Specify the tone (e.g., cinematic, surreal, vibrant) and artistic style (e.g., photorealistic, painterly, abstract).
+	3.	Color Palette: Include details about the dominant colors or overall color scheme.
+	4.	Perspective and Camera Details: Mention the point of view (e.g., wide-angle, close-up), camera type, lens, aperture, and lighting conditions if applicable.
+	5.	Additional Details: Highlight any specific objects, text, or unique features with clear emphasis (e.g., ‘with green text’ or ‘emphasis on golden hour lighting’).
+	6.	Output Settings: Suggest aspect ratio, output format (e.g., PNG), quality level, and seed for reproducibility.
+    Ensure that the generated prompt is logical, descriptive, and written in natural language to maximize compatibility with FLUX-Schnell’s capabilities.”
+    Example Input:
+    'An image of a serene forest with a small cabin.'
+    Example Output:
+    '''
+    In the foreground, a lush green forest floor covered with moss and scattered wildflowers.
+    In the middle ground, a cozy wooden cabin with smoke gently rising from its chimney.
+    In the background, towering pine trees fading into a misty horizon.
+    The tone is tranquil and inviting, with a photorealistic style.
+    The color palette includes rich greens, warm browns for the cabin, and soft gray mist.
+    The perspective is slightly elevated as if viewed from a drone camera at sunrise,
+    capturing golden hour lighting for soft shadows and warm highlights.
+    The aspect ratio is 16:9 in PNG format with high quality (90), using seed 42 for reproducibility.
+    '''
+    """
+    model = HfApiModel(
+    max_tokens=200,
+    temperature=1.0,
+    model_id='Qwen/Qwen2.5-Coder-32B-Instruct',
+    custom_role_conversions=None,
+    )
+    prompt = prefix + user_prompt + '. ' + postfix
+    try:
+        response = model.generate(
+            prompt=prompt, temperature=1., max_tokens=200)
+        response = openai.Completion.create(
+            engine=model_name,  # Use 'engine' for older models, 'model' for newer
+            prompt=prompt
+        )
+        return response.choices[0].text.strip()
+    except Exception as e:
+        return f"Error during LLM call: {str(e)}"
 final_answer = FinalAnswerTool()
 agent = CodeAgent(
     model=model,
+    tools=[final_answer, llm_tool, image_generation_tool], ## add your tools here (don't remove final answer)
     max_steps=6,
     verbosity_level=1,
     grammar=None,