Spaces:

Athspi-aitools
/

Aittsg

Running

App Files Files Community

Aittsg / app.py

Athspi

Update app.py

22004d7 verified about 2 months ago

raw

history blame contribute delete

6.78 kB

	# main.py
	from fastapi import FastAPI, Query, HTTPException
	from fastapi.responses import FileResponse
	from gtts import gTTS, gTTSError # Import gTTSError for specific error handling
	import uuid
	import os # Import os module for path operations
	import tempfile # Import tempfile for better temporary file handling

	# --- Configuration ---
	# Use tempfile to get a cross-platform temporary directory
	TEMP_DIR = tempfile.gettempdir()
	# Ensure the temporary directory exists
	os.makedirs(TEMP_DIR, exist_ok=True)

	# --- FastAPI App Initialization ---
	app = FastAPI(
	title="gTTS API",
	description="A simple API to convert text to speech using Google Text-to-Speech (gTTS). Supports multiple languages including Tamil, Sinhala, and many others.",
	version="1.2.0", # Increment version for documentation changes
	)

	# --- API Endpoints ---

	@app.get("/", tags=["General"])
	def read_root():
	"""
	Root endpoint providing a welcome message.
	"""
	return {"message": "Welcome to the gTTS API. Use the /tts endpoint to generate speech."}

	@app.get("/tts", tags=["Text-to-Speech"])
	def text_to_speech(
	text: str = Query(
	..., # Ellipsis makes the parameter required
	min_length=1,
	max_length=500, # Adjust max length as needed
	title="Text to Convert",
	description="The text you want to convert into speech (1-500 characters)."
	),
	lang: str = Query(
	"en", # Default language is English
	min_length=2,
	max_length=10, # Allow for language codes like 'en-us', 'zh-CN' etc.
	title="Language Code",
	description="The BCP 47 language code for the speech synthesis (e.g., 'en', 'es', 'ta', 'si', 'ja', 'zh-CN'). See gTTS documentation for supported languages."
	)
	):
	"""
	Converts the provided text into an MP3 audio file using the specified language.

	- text: The text to synthesize (required).
	- lang: The language code (e.g., 'en', 'es', 'fr', 'ta', 'si'). Defaults to 'en'. Crucially, gTTS must support this language code.
	"""
	try:
	# Generate a unique filename in the configured temporary directory
	filename = os.path.join(TEMP_DIR, f"{uuid.uuid4().hex}.mp3")

	# Create gTTS object with text and language
	# Use slow=False for normal speed speech
	tts_object = gTTS(text=text, lang=lang, slow=False)

	# Save the audio file
	tts_object.save(filename)

	# Return the audio file as a response
	# The 'filename' parameter sets the download name for the browser
	return FileResponse(
	path=filename,
	media_type="audio/mpeg",
	filename=f"speech_{lang}.mp3" # Suggest a filename like speech_en.mp3 or speech_ta.mp3
	# Consider adding background task for cleanup as mentioned in previous examples
	)

	except gTTSError as e:
	# Handle specific gTTS errors (like invalid language code, network issues)
	detail_message = f"gTTS Error: {str(e)}. Ensure the language code '{lang}' is supported and text is appropriate for the language."
	# Check common error patterns
	if "400 (Bad Request)" in str(e) or "Language not supported" in str(e):
	raise HTTPException(status_code=400, detail=detail_message)
	elif "500 (Internal Server Error)" in str(e) or "Failed to connect" in str(e):
	# Treat these as potential temporary Google service issues
	raise HTTPException(status_code=503, detail=f"Service Error: {str(e)}. Could be a temporary issue with the TTS service.")
	else: # Other gTTS errors
	raise HTTPException(status_code=503, detail=detail_message) # 503 Service Unavailable likely

	except ValueError as e:
	# Potentially handle other value errors if gTTS raises them for certain inputs
	raise HTTPException(status_code=400, detail=f"Input Error: {str(e)}")

	except Exception as e:
	# Catch any other unexpected errors
	# Log the error for debugging
	# import logging
	# logging.exception(f"An unexpected error occurred during TTS generation for lang='{lang}'")
	raise HTTPException(status_code=500, detail=f"Internal Server Error: An unexpected error occurred.")

	# --- How to Run (Instructions) ---
	# 1. Save this code as `main.py`.
	# 2. Install necessary libraries:
	# pip install fastapi "uvicorn[standard]" gTTS
	# 3. Run the FastAPI server using Uvicorn:
	# uvicorn main:app --reload
	#
	# --- How to Use - Examples ---
	# Open your browser or use a tool like curl/Postman.
	# Access the TTS endpoint with the 'text' and 'lang' query parameters.
	# NOTE: Text containing non-ASCII characters needs to be URL-encoded. Most browsers do this automatically.
	#
	# - English (en - Default):
	# Text: "Hello, world!"
	# URL: http://127.0.0.1:8000/tts?text=Hello%2C%20world%21
	#
	# - Spanish (es):
	# Text: "Hola Mundo"
	# URL: http://127.0.0.1:8000/tts?text=Hola%20Mundo&lang=es
	#
	# - French (fr):
	# Text: "Bonjour le monde"
	# URL: http://127.0.0.1:8000/tts?text=Bonjour%20le%20monde&lang=fr
	#
	# - German (de):
	# Text: "Hallo Welt"
	# URL: http://127.0.0.1:8000/tts?text=Hallo%20Welt&lang=de
	#
	# - Tamil (ta):
	# Text: "வணக்கம் உலகம்"
	# URL: http://127.0.0.1:8000/tts?text=%E0%AE%B5%E0%AE%A3%E0%AE%95%E0%AF%8D%E0%AE%95%E0%AE%AE%E0%AF%8D%20%E0%AE%89%E0%AE%B2%E0%AE%95%E0%AE%AE%E0%AF%8D&lang=ta
	#
	# - Sinhala (si):
	# Text: "හෙලෝ ලෝකය"
	# URL: http://127.0.0.1:8000/tts?text=%E0%B7%84%E0%B7%99%E0%B6%BD%E0%B7%9D%20%E0%B6%BD%E0%B7%9D%E0%B6%9A%E0%B6%BA&lang=si
	#
	# - Japanese (ja):
	# Text: "こんにちは世界"
	# URL: http://127.0.0.1:8000/tts?text=%E3%81%93%E3%82%93%E3%81%AB%E3%81%A1%E3%81%AF%E4%B8%96%E7%95%8C&lang=ja
	#
	# - Chinese (Mandarin, Simplified) (zh-CN):
	# Text: "你好世界"
	# URL: http://127.0.0.1:8000/tts?text=%E4%BD%A0%E5%A5%BD%E4%B8%96%E7%95%8C&lang=zh-CN
	#
	# - Russian (ru):
	# Text: "Привет мир"
	# URL: http://127.0.0.1:8000/tts?text=%D0%9F%D1%80%D0%B8%D0%B2%D0%B5%D1%82%20%D0%BC%D0%B8%D1%80&lang=ru
	#
	# - Hindi (hi):
	# Text: "नमस्ते दुनिया"
	# URL: http://127.0.0.1:8000/tts?text=%E0%A4%A8%E0%A4%AE%E0%A4%B8%E0%A5%8D%E0%A4%A4%E0%A5%87%20%E0%A4%A6%E0%A5%81%E0%A4%A8%E0%A4%BF%E0%A4%AF%E0%A4%BE&lang=hi
	#
	# - Arabic (ar):
	# Text: "مرحبا بالعالم"
	# URL: http://127.0.0.1:8000/tts?text=%D9%85%D8%B1%D8%AD%D8%A8%D8%A7%20%D8%A8%D8%A7%D9%84%D8%B9%D8%A7%D9%84%D9%85&lang=ar
	#
	# Find more supported language codes in the gTTS documentation or common lists of BCP 47 codes.
	# The API will return an MP3 file download or playback depending on your browser/client.
	# If you provide an unsupported language code, you should get a 400 Bad Request error.