Spaces:

Shujah239
/

emotion-detection-app-server

Running

App Files Files Community

Shujah239 committed on 1 day ago

Commit

31c7755

verified ·

1 Parent(s): f5a7a9e

Upload 3 files

Browse files

Files changed (3) hide show

README.md +62 -12
app.py +279 -0
requirements.txt +10 -0

README.md CHANGED Viewed

@@ -1,12 +1,62 @@
----
-title: Emotion Detection App Server
-emoji: 🦀
-colorFrom: gray
-colorTo: pink
-sdk: docker
-pinned: false
-license: mit
-short_description: an app server to analyze emotions in sound using .wav
----
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

+# Audio Emotion Detection API
+This application provides an API for detecting emotions in audio files using a wav2vec2 model fine-tuned for emotion recognition.
+## Features
+- Upload audio files for emotion analysis
+- List all uploaded recordings
+- Download previously uploaded recordings
+- Analyze existing recordings
+- Delete recordings
+## API Endpoints
+- `GET /health` - Health check endpoint
+- `POST /upload` - Upload and analyze an audio file
+- `GET /recordings` - List all uploaded recordings
+- `GET /recordings/{filename}` - Download a specific recording
+- `GET /analyze/{filename}` - Analyze an existing recording
+- `DELETE /recordings/{filename}` - Delete a recording
+## Supported Audio Formats
+- WAV
+- MP3
+- OGG
+- FLAC
+## File Size Limits
+Maximum file size: 10MB
+## Usage Example
+```python
+import requests
+# Upload and analyze an audio file
+with open('your_audio.wav', 'rb') as f:
+    files = {'file': f}
+    response = requests.post('https://your-space-url.hf.space/upload', files=files)
+    print(response.json())
+```
+## Technical Details
+- Based on FastAPI
+- Uses the `superb/wav2vec2-base-superb-er` model from the Hugging Face Hub for emotion recognition
+- Optimized for Hugging Face Spaces deployment
+- Automatic file cleanup to manage storage limits
+## Storage Management
+Files are automatically cleaned up after 24 hours to manage storage limits on Hugging Face Spaces.
+## Development
+To run this API locally:
+1. Install dependencies: `pip install -r requirements.txt`
+2. Run the server: `python app.py`
+3. Access the Swagger documentation at `http://localhost:7860/docs`

app.py ADDED Viewed

	@@ -0,0 +1,279 @@

+import shutil
+import logging
+import time
+from pathlib import Path
+from typing import List, Dict, Any, Optional
+from fastapi import FastAPI, HTTPException, UploadFile, File, BackgroundTasks, Request
+from fastapi.responses import FileResponse
+from fastapi.middleware.cors import CORSMiddleware
+from fastapi.middleware.gzip import GZipMiddleware
+from transformers import pipeline
+import torch
+import uvicorn
+# Configure logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+# Define uploads directory
+UPLOAD_DIR = Path("uploads")
+MAX_STORAGE_MB = 100  # Maximum storage in MB
+MAX_FILE_AGE_DAYS = 1  # Maximum age of files in days
+app = FastAPI(
+    title="Emotion Detection API",
+    description="Audio emotion detection using wav2vec2",
+    version="1.0.0",
+)
+# Add middleware
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=True,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+app.add_middleware(GZipMiddleware, minimum_size=1000)
+# Preloaded classifier (global)
+classifier = None
+@app.on_event("startup")
+async def load_model():
+    """
+    Load the pretrained Wav2Vec2 emotion recognition model at startup
+    and ensure the upload directory exists.
+    """
+    global classifier
+    try:
+        # Use GPU if available, else CPU
+        device = 0 if torch.cuda.is_available() else -1
+        # For Hugging Face Spaces with limited resources, use quantized model if on CPU
+        if device == -1:
+            logger.info("Loading quantized model for CPU usage")
+            classifier = pipeline(
+                "audio-classification",
+                model="superb/wav2vec2-base-superb-er",
+                device=device,
+                torch_dtype=torch.float16  # Use half precision
+            )
+        else:
+            classifier = pipeline(
+                "audio-classification",
+                model="superb/wav2vec2-base-superb-er",
+                device=device
+            )
+        logger.info("Loaded emotion recognition model (device=%s)",
+                    "GPU" if device == 0 else "CPU")
+    except Exception as e:
+        logger.error("Failed to load model: %s", e)
+        raise
+    # Ensure the upload directory exists
+    try:
+        UPLOAD_DIR.mkdir(parents=True, exist_ok=True)
+        # Clean up old files at startup
+        await cleanup_old_files()
+    except Exception as e:
+        logger.error("Failed to create upload directory: %s", e)
+        raise
+async def cleanup_old_files():
+    """Clean up old files to prevent storage issues on Hugging Face Spaces."""
+    try:
+        # Remove files older than MAX_FILE_AGE_DAYS
+        now = time.time()
+        deleted_count = 0
+        for file_path in UPLOAD_DIR.iterdir():
+            if file_path.is_file():
+                file_age_days = (now - file_path.stat().st_mtime) / (60 * 60 * 24)
+                if file_age_days > MAX_FILE_AGE_DAYS:
+                    file_path.unlink()
+                    deleted_count += 1
+        if deleted_count > 0:
+            logger.info(f"Cleaned up {deleted_count} old files")
+    except Exception as e:
+        logger.error(f"Error during file cleanup: {e}")
+@app.middleware("http")
+async def add_process_time_header(request: Request, call_next):
+    """Add X-Process-Time header to responses."""
+    start_time = time.time()
+    response = await call_next(request)
+    process_time = time.time() - start_time
+    response.headers["X-Process-Time"] = str(process_time)
+    return response
+@app.get("/health")
+async def health():
+    """Health check endpoint."""
+    return {"status": "ok", "model_loaded": classifier is not None}
+@app.post("/upload")
+async def upload_audio(
+    file: UploadFile = File(...),
+    background_tasks: BackgroundTasks = None
+):
+    """
+    Upload an audio file and analyze emotions.
+    Saves the file to the uploads directory and returns model predictions.
+    """
+    if not classifier:
+        raise HTTPException(status_code=503, detail="Model not yet loaded")
+    filename = Path(file.filename).name
+    if not filename:
+        raise HTTPException(status_code=400, detail="Invalid filename")
+    # Check file extension
+    valid_extensions = [".wav", ".mp3", ".ogg", ".flac"]
+    if not any(filename.lower().endswith(ext) for ext in valid_extensions):
+        raise HTTPException(
+            status_code=400,
+            detail=f"Invalid file type. Supported types: {', '.join(valid_extensions)}"
+        )
+    # Read file contents
+    try:
+        contents = await file.read()
+    except Exception as e:
+        logger.error("Error reading file %s: %s", filename, e)
+        raise HTTPException(status_code=500, detail=f"Failed to read file: {str(e)}")
+    finally:
+        await file.close()
+    # Check file size (limit to 10MB for Spaces)
+    if len(contents) > 10 * 1024 * 1024:
+        raise HTTPException(
+            status_code=413,
+            detail="File too large. Maximum size is 10MB"
+        )
+    # Check available disk space
+    try:
+        total, used, free = shutil.disk_usage(UPLOAD_DIR)
+        free_mb = free / (1024 * 1024)
+        if free_mb < 10:  # Keep at least 10MB free
+            # Schedule cleanup in background
+            if background_tasks:
+                background_tasks.add_task(cleanup_old_files)
+            if len(contents) > free:
+                logger.error(
+                    "Insufficient storage: needed %d bytes, free %d bytes",
+                    len(contents), free
+                )
+                raise HTTPException(status_code=507, detail="Insufficient storage to save file")
+    except Exception as e:
+        logger.warning(f"Failed to check disk usage: {e}")
+    # Save file to uploads directory
+    file_path = UPLOAD_DIR / filename
+    try:
+        with open(file_path, "wb") as f:
+            f.write(contents)
+        logger.info("Saved uploaded file: %s", file_path)
+    except Exception as e:
+        logger.error("Failed to save file %s: %s", filename, e)
+        raise HTTPException(status_code=500, detail=f"Failed to save file: {str(e)}")
+    # Analyze the audio file using the pretrained model pipeline
+    try:
+        results = classifier(str(file_path))
+        # Schedule cleanup in background
+        if background_tasks:
+            background_tasks.add_task(cleanup_old_files)
+        return {"filename": filename, "predictions": results}
+    except Exception as e:
+        logger.error("Model inference failed for %s: %s", filename, e)
+        # Try to remove the file if inference fails
+        try:
+            file_path.unlink(missing_ok=True)
+        except Exception:
+            pass
+        raise HTTPException(status_code=500, detail=f"Emotion detection failed: {str(e)}")
+@app.get("/recordings")
+async def list_recordings():
+    """
+    List all uploaded recordings.
+    Returns a JSON list of filenames in the uploads directory.
+    """
+    try:
+        files = [f.name for f in UPLOAD_DIR.iterdir() if f.is_file()]
+        total, used, free = shutil.disk_usage(UPLOAD_DIR)
+        storage_info = {
+            "total_mb": total / (1024 * 1024),
+            "used_mb": used / (1024 * 1024),
+            "free_mb": free / (1024 * 1024)
+        }
+        return {"recordings": files, "storage": storage_info}
+    except Exception as e:
+        logger.error("Could not list files: %s", e)
+        raise HTTPException(status_code=500, detail=f"Failed to list recordings: {str(e)}")
+@app.get("/recordings/{filename}")
+async def get_recording(filename: str):
+    """
+    Stream/download an audio file from the server.
+    """
+    safe_name = Path(filename).name
+    file_path = UPLOAD_DIR / safe_name
+    if not file_path.exists() or not file_path.is_file():
+        raise HTTPException(status_code=404, detail="Recording not found")
+    # Guess MIME type (fallback to octet-stream)
+    import mimetypes
+    media_type, _ = mimetypes.guess_type(file_path)
+    return FileResponse(
+        file_path,
+        media_type=media_type or "application/octet-stream",
+        filename=safe_name
+    )
+@app.get("/analyze/{filename}")
+async def analyze_recording(filename: str):
+    """
+    Analyze an already-uploaded recording by filename.
+    Returns emotion predictions for the given file.
+    """
+    if not classifier:
+        raise HTTPException(status_code=503, detail="Model not yet loaded")
+    safe_name = Path(filename).name
+    file_path = UPLOAD_DIR / safe_name
+    if not file_path.exists() or not file_path.is_file():
+        raise HTTPException(status_code=404, detail="Recording not found")
+    try:
+        results = classifier(str(file_path))
+    except Exception as e:
+        logger.error("Model inference failed for %s: %s", filename, e)
+        raise HTTPException(status_code=500, detail=f"Emotion detection failed: {str(e)}")
+    return {"filename": safe_name, "predictions": results}
+@app.delete("/recordings/{filename}")
+async def delete_recording(filename: str):
+    """
+    Delete a recording by filename.
+    """
+    safe_name = Path(filename).name
+    file_path = UPLOAD_DIR / safe_name
+    if not file_path.exists() or not file_path.is_file():
+        raise HTTPException(status_code=404, detail="Recording not found")
+    try:
+        file_path.unlink()
+        return {"status": "success", "message": f"Deleted {safe_name}"}
+    except Exception as e:
+        logger.error("Failed to delete file %s: %s", filename, e)
+        raise HTTPException(status_code=500, detail=f"Failed to delete file: {str(e)}")
+if __name__ == "__main__":
+    # Bind to 0.0.0.0:7860 for Hugging Face Spaces compatibility
+    uvicorn.run(app, host="0.0.0.0", port=7860)

requirements.txt ADDED Viewed

	@@ -0,0 +1,10 @@

+fastapi>=0.95.1,<0.96.0
+uvicorn>=0.22.0,<0.23.0
+transformers>=4.28.1,<4.29.0
+torch>=2.0.0,<2.1.0
+librosa>=0.10.0,<0.11.0
+soundfile>=0.12.1,<0.13.0
+python-multipart>=0.0.6,<0.0.7
+numpy>=1.24.3,<1.25.0
+tqdm>=4.65.0,<4.66.0
+pydantic>=1.10.7,<1.11.0