Spaces:

ParthSadaria
/

lokiai

Running

File size: 3,703 Bytes

4986fe4
 
ef215d3
7c60ac5
378f2c3
8834a20
378f2c3
4986fe4
 
 
378f2c3
 
4986fe4
 
 
 
 
 
 
e2e24f9
378f2c3
 
 
 
 
7c60ac5
7ef5d89
7c60ac5
 
 
 
 
 
 
 
4986fe4
7c60ac5
4986fe4
7c60ac5
 
 
 
 
 
e2e24f9
7c60ac5
 
 
 
 
 
7ef5d89
a68045e
 
 
8834a20
 
e2e24f9
8834a20
 
 
 
7ef5d89
045bd95
ef215d3
 
378f2c3
045bd95
378f2c3
045bd95
378f2c3
9d35223
 
045bd95
114ca84
8834a20
 
 
 
 
114ca84
 
 
8834a20
 
045bd95
 
 
378f2c3
4116ca1
7ef5d89
 
 
 
 
045bd95
6a84e5c
 
 
 
a68045e

import json
import os

import httpx
from dotenv import load_dotenv
from fastapi import FastAPI, HTTPException, Request
from fastapi.responses import StreamingResponse, HTMLResponse
from pydantic import BaseModel

# Load environment variables from .env file
load_dotenv()

app = FastAPI()

# Accepted client API keys, read from the comma-separated API_KEYS variable.
# Whitespace around each key is stripped and empty entries are dropped, so
# "a, b," yields ["a", "b"] instead of ["a", " b", ""].
api_keys_str = os.getenv('API_KEYS')
valid_api_keys = (
    [key.strip() for key in api_keys_str.split(',') if key.strip()]
    if api_keys_str
    else []
)

# Upstream API endpoint that incoming requests are forwarded to
secret_api_endpoint = os.getenv('SECRET_API_ENDPOINT')

# Fail fast when the endpoint is missing. This runs at import time, outside
# any request, so a plain RuntimeError is used rather than an HTTPException
# (which is only meaningful while handling an HTTP request).
if not secret_api_endpoint:
    raise RuntimeError("API endpoint is not configured in environment variables.")

# Request body accepted by POST /v1/chat/completions.
# Only the two fields declared here are validated and forwarded upstream.
class Payload(BaseModel):
    # Name of the model to use for the completion
    model: str
    # Conversation messages; element structure is not validated here
    messages: list

@app.get("/", response_class=HTMLResponse)
async def root():
    """Serve the static HTML landing page.

    Returns:
        HTMLResponse: a small welcome page that points visitors to the
        model-listing route and the author's GitHub profile.
    """
    # The page refers to /v1/models, which is the model-listing route
    # actually registered by this application.
    html_content = """
    <!DOCTYPE html>
    <html lang="en">
    <head>
        <meta charset="UTF-8">
        <meta name="viewport" content="width=device-width, initial-scale=1.0">
        <title>Loki.AI API</title>
        <style>
            body { font-family: Arial, sans-serif; text-align: center; margin-top: 50px; background-color: #121212; color: white; }
            h1 { color: #4CAF50; }
            a { color: #BB86FC; text-decoration: none; }
            a:hover { text-decoration: underline; }
        </style>
    </head>
    <body>
        <h1>Welcome to Loki.AI API!</h1>
        <p>Created by Parth Sadaria</p>
        <p>Go to /v1/models for more info</p>
        <p>Check out the GitHub for more projects:</p>
        <a href="https://github.com/ParthSadaria" target="_blank">github.com/ParthSadaria</a>
    </body>
    </html>
    """
    return HTMLResponse(content=html_content)

# Model listing is fetched from the upstream API on every call (no caching)
@app.get("/v1/models")
async def get_models():
    """Proxy the upstream ``/v1/models`` listing.

    Returns:
        The decoded JSON body of the upstream response.

    Raises:
        HTTPException: with the upstream status code when the upstream
            answers with a 4xx/5xx status; with status 502 when the upstream
            body is not valid JSON; with status 500 when the request itself
            fails (connection error, timeout, ...).
    """
    async with httpx.AsyncClient() as client:
        try:
            response = await client.get(f"{secret_api_endpoint}/v1/models", timeout=3)
            response.raise_for_status()
            return response.json()
        except httpx.HTTPStatusError as e:
            # raise_for_status() raises HTTPStatusError, which is NOT a
            # RequestError, so it needs its own handler. The exception text
            # contains the upstream URL, so only the status code is exposed.
            raise HTTPException(
                status_code=e.response.status_code,
                detail=f"Upstream API returned HTTP {e.response.status_code}",
            ) from e
        except httpx.RequestError as e:
            raise HTTPException(status_code=500, detail=f"Request failed: {e}") from e
        except ValueError as e:
            # response.json() raises a ValueError subclass on a non-JSON body
            raise HTTPException(
                status_code=502,
                detail="Upstream API returned a non-JSON response",
            ) from e

@app.post("/v1/chat/completions")
async def get_completion(payload: Payload, request: Request):
    """Forward a chat-completion request upstream and stream the reply back.

    Args:
        payload: validated request body (model name and messages).
        request: incoming request; its ``Authorization`` header carries the
            client's API key, either verbatim or as ``Bearer <key>``.

    Returns:
        StreamingResponse: the non-empty lines of the upstream response, each
        terminated by a newline. If the upstream call fails, a single JSON
        line of the form ``{"error": {"message": ...}}`` is emitted instead
        of aborting the connection.

    Raises:
        HTTPException: status 403 when no valid API key is supplied.
    """
    auth_header = request.headers.get("Authorization")

    # Accept the key exactly as sent (original behaviour) and also in the
    # standard "Bearer <key>" form used by most HTTP clients.
    candidate_keys = []
    if auth_header:
        candidate_keys.append(auth_header)
        scheme, _, token = auth_header.partition(" ")
        token = token.strip()
        if scheme.lower() == "bearer" and token:
            candidate_keys.append(token)

    # Validate API key
    if not any(candidate in valid_api_keys for candidate in candidate_keys):
        raise HTTPException(status_code=403, detail="Forbidden: Invalid API key. Join dsc.gg/chadgang and DM @mr_leaderyt on Discord for a free API key :)")

    # Prepare the payload for streaming
    payload_dict = {**payload.dict(), "stream": True}

    def error_line(message):
        # Serialise an in-stream error report as one JSON line
        return json.dumps({"error": {"message": message}}) + "\n"

    # Define an asynchronous generator to stream the response line by line
    async def stream_generator():
        async with httpx.AsyncClient() as client:
            try:
                # NOTE(review): get_models appends "/v1/models" to the
                # endpoint, while this call posts to the bare endpoint.
                # Confirm that the upstream really serves chat completions
                # at this URL.
                async with client.stream("POST", secret_api_endpoint, json=payload_dict, timeout=10) as response:
                    response.raise_for_status()
                    async for line in response.aiter_lines():
                        if line:
                            yield f"{line}\n"  # Add a newline to distinguish each line
            except httpx.HTTPStatusError as e:
                # By the time this generator runs, the response has already
                # started, so raising HTTPException here cannot produce an
                # HTTP error. Report the failure inside the stream instead.
                # The exception text contains the upstream URL, so only the
                # status code is exposed.
                yield error_line(f"Upstream API returned HTTP {e.response.status_code}")
            except httpx.RequestError as e:
                yield error_line(f"Streaming failed: {e}")

    # Return the streaming response
    # NOTE(review): if the upstream emits server-sent events, the media type
    # should probably be "text/event-stream" - confirm before changing.
    return StreamingResponse(stream_generator(), media_type="application/json")

# Log the API endpoints
@app.on_event("startup")
async def startup_event():
    """Print the routes served by this application when the server starts."""
    print("API endpoints:")
    print("GET /")
    # The model-listing route is registered as /v1/models, not /models
    print("GET /v1/models")
    print("POST /v1/chat/completions")

# When executed as a script, serve the app with Uvicorn on all interfaces, port 8000
if __name__ == "__main__":
    from uvicorn import run as serve

    serve(app, port=8000, host="0.0.0.0")