# import os
# import logging
# import requests
# from fastapi import FastAPI, HTTPException
# from fastapi.responses import StreamingResponse
# from pydantic import BaseModel
# from openai import OpenAI

# logging.basicConfig(level=logging.INFO)
# logger = logging.getLogger(__name__)

# app = FastAPI()
# MODEL_NAME = 'llama3.1:8b'
# OLLAMA_URL = "http://localhost:11434"

# # def create_model(query):
# #     message = [
# #         {"role": "system", "content": "You are a general chat bot."},
# #         {"role": "user", "content": f"{query}"}
# #     ]
# #     completion = ollama_client.chat.completions.create(
# #         model="llama3.1:8b",
# #         messages=message
# #         # response_format=base_model,
# #         # temperature = 0.1
# #     )
# #     return completion
# class Question(BaseModel):
#     text: str

# @app.get("/")
# def read_root():
#     return {"Hello": f"Welcome to {MODEL_NAME} FastAPI"}

# # # POST endpoint to query the LLM
# # @app.post("/ask")
# # async def ask_question(question: Question):
# #     try:
# #         response = create_model(question.text)
# #         return {"response": response}
# #     except Exception as e:
# #         raise HTTPException(status_code=500, detail=f"Error querying the model: {str(e)}")

# @app.get("/list_models")
# async def list_models():
#     """List all available models in Ollama."""
#     try:
#         response = requests.get(f"{OLLAMA_URL}/api/tags")
#     except Exception as e:
#         return {"error": str(e)}
#     return response.json()

# @app.post("/pull_model")
# async def pull_model(model_name: str):
#     """Pull a model from Ollama's repository."""
#     response = requests.post(f"{OLLAMA_URL}/api/pull", json={"name": model_name})
#     # print(response)
#     return response.json()
# @app.post("/generate") | |
# async def generate_text(model: str, prompt: str, system: str = "You are a helpful AI assistant.", stream: bool = False): | |
# """Generate text from a given prompt using a specific model.""" | |
# try: | |
# response = requests.post( | |
# f"{OLLAMA_URL}/api/generate", | |
# json={"model": model, "prompt": prompt, "system": system, "stream": stream} | |
# ) | |
# except Exception as e: | |
# return {"error": str(e)} | |
# # print(response) | |
# return response.json() | |
# @app.post("/embed") | |
# async def get_embedding(model: str, text: str): | |
# """Generate embeddings for the given text using a model.""" | |
# try: | |
# response = requests.post( | |
# f"{OLLAMA_URL}/api/embeddings", | |
# json={"model": model, "prompt": text} | |
# ) | |
# except Exception as e: | |
# return {"error": str(e)} | |
# # print(response) | |
# return response.json() | |
# @app.post("/chat") | |
# async def chat(model: str, message: str, system: str = "You are a helpful chatbot."): | |
# """Chat with the model while maintaining context.""" | |
# try: | |
# response = requests.post( | |
# f"{OLLAMA_URL}/api/chat", | |
# json={"model": model, "messages": [{"role": "system", "content": system}, {"role": "user", "content": message}]} | |
# ) | |
# except Exception as e: | |
# return {"error": str(e)} | |
# # print(response) | |
# return response.json() | |
# @app.on_event("startup") | |
# async def startup_event(): | |
# logger.info(f"Starting up with model: {MODEL_NAME}") | |
# @app.on_event("shutdown") | |
# async def shutdown_event(): | |
# logger.info("Shutting down") | |
# from fastapi import FastAPI
# import httpx

# app = FastAPI()
# TARGET_SERVER = "http://localhost:11434"

# @app.get("/proxy/{path:path}")
# async def get_proxy_request(path: str):
#     async with httpx.AsyncClient() as client:
#         response = await client.get(f"{TARGET_SERVER}/{path}")
#         return response.json()

# @app.post("/proxy/{path:path}")
# async def post_proxy_request(path: str):
#     async with httpx.AsyncClient() as client:
#         response = await client.post(f"{TARGET_SERVER}/{path}")
#         return response.json()
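
# Active implementation: a thin async proxy (httpx) sitting in front of the Ollama server.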
from fastapi import FastAPI
import httpx
from pydantic import BaseModel
from OpenAIClasses import ChatCompletionRequest
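# ChatCompletionRequest is a project-local Pydantic model defined in OpenAIClasses.py;
# it is assumed here to mirror the OpenAI chat-completions request schema
# (model, messages, and related optional fields).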

class RequestBody(BaseModel):
    data: dict

app = FastAPI()
TARGET_SERVER = "http://localhost:11434"
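# 11434 is Ollama's default HTTP port.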

async def proxy_get(path: str):
    """Forwards GET requests to the target server."""
    async with httpx.AsyncClient() as client:
        response = await client.get(f"{TARGET_SERVER}/{path}")
        return response.json()
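
# Example (assuming the route registration sketched at the end of this file):
# GET /proxy/api/tags is forwarded to Ollama's /api/tags and returns the list
# of locally available models.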

async def proxy_post(path: str, request_body: RequestBody):
    """Forwards POST requests to the target server."""
    # print(request_body)
    # print(request_body.model_dump())
    try:
        data = request_body.model_dump()["data"]
        async with httpx.AsyncClient() as client:
            response = await client.post(f"{TARGET_SERVER}/{path}", json=data, timeout=120)
            return response.json()
    except Exception as e:
        print(e)
        return {"error": str(e)}

async def openai_compatible(request_body: ChatCompletionRequest):
    """Forwards an OpenAI-style chat request to Ollama's /api/chat and wraps the reply in a choices list."""
    try:
        data = request_body.model_dump()
        async with httpx.AsyncClient() as client:
            response = await client.post(f"{TARGET_SERVER}/api/chat", json=data, timeout=120)
            result = response.json()
            print(result)
            return {"choices": [result]}
    except Exception as e:
        print(e)
        return {"error": str(e)}