Drag2121 committed on
Commit
9a2fab8
·
1 Parent(s): 5124590
Files changed (2) hide show
  1. app.py +1 -1
  2. start.sh +2 -2
app.py CHANGED
@@ -13,7 +13,7 @@ logger = logging.getLogger(__name__)
13
 
14
  app = FastAPI()
15
 
16
- MODEL_NAME = 'tinyllama'
17
 
18
  @lru_cache()
19
  def get_llm():
 
13
 
14
  app = FastAPI()
15
 
16
+ MODEL_NAME = 'phi3:mini'
17
 
18
  @lru_cache()
19
  def get_llm():
start.sh CHANGED
@@ -9,8 +9,8 @@ export CUDA_VISIBLE_DEVICES=0 # Use the first GPU if available
9
  ollama serve & # Use GPU 0 if available
10
 
11
  # Pull the model if not already present
12
- if ! ollama list | grep -q "tinyllama"; then
13
- ollama pull tinyllama
14
  fi
15
 
16
  # Wait for Ollama to start up (use a more robust check)
 
9
  ollama serve & # Use GPU 0 if available
10
 
11
  # Pull the model if not already present
12
+ if ! ollama list | grep -q "phi3:mini"; then
13
+ ollama pull phi3:mini
14
  fi
15
 
16
  # Wait for Ollama to start up (use a more robust check)