# =============================================================================
# REQUIRED CONFIGURATION
# =============================================================================
# Hugging Face token with read/write permissions for repositories and the
# Inference API. Get it from: https://huggingface.co/settings/tokens
HF_TOKEN=hf_...

# -----------------------------------------------------------------------------
# GENERATION SETTINGS
# -----------------------------------------------------------------------------
MAX_NUM_TOKENS=2048
MAX_NUM_ROWS=1000
DEFAULT_BATCH_SIZE=5

# Required for chat data generation with Llama or Qwen models
# Options: "llama3", "qwen2", or a custom template string
# MAGPIE_PRE_QUERY_TEMPLATE=qwen2

# =============================================================================
# MODEL & SERVICES CONFIGURATION
# =============================================================================

# -----------------------------------------------------------------------------
# A. STANDALONE SETUP (no additional installation required)
# -----------------------------------------------------------------------------
# 1. HUGGING FACE SERVERLESS (recommended default)
#    Requires only HF_TOKEN
# MODEL=meta-llama/Llama-3.1-8B-Instruct
# MODEL=Qwen/Qwen2.5-1.5B-Instruct

# 2. ARGILLA ON HUGGING FACE SPACES (recommended for data annotation)
# ARGILLA_API_URL=https://daqc-my-argilla.hf.space/
# ARGILLA_API_KEY=

# 3. OPENAI API
#    Requires an OpenAI API key
# OPENAI_BASE_URL=https://api.openai.com/v1/
# MODEL=gpt-4
# API_KEY=

# -----------------------------------------------------------------------------
# B. LOCAL SETUP (requires local installation)
# -----------------------------------------------------------------------------
# 1. LOCAL OLLAMA
#    Requires: Ollama installed (https://ollama.ai)
# OLLAMA_BASE_URL=http://127.0.0.1:11434/
# MODEL=qwen2.5:32b-instruct-q5_K_S
# TOKENIZER_ID=Qwen/Qwen2.5-32B-Instruct
# MODEL=deepseek-r1:1.5b
# TOKENIZER_ID=deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B

# 2. LOCAL VLLM
#    Requires: vLLM installed
# VLLM_BASE_URL=http://127.0.0.1:8000/
# MODEL=Qwen/Qwen2.5-1.5B-Instruct
# TOKENIZER_ID=Qwen/Qwen2.5-1.5B-Instruct

# 3. LOCAL TGI/ENDPOINTS
#    Requires: Text Generation Inference installed
# HUGGINGFACE_BASE_URL=http://127.0.0.1:3000/
# TOKENIZER_ID=meta-llama/Llama-3.1-8B-Instruct

# -----------------------------------------------------------------------------
# C. DOCKER SETUP (ready to use with docker-compose; recommended for the full setup)
# -----------------------------------------------------------------------------
# 1. DOCKER OLLAMA
OLLAMA_BASE_URL=http://ollama:11434
# Options for OLLAMA_HARDWARE: latest (CPU/NVIDIA), rocm (AMD)
OLLAMA_HARDWARE=latest

# DEEPSEEK R1
# MODEL=deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
# TOKENIZER_ID=deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
# MAGPIE_PRE_QUERY_TEMPLATE="<|begin▁of▁sentence|>User: "  # custom template for this model

# LLAMA 3.2
MODEL=llama3.2:1b  # model for instruction generation
TOKENIZER_ID=meta-llama/Llama-3.2-1B-Instruct  # tokenizer for instruction generation
MAGPIE_PRE_QUERY_TEMPLATE=llama3  # Magpie template required for instruction generation
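# A minimal reachability check for the Ollama service (hedged example: /api/tags
# is part of the public Ollama REST API and lists locally available models; the
# "ollama" hostname assumes the docker-compose service name used above):
#   curl http://ollama:11434/api/tags      # from inside the compose network
#   curl http://localhost:11434/api/tags   # from the host, if the port is mapped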
# 2. DOCKER ARGILLA (persistent data)
ARGILLA_API_URL=http://argilla:6900
ARGILLA_USERNAME=admin
ARGILLA_PASSWORD=admin1234
ARGILLA_API_KEY=admin.1234
ARGILLA_REINDEX_DATASET=1

# -----------------------------------------------------------------------------
# USAGE
# -----------------------------------------------------------------------------
# Build the images:
#   docker-compose --profile with-ollama --profile with-argilla build
# Start Ollama on its own (in a new terminal):
#   docker-compose --profile with-ollama up -d
# Pull and run the model inside the Ollama container:
#   docker-compose exec ollama ollama run llama3.2:1b
# Start the full stack (Ollama + Argilla):
#   docker-compose --profile with-ollama --profile with-argilla up -d
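# -----------------------------------------------------------------------------
# SANITY CHECKS (hedged examples; not required by the app)
# -----------------------------------------------------------------------------
# Verify the HF token against the Hugging Face Hub whoami endpoint:
#   curl -s -H "Authorization: Bearer $HF_TOKEN" https://huggingface.co/api/whoami-v2
# Confirm the containers are up and watch the Ollama logs while the model loads:
#   docker-compose ps
#   docker-compose logs -f ollama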