# iver / src /api /config.py
# hevold's picture
# Upload 29 files
# b34efa5 verified
"""
Configuration for Hugging Face API integration.
Contains model IDs, API endpoints, and other configuration parameters.
"""
# Norwegian LLM options.
# Maps a short alias to the model's Hugging Face ID ("model_id") and a
# human-readable "description". Built from (alias, model_id, description)
# rows so that every entry is guaranteed to have the same two fields.
LLM_MODELS = {
    alias: {"model_id": model_id, "description": description}
    for alias, model_id, description in (
        (
            "normistral",
            "norallm/normistral-7b-scratch",
            "NorMistral 7B - Norwegian language model based on Mistral architecture",
        ),
        (
            "viking",
            "silo-ai/viking-7b",
            "Viking 7B - Multilingual model for Nordic languages",
        ),
        (
            "norskgpt",
            "NbAiLab/NorskGPT",
            "NorskGPT - Norwegian language model",
        ),
    )
}

# Default LLM model: must be one of the aliases (keys) in LLM_MODELS.
DEFAULT_LLM_MODEL: str = "normistral"
# Norwegian embedding models.
# Same layout as the LLM table: alias -> {"model_id", "description"}.
# The pair-list form is used because the alias "nb-sbert" contains a hyphen
# and therefore cannot be written as a keyword argument.
EMBEDDING_MODELS = dict(
    [
        (
            "nb-sbert",
            dict(
                model_id="NbAiLab/nb-sbert-base",
                description="NB-SBERT-BASE - Norwegian sentence embedding model",
            ),
        ),
        (
            "simcse",
            dict(
                model_id="FFI/SimCSE-NB-BERT-large",
                description="SimCSE-NB-BERT-large - Norwegian sentence embedding model",
            ),
        ),
    ]
)

# Default embedding model: must be one of the aliases (keys) in EMBEDDING_MODELS.
DEFAULT_EMBEDDING_MODEL: str = "nb-sbert"
# Hugging Face API endpoints, keyed by task name.
# Both values are base URLs ending in "/"; presumably the caller appends a
# model ID to form the request URL -- confirm against the client code.
HF_API_ENDPOINTS = dict(
    [
        ("inference", "https://api-inference.huggingface.co/models/"),
        (
            "feature-extraction",
            "https://api-inference.huggingface.co/pipeline/feature-extraction/",
        ),
    ]
)
# API request parameters.
# NOTE(review): the names look like text-generation sampling settings;
# how they are attached to a request is not visible in this module.
API_PARAMS = dict(
    max_length=512,
    temperature=0.7,
    top_p=0.9,
    top_k=50,
    repetition_penalty=1.1,
)
# Document processing parameters.
# NOTE(review): the unit (characters vs. tokens) is not stated in this
# module -- confirm against the code that splits documents into chunks.
CHUNK_SIZE: int = 512  # size of one document chunk
CHUNK_OVERLAP: int = 100  # overlap between chunks; smaller than CHUNK_SIZE
# RAG (retrieval) parameters.
# Upper bound on the number of chunks fetched per retrieval.
MAX_CHUNKS_TO_RETRIEVE: int = 5
# Presumably the minimum similarity score a chunk needs in order to be
# used -- the metric and comparison direction are defined by the caller.
SIMILARITY_THRESHOLD: float = 0.75