; audit_assistant / model_params.cfg
; ppsingh's picture
; Update model_params.cfg
; f7e359e verified
; raw
; history blame
; 402 Bytes
; Settings for the retrieval stage.
[retriever]
; Hugging Face model ID; presumably the embedding model used to retrieve
; candidates -- confirm against the code that loads this file.
MODEL = BAAI/bge-m3
; NOTE(review): 1 presumably switches embedding normalization on; verify how
; the consumer parses this flag (integer vs. boolean).
NORMALIZE = 1
; Presumably the number of candidates the retriever returns -- TODO confirm.
TOP_K = 20
; Settings for the re-ranking stage.
[ranker]
; Hugging Face model ID; presumably the re-ranker applied to retrieved
; candidates -- confirm against the code that loads this file.
MODEL = BAAI/bge-reranker-v2-m3
; Presumably the number of candidates kept after re-ranking -- TODO confirm.
TOP_K = 5
; Settings for the reader (answer-generation) stage.
[reader]
; NOTE(review): TYPE presumably selects which key family below is used
; (DEDICATED_* vs. NVIDIA_*); the set of accepted values is not visible in
; this file -- verify against the consumer.
TYPE = DEDICATED
; Model ID and endpoint URL for the DEDICATED backend.
DEDICATED_MODEL = meta-llama/Llama-3.1-8B-Instruct
DEDICATED_ENDPOINT = https://qu2d8m6dmsollhly.us-east-1.aws.endpoints.huggingface.cloud
; Model ID and endpoint URL for the NVIDIA backend.
NVIDIA_MODEL = meta-llama/Llama-3.1-8B-Instruct
NVIDIA_ENDPOINT = https://huggingface.co/api/integrations/dgx/v1
; Presumably the cap on generated tokens per response -- TODO confirm.
MAX_TOKENS = 768