johannoriel committed
Commit • 8e46350
1 Parent(s): 645a356
HF bug correction
plugins/ragllm.py +28 -9
plugins/ragllm.py
CHANGED
@@ -16,6 +16,7 @@ from langchain_huggingface import HuggingFaceEmbeddings
 DEVICE = 'cuda' if torch.cuda.is_available() else 'cpu'
 MAX_LENGTH = 512
 CHUNK_SIZE = 200
+CONFIG_FILE = '.llm-config.yml'

 def mean_pooling(model_output, attention_mask):
     token_embeddings = model_output[0]
@@ -52,6 +53,7 @@ translations["en"].update({
     "rag_error_calling_llm": "Error calling LLM: ",
     "rag_processing" : "Processing...",
     "rag_hf_api_key": "HuggingFace API Token",
+    "rag_config_file_missing": "Configuration file .llm-config.yml not found. This is required for Ollama and Groq providers.",
 })

 translations["fr"].update({
@@ -77,25 +79,23 @@ translations["fr"].update({
     "rag_error_calling_llm": "Erreur lors de l'appel au LLM : ",
     "rag_processing" : "En cours de traitement...",
     "rag_hf_api_key": "Token API HuggingFace",
+    "rag_config_file_missing": "Fichier de configuration .llm-config.yml non trouvé. Ce fichier est nécessaire pour les providers Ollama et Groq.",
 })

 class RagllmPlugin(Plugin):
     def __init__(self, name: str, plugin_manager):
         super().__init__(name, plugin_manager)
-        try:
-            self.config = self.load_llm_config()
-        except:
-            self.config = {}
         self.embeddings = None
         self.chunks = None
         self.hf_client = None
+        self.config = {}

     def load_llm_config(self) -> Dict:
-        try:
-            with open('.llm-config.yml', 'r') as file:
-                return yaml.safe_load(file)
-        except:
+        if not os.path.exists(CONFIG_FILE):
+            st.warning(t("rag_config_file_missing"))
             return {}
+        with open(CONFIG_FILE, 'r') as file:
+            return yaml.safe_load(file)

     def get_tabs(self):
         return [{"name": "RAG", "plugin": "ragllm"}]
@@ -161,6 +161,12 @@ class RagllmPlugin(Plugin):

     def get_config_ui(self, config):
         updated_config = {}
+
+        # Load config file only if provider is not huggingface
+        current_provider = config.get('provider', 'ollama')
+        if current_provider != 'huggingface':
+            self.config = self.load_llm_config()
+
         for field, params in self.get_config_fields().items():
             if params['type'] == 'select':
                 if field == 'llm_model':
@@ -203,11 +209,24 @@
                     params['label'],
                     value=config.get(field, params['default'])
                 )
+
+        if config.get('provider') == 'huggingface':
+            updated_config['hf_api_key'] = st.text_input(
+                t("rag_hf_api_key"),
+                type="password",
+                value=config.get('hf_api_key', '')
+            )
+
         return updated_config

     def get_sidebar_config_ui(self, config: Dict[str, Any]) -> Dict[str, Any]:
-        available_models = self.get_available_models()
+        provider = config.get('provider', 'ollama')
+        available_models = self.get_available_models(provider)
         default_model = config.get('llm_model', available_models[0] if available_models else None)
+
+        if default_model not in available_models:
+            default_model = available_models[0] if available_models else None
+
         selected_model = st.sidebar.selectbox(
             t("rag_llm_model"),
             options=available_models,
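
Taken together, the fix replaces two bare try/except blocks that silently swallowed a missing config file with an explicit existence check: on a Hugging Face Space there is usually no local .llm-config.yml, so the constructor previously failed quietly and left the Ollama and Groq providers unconfigured, while the huggingface provider only needs an API token, now collected through the config UI. Below is a minimal standalone sketch of the guard pattern, using the file name and Dict return type from the diff; the print call stands in for the plugin's st.warning, and everything else is an illustrative assumption, not the committed code verbatim.

import os
from typing import Dict

import yaml

CONFIG_FILE = '.llm-config.yml'

def load_llm_config() -> Dict:
    # Check for the expected-missing file up front and warn visibly,
    # instead of masking every failure with a bare except.
    if not os.path.exists(CONFIG_FILE):
        print(f"Configuration file {CONFIG_FILE} not found.")  # st.warning(...) in the plugin
        return {}
    with open(CONFIG_FILE, 'r') as file:
        # yaml.safe_load returns None for an empty file; normalizing
        # to {} here is an extra guard not present in the commit.
        return yaml.safe_load(file) or {}

One design note: the committed version returns whatever yaml.safe_load yields, so an empty .llm-config.yml would hand callers None rather than a dict; the "or {}" fallback above hedges against that case.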