darabos committed on
Commit 2148b2a · unverified · 2 Parent(s): edf6482 b9f38c7

Merge pull request #129 from biggraph/feature/image-search-new

examples/LynxScribe FAQ Chatbot Builder.lynxkite.json ADDED
@@ -0,0 +1,605 @@
1
+ {
2
+ "edges": [
3
+ {
4
+ "id": "LynxScribe FAQ to RAG 1 LynxScribe RAG Graph Chatbot Builder 1",
5
+ "source": "LynxScribe FAQ to RAG 1",
6
+ "sourceHandle": "output",
7
+ "target": "LynxScribe RAG Graph Chatbot Builder 1",
8
+ "targetHandle": "rag_graph"
9
+ },
10
+ {
11
+ "id": "LynxScribe RAG Graph Chatbot Builder 1 LynxScribe RAG Graph Chatbot Backend 1",
12
+ "source": "LynxScribe RAG Graph Chatbot Builder 1",
13
+ "sourceHandle": "output",
14
+ "target": "LynxScribe RAG Graph Chatbot Backend 1",
15
+ "targetHandle": "knowledge_base"
16
+ },
17
+ {
18
+ "id": "Chat processor 1 LynxScribe RAG Graph Chatbot Backend 1",
19
+ "source": "Chat processor 1",
20
+ "sourceHandle": "output",
21
+ "target": "LynxScribe RAG Graph Chatbot Backend 1",
22
+ "targetHandle": "chat_processor"
23
+ },
24
+ {
25
+ "id": "Truncate history 1 Chat processor 1",
26
+ "source": "Truncate history 1",
27
+ "sourceHandle": "output",
28
+ "target": "Chat processor 1",
29
+ "targetHandle": "processor"
30
+ },
31
+ {
32
+ "id": "LynxScribe RAG Graph Chatbot Backend 1 Test Chat API 1",
33
+ "source": "LynxScribe RAG Graph Chatbot Backend 1",
34
+ "sourceHandle": "output",
35
+ "target": "Test Chat API 1",
36
+ "targetHandle": "chat_api"
37
+ },
38
+ {
39
+ "id": "Input chat 1 Test Chat API 1",
40
+ "source": "Input chat 1",
41
+ "sourceHandle": "output",
42
+ "target": "Test Chat API 1",
43
+ "targetHandle": "message"
44
+ },
45
+ {
46
+ "id": "Test Chat API 1 View 1",
47
+ "source": "Test Chat API 1",
48
+ "sourceHandle": "output",
49
+ "target": "View 1",
50
+ "targetHandle": "input"
51
+ }
52
+ ],
53
+ "env": "LynxScribe",
54
+ "nodes": [
55
+ {
56
+ "data": {
57
+ "__execution_delay": 0.0,
58
+ "collapsed": false,
59
+ "display": null,
60
+ "error": null,
61
+ "input_metadata": null,
62
+ "meta": {
63
+ "inputs": {},
64
+ "name": "LynxScribe FAQ to RAG",
65
+ "outputs": {
66
+ "output": {
67
+ "name": "output",
68
+ "position": "right",
69
+ "type": {
70
+ "type": "None"
71
+ }
72
+ }
73
+ },
74
+ "params": {
75
+ "faq_excel_path": {
76
+ "default": "uploads/organon_demo/organon_en_copy.xlsx",
77
+ "name": "faq_excel_path",
78
+ "type": {
79
+ "type": "<class 'str'>"
80
+ }
81
+ },
82
+ "scenario_cluster_distance_pct": {
83
+ "default": 30.0,
84
+ "name": "scenario_cluster_distance_pct",
85
+ "type": {
86
+ "type": "<class 'float'>"
87
+ }
88
+ },
89
+ "text_embedder_interface": {
90
+ "default": "openai",
91
+ "name": "text_embedder_interface",
92
+ "type": {
93
+ "type": "<class 'str'>"
94
+ }
95
+ },
96
+ "text_embedder_model_name_or_path": {
97
+ "default": "text-embedding-3-large",
98
+ "name": "text_embedder_model_name_or_path",
99
+ "type": {
100
+ "type": "<class 'str'>"
101
+ }
102
+ },
103
+ "vdb_collection_name": {
104
+ "default": "lynx",
105
+ "name": "vdb_collection_name",
106
+ "type": {
107
+ "type": "<class 'str'>"
108
+ }
109
+ },
110
+ "vdb_num_dimensions": {
111
+ "default": 3072.0,
112
+ "name": "vdb_num_dimensions",
113
+ "type": {
114
+ "type": "<class 'int'>"
115
+ }
116
+ },
117
+ "vdb_provider_name": {
118
+ "default": "faiss",
119
+ "name": "vdb_provider_name",
120
+ "type": {
121
+ "type": "<class 'str'>"
122
+ }
123
+ }
124
+ },
125
+ "type": "basic"
126
+ },
127
+ "params": {
128
+ "faq_excel_path": "uploads/organon_demo/organon_en_copy.xlsx",
129
+ "scenario_cluster_distance_pct": "30",
130
+ "text_embedder_interface": "openai",
131
+ "text_embedder_model_name_or_path": "text-embedding-3-large",
132
+ "vdb_collection_name": "lynx",
133
+ "vdb_num_dimensions": 3072.0,
134
+ "vdb_provider_name": "faiss"
135
+ },
136
+ "status": "done",
137
+ "title": "LynxScribe FAQ to RAG"
138
+ },
139
+ "dragHandle": ".bg-primary",
140
+ "height": 620.0,
141
+ "id": "LynxScribe FAQ to RAG 1",
142
+ "position": {
143
+ "x": -1180.0,
144
+ "y": -76.0
145
+ },
146
+ "type": "basic",
147
+ "width": 415.0
148
+ },
149
+ {
150
+ "data": {
151
+ "__execution_delay": 0.0,
152
+ "collapsed": false,
153
+ "display": null,
154
+ "error": null,
155
+ "input_metadata": null,
156
+ "meta": {
157
+ "inputs": {
158
+ "rag_graph": {
159
+ "name": "rag_graph",
160
+ "position": "left",
161
+ "type": {
162
+ "type": "<class 'inspect._empty'>"
163
+ }
164
+ }
165
+ },
166
+ "name": "LynxScribe RAG Graph Chatbot Builder",
167
+ "outputs": {
168
+ "output": {
169
+ "name": "output",
170
+ "position": "top",
171
+ "type": {
172
+ "type": "None"
173
+ }
174
+ }
175
+ },
176
+ "params": {
177
+ "node_types": {
178
+ "default": "intent_cluster",
179
+ "name": "node_types",
180
+ "type": {
181
+ "type": "<class 'str'>"
182
+ }
183
+ },
184
+ "scenario_file": {
185
+ "default": "uploads/lynx_chatbot_scenario_selector.yaml",
186
+ "name": "scenario_file",
187
+ "type": {
188
+ "type": "<class 'str'>"
189
+ }
190
+ },
191
+ "scenario_meta_name": {
192
+ "default": "scenario_name",
193
+ "name": "scenario_meta_name",
194
+ "type": {
195
+ "type": "<class 'str'>"
196
+ }
197
+ }
198
+ },
199
+ "position": {
200
+ "x": 1569.0,
201
+ "y": 528.0
202
+ },
203
+ "type": "basic"
204
+ },
205
+ "params": {
206
+ "node_types": "intent_cluster",
207
+ "scenario_file": "uploads/organon_demo/backend-scenarios-en.yaml",
208
+ "scenario_meta_name": "scenario_name"
209
+ },
210
+ "status": "done",
211
+ "title": "LynxScribe RAG Graph Chatbot Builder"
212
+ },
213
+ "dragHandle": ".bg-primary",
214
+ "height": 296.0,
215
+ "id": "LynxScribe RAG Graph Chatbot Builder 1",
216
+ "position": {
217
+ "x": -591.0,
218
+ "y": 86.0
219
+ },
220
+ "type": "basic",
221
+ "width": 547.0
222
+ },
223
+ {
224
+ "data": {
225
+ "__execution_delay": 0.0,
226
+ "collapsed": null,
227
+ "display": null,
228
+ "error": null,
229
+ "input_metadata": null,
230
+ "meta": {
231
+ "inputs": {
232
+ "chat_processor": {
233
+ "name": "chat_processor",
234
+ "position": "bottom",
235
+ "type": {
236
+ "type": "<class 'inspect._empty'>"
237
+ }
238
+ },
239
+ "knowledge_base": {
240
+ "name": "knowledge_base",
241
+ "position": "bottom",
242
+ "type": {
243
+ "type": "<class 'inspect._empty'>"
244
+ }
245
+ }
246
+ },
247
+ "name": "LynxScribe RAG Graph Chatbot Backend",
248
+ "outputs": {
249
+ "output": {
250
+ "name": "output",
251
+ "position": "top",
252
+ "type": {
253
+ "type": "None"
254
+ }
255
+ }
256
+ },
257
+ "params": {
258
+ "llm_interface": {
259
+ "default": "openai",
260
+ "name": "llm_interface",
261
+ "type": {
262
+ "type": "<class 'str'>"
263
+ }
264
+ },
265
+ "llm_model_name": {
266
+ "default": "gpt-4o",
267
+ "name": "llm_model_name",
268
+ "type": {
269
+ "type": "<class 'str'>"
270
+ }
271
+ },
272
+ "negative_answer": {
273
+ "default": "I'm sorry, but the data I've been trained on does not contain any information related to your question.",
274
+ "name": "negative_answer",
275
+ "type": {
276
+ "type": "<class 'str'>"
277
+ }
278
+ },
279
+ "retriever_limits_by_type": {
280
+ "default": "{}",
281
+ "name": "retriever_limits_by_type",
282
+ "type": {
283
+ "type": "<class 'str'>"
284
+ }
285
+ },
286
+ "retriever_max_iterations": {
287
+ "default": 3.0,
288
+ "name": "retriever_max_iterations",
289
+ "type": {
290
+ "type": "<class 'int'>"
291
+ }
292
+ },
293
+ "retriever_overall_chunk_limit": {
294
+ "default": 20.0,
295
+ "name": "retriever_overall_chunk_limit",
296
+ "type": {
297
+ "type": "<class 'int'>"
298
+ }
299
+ },
300
+ "retriever_overall_token_limit": {
301
+ "default": 3000.0,
302
+ "name": "retriever_overall_token_limit",
303
+ "type": {
304
+ "type": "<class 'int'>"
305
+ }
306
+ },
307
+ "retriever_strict_limits": {
308
+ "default": true,
309
+ "name": "retriever_strict_limits",
310
+ "type": {
311
+ "type": "<class 'bool'>"
312
+ }
313
+ }
314
+ },
315
+ "position": {
316
+ "x": 1280.0,
317
+ "y": 450.0
318
+ },
319
+ "type": "basic"
320
+ },
321
+ "params": {
322
+ "llm_interface": "openai",
323
+ "llm_model_name": "gpt-4o",
324
+ "negative_answer": "I'm sorry, but the data I've been trained on does not contain any information related to your question.",
325
+ "retriever_limits_by_type": "{\"faq_question\": [0, 0], \"faq_answer\": [3, 3]}",
326
+ "retriever_max_iterations": "3",
327
+ "retriever_overall_chunk_limit": "3",
328
+ "retriever_overall_token_limit": "30000",
329
+ "retriever_strict_limits": true
330
+ },
331
+ "status": "done",
332
+ "title": "LynxScribe RAG Graph Chatbot Backend"
333
+ },
334
+ "dragHandle": ".bg-primary",
335
+ "height": 382.0,
336
+ "id": "LynxScribe RAG Graph Chatbot Backend 1",
337
+ "position": {
338
+ "x": -427.131476508498,
339
+ "y": -465.1194966607713
340
+ },
341
+ "type": "basic",
342
+ "width": 791.0
343
+ },
344
+ {
345
+ "data": {
346
+ "display": null,
347
+ "error": null,
348
+ "input_metadata": null,
349
+ "meta": {
350
+ "inputs": {
351
+ "processor": {
352
+ "name": "processor",
353
+ "position": "bottom",
354
+ "type": {
355
+ "type": "<class 'inspect._empty'>"
356
+ }
357
+ }
358
+ },
359
+ "name": "Chat processor",
360
+ "outputs": {
361
+ "output": {
362
+ "name": "output",
363
+ "position": "top",
364
+ "type": {
365
+ "type": "None"
366
+ }
367
+ }
368
+ },
369
+ "params": {},
370
+ "position": {
371
+ "x": 1291.0,
372
+ "y": 718.0
373
+ },
374
+ "type": "basic"
375
+ },
376
+ "params": {},
377
+ "status": "done",
378
+ "title": "Chat processor"
379
+ },
380
+ "dragHandle": ".bg-primary",
381
+ "height": 200.0,
382
+ "id": "Chat processor 1",
383
+ "position": {
384
+ "x": 252.7291107206022,
385
+ "y": 81.86852349150202
386
+ },
387
+ "type": "basic",
388
+ "width": 200.0
389
+ },
390
+ {
391
+ "data": {
392
+ "display": null,
393
+ "error": null,
394
+ "input_metadata": null,
395
+ "meta": {
396
+ "inputs": {},
397
+ "name": "Truncate history",
398
+ "outputs": {
399
+ "output": {
400
+ "name": "output",
401
+ "position": "top",
402
+ "type": {
403
+ "type": "None"
404
+ }
405
+ }
406
+ },
407
+ "params": {
408
+ "max_tokens": {
409
+ "default": 10000.0,
410
+ "name": "max_tokens",
411
+ "type": {
412
+ "type": "<class 'int'>"
413
+ }
414
+ }
415
+ },
416
+ "position": {
417
+ "x": 1440.0,
418
+ "y": 936.0
419
+ },
420
+ "type": "basic"
421
+ },
422
+ "params": {
423
+ "max_tokens": 10000.0
424
+ },
425
+ "status": "done",
426
+ "title": "Truncate history"
427
+ },
428
+ "dragHandle": ".bg-primary",
429
+ "height": 200.0,
430
+ "id": "Truncate history 1",
431
+ "position": {
432
+ "x": 253.59374153502728,
433
+ "y": 386.4661577036063
434
+ },
435
+ "type": "basic",
436
+ "width": 200.0
437
+ },
438
+ {
439
+ "data": {
440
+ "__execution_delay": 0.0,
441
+ "collapsed": null,
442
+ "display": null,
443
+ "error": null,
444
+ "input_metadata": null,
445
+ "meta": {
446
+ "inputs": {},
447
+ "name": "Input chat",
448
+ "outputs": {
449
+ "output": {
450
+ "name": "output",
451
+ "position": "right",
452
+ "type": {
453
+ "type": "None"
454
+ }
455
+ }
456
+ },
457
+ "params": {
458
+ "chat": {
459
+ "default": null,
460
+ "name": "chat",
461
+ "type": {
462
+ "type": "<class 'str'>"
463
+ }
464
+ }
465
+ },
466
+ "position": {
467
+ "x": 449.0,
468
+ "y": 172.0
469
+ },
470
+ "type": "basic"
471
+ },
472
+ "params": {
473
+ "chat": "I had headache after taking the pill"
474
+ },
475
+ "status": "done",
476
+ "title": "Input chat"
477
+ },
478
+ "dragHandle": ".bg-primary",
479
+ "height": 204.0,
480
+ "id": "Input chat 1",
481
+ "position": {
482
+ "x": -1115.7774404622555,
483
+ "y": -747.1320865489535
484
+ },
485
+ "type": "basic",
486
+ "width": 552.0
487
+ },
488
+ {
489
+ "data": {
490
+ "__execution_delay": 0.0,
491
+ "collapsed": null,
492
+ "display": null,
493
+ "error": null,
494
+ "input_metadata": null,
495
+ "meta": {
496
+ "inputs": {
497
+ "chat_api": {
498
+ "name": "chat_api",
499
+ "position": "bottom",
500
+ "type": {
501
+ "type": "<class 'inspect._empty'>"
502
+ }
503
+ },
504
+ "message": {
505
+ "name": "message",
506
+ "position": "left",
507
+ "type": {
508
+ "type": "<class 'inspect._empty'>"
509
+ }
510
+ }
511
+ },
512
+ "name": "Test Chat API",
513
+ "outputs": {
514
+ "output": {
515
+ "name": "output",
516
+ "position": "right",
517
+ "type": {
518
+ "type": "None"
519
+ }
520
+ }
521
+ },
522
+ "params": {
523
+ "show_details": {
524
+ "default": false,
525
+ "name": "show_details",
526
+ "type": {
527
+ "type": "<class 'bool'>"
528
+ }
529
+ }
530
+ },
531
+ "position": {
532
+ "x": 937.0,
533
+ "y": 213.0
534
+ },
535
+ "type": "basic"
536
+ },
537
+ "params": {
538
+ "show_details": false
539
+ },
540
+ "status": "done",
541
+ "title": "Test Chat API"
542
+ },
543
+ "dragHandle": ".bg-primary",
544
+ "height": 200.0,
545
+ "id": "Test Chat API 1",
546
+ "position": {
547
+ "x": -131.54900620226195,
548
+ "y": -745.4660726292032
549
+ },
550
+ "type": "basic",
551
+ "width": 200.0
552
+ },
553
+ {
554
+ "data": {
555
+ "display": {
556
+ "dataframes": {
557
+ "df": {
558
+ "columns": [
559
+ "answer"
560
+ ],
561
+ "data": [
562
+ [
563
+ "I'm not equipped to handle adverse events or other product-related queries. Your safety is important to us, and we want to ensure you receive the appropriate support. Please report any adverse events or concerns to our dedicated support team. They can be reached at [email protected]. If you have any questions related to contraceptives or women's health, please feel free to ask, and I'll provide you with the information you need.\n"
564
+ ]
565
+ ]
566
+ }
567
+ }
568
+ },
569
+ "error": null,
570
+ "input_metadata": null,
571
+ "meta": {
572
+ "inputs": {
573
+ "input": {
574
+ "name": "input",
575
+ "position": "left",
576
+ "type": {
577
+ "type": "<class 'inspect._empty'>"
578
+ }
579
+ }
580
+ },
581
+ "name": "View",
582
+ "outputs": {},
583
+ "params": {},
584
+ "position": {
585
+ "x": 1547.0,
586
+ "y": 222.0
587
+ },
588
+ "type": "table_view"
589
+ },
590
+ "params": {},
591
+ "status": "done",
592
+ "title": "View"
593
+ },
594
+ "dragHandle": ".bg-primary",
595
+ "height": 483.0,
596
+ "id": "View 1",
597
+ "position": {
598
+ "x": 540.6544350347407,
599
+ "y": -886.065865503576
600
+ },
601
+ "type": "table_view",
602
+ "width": 707.0
603
+ }
604
+ ]
605
+ }
examples/LynxScribe Image Search.lynxkite.json ADDED
@@ -0,0 +1,419 @@
1
+ {
2
+ "edges": [
3
+ {
4
+ "id": "Cloud-sourced File Listing 1 LynxScribe Image Describer 1",
5
+ "source": "Cloud-sourced File Listing 1",
6
+ "sourceHandle": "output",
7
+ "target": "LynxScribe Image Describer 1",
8
+ "targetHandle": "file_urls"
9
+ },
10
+ {
11
+ "id": "LynxScribe Image Describer 1 LynxScribe Image RAG Builder 1",
12
+ "source": "LynxScribe Image Describer 1",
13
+ "sourceHandle": "output",
14
+ "target": "LynxScribe Image RAG Builder 1",
15
+ "targetHandle": "image_descriptions"
16
+ },
17
+ {
18
+ "id": "Input chat 1 LynxScribe Image RAG Query 1",
19
+ "source": "Input chat 1",
20
+ "sourceHandle": "output",
21
+ "target": "LynxScribe Image RAG Query 1",
22
+ "targetHandle": "text"
23
+ },
24
+ {
25
+ "id": "LynxScribe Image RAG Builder 1 LynxScribe Image RAG Query 1",
26
+ "source": "LynxScribe Image RAG Builder 1",
27
+ "sourceHandle": "output",
28
+ "target": "LynxScribe Image RAG Query 1",
29
+ "targetHandle": "rag_graph"
30
+ },
31
+ {
32
+ "id": "LynxScribe Image RAG Query 1 LynxScribe Image Result Viewer 1",
33
+ "source": "LynxScribe Image RAG Query 1",
34
+ "sourceHandle": "output",
35
+ "target": "LynxScribe Image Result Viewer 1",
36
+ "targetHandle": "embedding_similarities"
37
+ }
38
+ ],
39
+ "env": "LynxScribe",
40
+ "nodes": [
41
+ {
42
+ "data": {
43
+ "__execution_delay": 0.0,
44
+ "collapsed": null,
45
+ "display": null,
46
+ "error": null,
47
+ "input_metadata": null,
48
+ "meta": {
49
+ "inputs": {},
50
+ "name": "Cloud-sourced File Listing",
51
+ "outputs": {
52
+ "output": {
53
+ "name": "output",
54
+ "position": "right",
55
+ "type": {
56
+ "type": "None"
57
+ }
58
+ }
59
+ },
60
+ "params": {
61
+ "accepted_file_types": {
62
+ "default": ".jpg, .jpeg, .png",
63
+ "name": "accepted_file_types",
64
+ "type": {
65
+ "type": "<class 'str'>"
66
+ }
67
+ },
68
+ "cloud_provider": {
69
+ "default": "gcp",
70
+ "name": "cloud_provider",
71
+ "type": {
72
+ "enum": [
73
+ "GCP",
74
+ "AWS",
75
+ "AZURE"
76
+ ]
77
+ }
78
+ },
79
+ "folder_URL": {
80
+ "default": "https://storage.googleapis.com/lynxkite_public_data/lynxscribe-images/image-rag-test",
81
+ "name": "folder_URL",
82
+ "type": {
83
+ "type": "<class 'str'>"
84
+ }
85
+ }
86
+ },
87
+ "type": "basic"
88
+ },
89
+ "params": {
90
+ "accepted_file_types": ".jpg, .jpeg, .png",
91
+ "cloud_provider": "GCP",
92
+ "folder_URL": "https://storage.googleapis.com/lynxkite_public_data/lynxscribe-images/image-rag-test"
93
+ },
94
+ "status": "done",
95
+ "title": "Cloud-sourced File Listing"
96
+ },
97
+ "dragHandle": ".bg-primary",
98
+ "height": 353.0,
99
+ "id": "Cloud-sourced File Listing 1",
100
+ "position": {
101
+ "x": -365.0,
102
+ "y": 302.0
103
+ },
104
+ "type": "basic",
105
+ "width": 430.0
106
+ },
107
+ {
108
+ "data": {
109
+ "display": null,
110
+ "error": null,
111
+ "input_metadata": null,
112
+ "meta": {
113
+ "inputs": {
114
+ "file_urls": {
115
+ "name": "file_urls",
116
+ "position": "left",
117
+ "type": {
118
+ "type": "<class 'inspect._empty'>"
119
+ }
120
+ }
121
+ },
122
+ "name": "LynxScribe Image Describer",
123
+ "outputs": {
124
+ "output": {
125
+ "name": "output",
126
+ "position": "right",
127
+ "type": {
128
+ "type": "None"
129
+ }
130
+ }
131
+ },
132
+ "params": {
133
+ "llm_interface": {
134
+ "default": "openai",
135
+ "name": "llm_interface",
136
+ "type": {
137
+ "type": "<class 'str'>"
138
+ }
139
+ },
140
+ "llm_prompt_name": {
141
+ "default": "cot_picture_descriptor",
142
+ "name": "llm_prompt_name",
143
+ "type": {
144
+ "type": "<class 'str'>"
145
+ }
146
+ },
147
+ "llm_prompt_path": {
148
+ "default": "uploads/image_description_prompts.yaml",
149
+ "name": "llm_prompt_path",
150
+ "type": {
151
+ "type": "<class 'str'>"
152
+ }
153
+ },
154
+ "llm_visual_model": {
155
+ "default": "gpt-4o",
156
+ "name": "llm_visual_model",
157
+ "type": {
158
+ "type": "<class 'str'>"
159
+ }
160
+ }
161
+ },
162
+ "type": "basic"
163
+ },
164
+ "params": {
165
+ "llm_interface": "openai",
166
+ "llm_prompt_name": "cot_picture_descriptor",
167
+ "llm_prompt_path": "uploads/image_description_prompts.yaml",
168
+ "llm_visual_model": "gpt-4o"
169
+ },
170
+ "status": "done",
171
+ "title": "LynxScribe Image Describer"
172
+ },
173
+ "dragHandle": ".bg-primary",
174
+ "height": 361.0,
175
+ "id": "LynxScribe Image Describer 1",
176
+ "position": {
177
+ "x": 159.0,
178
+ "y": 298.0
179
+ },
180
+ "type": "basic",
181
+ "width": 371.0
182
+ },
183
+ {
184
+ "data": {
185
+ "display": null,
186
+ "error": null,
187
+ "input_metadata": null,
188
+ "meta": {
189
+ "inputs": {
190
+ "image_descriptions": {
191
+ "name": "image_descriptions",
192
+ "position": "left",
193
+ "type": {
194
+ "type": "<class 'inspect._empty'>"
195
+ }
196
+ }
197
+ },
198
+ "name": "LynxScribe Image RAG Builder",
199
+ "outputs": {
200
+ "output": {
201
+ "name": "output",
202
+ "position": "right",
203
+ "type": {
204
+ "type": "None"
205
+ }
206
+ }
207
+ },
208
+ "params": {
209
+ "text_embedder_interface": {
210
+ "default": "openai",
211
+ "name": "text_embedder_interface",
212
+ "type": {
213
+ "type": "<class 'str'>"
214
+ }
215
+ },
216
+ "text_embedder_model_name_or_path": {
217
+ "default": "text-embedding-3-large",
218
+ "name": "text_embedder_model_name_or_path",
219
+ "type": {
220
+ "type": "<class 'str'>"
221
+ }
222
+ },
223
+ "vdb_collection_name": {
224
+ "default": "lynx",
225
+ "name": "vdb_collection_name",
226
+ "type": {
227
+ "type": "<class 'str'>"
228
+ }
229
+ },
230
+ "vdb_num_dimensions": {
231
+ "default": 3072.0,
232
+ "name": "vdb_num_dimensions",
233
+ "type": {
234
+ "type": "<class 'int'>"
235
+ }
236
+ },
237
+ "vdb_provider_name": {
238
+ "default": "faiss",
239
+ "name": "vdb_provider_name",
240
+ "type": {
241
+ "type": "<class 'str'>"
242
+ }
243
+ }
244
+ },
245
+ "type": "basic"
246
+ },
247
+ "params": {
248
+ "text_embedder_interface": "openai",
249
+ "text_embedder_model_name_or_path": "text-embedding-3-large",
250
+ "vdb_collection_name": "lynx",
251
+ "vdb_num_dimensions": 3072.0,
252
+ "vdb_provider_name": "faiss"
253
+ },
254
+ "status": "done",
255
+ "title": "LynxScribe Image RAG Builder"
256
+ },
257
+ "dragHandle": ".bg-primary",
258
+ "height": 441.0,
259
+ "id": "LynxScribe Image RAG Builder 1",
260
+ "position": {
261
+ "x": 644.0,
262
+ "y": 259.0
263
+ },
264
+ "type": "basic",
265
+ "width": 291.0
266
+ },
267
+ {
268
+ "data": {
269
+ "__execution_delay": 0.0,
270
+ "collapsed": null,
271
+ "display": null,
272
+ "error": null,
273
+ "input_metadata": null,
274
+ "meta": {
275
+ "inputs": {},
276
+ "name": "Input chat",
277
+ "outputs": {
278
+ "output": {
279
+ "name": "output",
280
+ "position": "right",
281
+ "type": {
282
+ "type": "None"
283
+ }
284
+ }
285
+ },
286
+ "params": {
287
+ "chat": {
288
+ "default": null,
289
+ "name": "chat",
290
+ "type": {
291
+ "type": "<class 'str'>"
292
+ }
293
+ }
294
+ },
295
+ "position": {
296
+ "x": 1260.0,
297
+ "y": 166.0
298
+ },
299
+ "type": "basic"
300
+ },
301
+ "params": {
302
+ "chat": "Show me a picture about doctors and patients!"
303
+ },
304
+ "status": "done",
305
+ "title": "Input chat"
306
+ },
307
+ "dragHandle": ".bg-primary",
308
+ "height": 218.0,
309
+ "id": "Input chat 1",
310
+ "position": {
311
+ "x": 153.0,
312
+ "y": -47.0
313
+ },
314
+ "type": "basic",
315
+ "width": 776.0
316
+ },
317
+ {
318
+ "data": {
319
+ "display": null,
320
+ "error": null,
321
+ "input_metadata": null,
322
+ "meta": {
323
+ "inputs": {
324
+ "rag_graph": {
325
+ "name": "rag_graph",
326
+ "position": "bottom",
327
+ "type": {
328
+ "type": "<class 'inspect._empty'>"
329
+ }
330
+ },
331
+ "text": {
332
+ "name": "text",
333
+ "position": "left",
334
+ "type": {
335
+ "type": "<class 'inspect._empty'>"
336
+ }
337
+ }
338
+ },
339
+ "name": "LynxScribe Image RAG Query",
340
+ "outputs": {
341
+ "output": {
342
+ "name": "output",
343
+ "position": "right",
344
+ "type": {
345
+ "type": "None"
346
+ }
347
+ }
348
+ },
349
+ "params": {
350
+ "top_k": {
351
+ "default": 3.0,
352
+ "name": "top_k",
353
+ "type": {
354
+ "type": "<class 'int'>"
355
+ }
356
+ }
357
+ },
358
+ "position": {
359
+ "x": 1987.0,
360
+ "y": 365.0
361
+ },
362
+ "type": "basic"
363
+ },
364
+ "params": {
365
+ "top_k": 3.0
366
+ },
367
+ "status": "done",
368
+ "title": "LynxScribe Image RAG Query"
369
+ },
370
+ "dragHandle": ".bg-primary",
371
+ "height": 207.0,
372
+ "id": "LynxScribe Image RAG Query 1",
373
+ "position": {
374
+ "x": 1160.0,
375
+ "y": -40.0
376
+ },
377
+ "type": "basic",
378
+ "width": 283.0
379
+ },
380
+ {
381
+ "data": {
382
+ "display": "https://storage.googleapis.com/lynxkite_public_data/lynxscribe-images/image-rag-test/bethesda-naval-medical-center-80380_1280.jpg",
383
+ "error": null,
384
+ "input_metadata": null,
385
+ "meta": {
386
+ "inputs": {
387
+ "embedding_similarities": {
388
+ "name": "embedding_similarities",
389
+ "position": "left",
390
+ "type": {
391
+ "type": "<class 'inspect._empty'>"
392
+ }
393
+ }
394
+ },
395
+ "name": "LynxScribe Image Result Viewer",
396
+ "outputs": {},
397
+ "params": {},
398
+ "position": {
399
+ "x": 2326.0,
400
+ "y": 319.0
401
+ },
402
+ "type": "image"
403
+ },
404
+ "params": {},
405
+ "status": "done",
406
+ "title": "LynxScribe Image Result Viewer"
407
+ },
408
+ "dragHandle": ".bg-primary",
409
+ "height": 515.0,
410
+ "id": "LynxScribe Image Result Viewer 1",
411
+ "position": {
412
+ "x": 1657.0,
413
+ "y": -193.0
414
+ },
415
+ "type": "image",
416
+ "width": 707.0
417
+ }
418
+ ]
419
+ }
examples/{LynxScribe demo.lynxkite.json → LynxScribe RAG Chatbot.lynxkite.json} RENAMED
@@ -1,217 +1,243 @@
1
  {
2
  "env": "LynxScribe",
3
  "nodes": [
4
  {
5
- "id": "Input chat 1",
6
- "type": "basic",
7
  "data": {
8
- "title": "Input chat",
9
- "params": {
10
- "chat": "who is the CTO of Lynx?"
11
- },
12
  "display": null,
13
  "error": null,
14
- "collapsed": null,
15
  "meta": {
16
  "inputs": {},
17
- "params": {
18
- "chat": {
19
- "default": null,
20
- "type": {
21
- "type": "<class 'str'>"
22
- },
23
- "name": "chat"
24
- }
25
- },
26
  "outputs": {
27
  "output": {
28
  "name": "output",
 
29
  "type": {
30
  "type": "None"
31
- },
32
- "position": "right"
33
  }
34
  },
35
- "name": "Input chat",
36
  "type": "basic"
37
  },
38
- "__execution_delay": 0.0
39
  },
 
 
 
40
  "position": {
41
- "x": -493.5496596237119,
42
- "y": 20.90123252513356
43
  },
44
- "height": 186.0,
45
- "width": 259.0,
46
- "parentId": null
47
  },
48
  {
49
- "id": "View 1",
50
- "type": "table_view",
51
  "data": {
52
- "title": "View",
53
- "params": {},
54
- "display": {
55
- "dataframes": {
56
- "df": {
57
- "columns": [
58
- "answer"
59
- ],
60
- "data": [
61
- [
62
- "TheThe Chief Technology Officer (CTO) of Lynx Analytics is Chema Lizano. He leads the technology strategy and roadmap at the company, overseeing the vision, development, and implementation of solutions across various clients and environments. If you have any more questions regarding our team or services, feel free to ask!\n\nPlease visit https://www.lynxanalytics.com/board for further information."
63
- ]
64
- ]
65
- }
66
- }
67
- },
68
  "error": null,
 
69
  "meta": {
70
- "type": "table_view",
71
- "name": "View",
72
  "inputs": {
73
- "input": {
74
- "name": "input",
 
75
  "type": {
76
  "type": "<class 'inspect._empty'>"
77
- },
78
- "position": "left"
79
  }
80
  },
81
- "outputs": {},
82
- "params": {}
83
- }
84
- },
85
- "position": {
86
- "x": 731.7440706129762,
87
- "y": -716.4943976910913
88
- },
89
- "width": 1256.0,
90
- "parentId": null,
91
- "height": 950.0
92
- },
93
- {
94
- "id": "LLM 1",
95
- "type": "basic",
96
- "data": {
97
- "title": "LLM",
98
- "params": {
99
- "name": "openai"
100
- },
101
- "display": null,
102
- "error": null,
103
- "meta": {
104
- "inputs": {},
105
  "outputs": {
106
  "output": {
 
 
107
  "type": {
108
  "type": "None"
109
- },
110
- "name": "output",
111
- "position": "top"
112
  }
113
  },
114
- "type": "basic",
115
  "params": {
116
- "name": {
 
 
 
 
 
 
 
 
 
 
117
  "default": "openai",
118
- "name": "name",
119
  "type": {
120
  "type": "<class 'str'>"
121
  }
122
- }
123
- },
124
- "name": "LLM"
125
- }
126
- },
127
- "position": {
128
- "x": -312.5774211084781,
129
- "y": 1093.4019527511366
130
- },
131
- "parentId": null,
132
- "width": 200.0,
133
- "height": 200.0
134
- },
135
- {
136
- "id": "Scenario selector 1",
137
- "type": "basic",
138
- "data": {
139
- "title": "Scenario selector",
140
- "params": {
141
- "scenario_file": "uploads/chat_api/scenarios.yaml",
142
- "node_types": "intent_cluster"
143
- },
144
- "display": null,
145
- "error": null,
146
- "meta": {
147
- "params": {
148
- "scenario_file": {
149
  "type": {
150
  "type": "<class 'str'>"
151
- },
152
- "name": "scenario_file",
153
- "default": null
154
  },
155
- "node_types": {
156
- "default": "intent_cluster",
 
157
  "type": {
158
  "type": "<class 'str'>"
159
- },
160
- "name": "node_types"
161
- }
162
- },
163
- "inputs": {},
164
- "outputs": {
165
- "output": {
166
- "position": "top",
167
- "name": "output",
168
  "type": {
169
- "type": "None"
170
  }
171
  }
172
  },
173
- "type": "basic",
174
- "name": "Scenario selector"
175
- }
176
  },
 
 
 
177
  "position": {
178
- "x": -549.1300345090008,
179
- "y": 1086.4852248156676
180
  },
181
- "parentId": null,
182
- "height": 200.0,
183
- "width": 200.0
184
  },
185
  {
186
- "id": "Chat API 1",
187
- "type": "basic",
188
  "data": {
189
- "title": "Chat API",
190
- "params": {
191
- "model": "gpt-4o-mini"
192
- },
193
  "display": null,
194
  "error": null,
 
195
  "meta": {
196
- "name": "Chat API",
197
- "type": "basic",
198
- "outputs": {
199
- "output": {
200
- "type": {
201
- "type": "None"
202
- },
203
- "position": "top",
204
- "name": "output"
205
- }
206
- },
207
  "inputs": {
208
- "chatbot": {
209
- "name": "chatbot",
210
- "type": {
211
- "type": "<class 'inspect._empty'>"
212
- },
213
- "position": "bottom"
214
- },
215
  "chat_processor": {
216
  "name": "chat_processor",
217
  "position": "bottom",
@@ -220,126 +246,36 @@
220
  }
221
  },
222
  "knowledge_base": {
223
- "type": {
224
- "type": "<class 'inspect._empty'>"
225
- },
226
  "position": "bottom",
227
- "name": "knowledge_base"
228
- }
229
- },
230
- "params": {
231
- "model": {
232
- "default": "gpt-4o-mini",
233
- "type": {
234
- "type": "<class 'str'>"
235
- },
236
- "name": "model"
237
- }
238
- }
239
- }
240
- },
241
- "position": {
242
- "x": -22.866663363810787,
243
- "y": 258.20943122219336
244
- },
245
- "parentId": null,
246
- "width": 200.0,
247
- "height": 200.0
248
- },
249
- {
250
- "id": "Knowledge base 1",
251
- "type": "basic",
252
- "data": {
253
- "title": "Knowledge base",
254
- "params": {
255
- "template_cluster_path": "uploads/chat_api/data/lynx/tempclusters.pickle",
256
- "edges_path": "uploads/chat_api/data/lynx/edges.pickle",
257
- "nodes_path": "uploads/chat_api/data/lynx/nodes.pickle"
258
- },
259
- "display": null,
260
- "error": null,
261
- "meta": {
262
- "name": "Knowledge base",
263
- "type": "basic",
264
- "params": {
265
- "nodes_path": {
266
- "name": "nodes_path",
267
- "default": "nodes.pickle",
268
- "type": {
269
- "type": "<class 'str'>"
270
- }
271
- },
272
- "template_cluster_path": {
273
- "type": {
274
- "type": "<class 'str'>"
275
- },
276
- "name": "template_cluster_path",
277
- "default": "tempclusters.pickle"
278
- },
279
- "edges_path": {
280
- "name": "edges_path",
281
- "default": "edges.pickle",
282
  "type": {
283
- "type": "<class 'str'>"
284
  }
285
  }
286
  },
287
- "inputs": {},
288
  "outputs": {
289
  "output": {
290
- "position": "top",
291
  "name": "output",
292
- "type": {
293
- "type": "None"
294
- }
295
- }
296
- }
297
- }
298
- },
299
- "position": {
300
- "x": 598.8683124946176,
301
- "y": 609.9499973808545
302
- },
303
- "width": 336.0,
304
- "height": 320.0,
305
- "parentId": null
306
- },
307
- {
308
- "id": "RAG chatbot 1",
309
- "type": "basic",
310
- "data": {
311
- "title": "RAG chatbot",
312
- "params": {
313
- "limits_by_type": "{\"information\": [2, 3], \"summary\": [2, 3]}",
314
- "max_results": "5",
315
- "negative_answer": "I'm sorry, but the data I've been trained on does not contain any information related to your question.",
316
- "strict_limits": true
317
- },
318
- "display": null,
319
- "error": null,
320
- "meta": {
321
- "outputs": {
322
- "output": {
323
  "position": "top",
324
- "name": "output",
325
  "type": {
326
  "type": "None"
327
  }
328
  }
329
  },
330
  "params": {
331
- "max_results": {
332
- "default": 5.0,
 
333
  "type": {
334
- "type": "<class 'int'>"
335
- },
336
- "name": "max_results"
337
  },
338
- "strict_limits": {
339
- "name": "strict_limits",
340
- "default": true,
341
  "type": {
342
- "type": "<class 'bool'>"
343
  }
344
  },
345
  "negative_answer": {
@@ -349,404 +285,395 @@
349
  "type": "<class 'str'>"
350
  }
351
  },
352
- "limits_by_type": {
353
  "default": "{}",
354
- "name": "limits_by_type",
355
  "type": {
356
  "type": "<class 'str'>"
357
  }
358
- }
359
- },
360
- "name": "RAG chatbot",
361
- "type": "basic",
362
- "inputs": {
363
- "rag_graph": {
364
- "type": {
365
- "type": "<class 'inspect._empty'>"
366
- },
367
- "name": "rag_graph",
368
- "position": "bottom"
369
  },
370
- "llm": {
371
- "name": "llm",
372
- "position": "bottom",
373
  "type": {
374
- "type": "<class 'inspect._empty'>"
375
  }
376
  },
377
- "scenario_selector": {
 
 
378
  "type": {
379
- "type": "<class 'inspect._empty'>"
380
- },
381
- "name": "scenario_selector",
382
- "position": "bottom"
383
  }
384
- }
 
385
  },
386
- "beingResized": false
387
  },
 
 
 
388
  "position": {
389
- "x": -533.1301830766971,
390
- "y": 547.294980747757
391
  },
392
- "parentId": null,
393
- "height": 399.0,
394
- "width": 339.0
395
  },
396
  {
397
- "id": "RAG graph 1",
398
- "type": "basic",
399
  "data": {
400
- "title": "RAG graph",
401
- "params": {},
402
  "display": null,
403
  "error": null,
 
404
  "meta": {
405
- "type": "basic",
406
  "inputs": {
407
- "text_embedder": {
408
- "type": {
409
- "type": "<class 'inspect._empty'>"
410
- },
411
- "position": "bottom",
412
- "name": "text_embedder"
413
- },
414
- "vector_store": {
415
  "position": "bottom",
416
  "type": {
417
  "type": "<class 'inspect._empty'>"
418
- },
419
- "name": "vector_store"
420
  }
421
  },
422
- "name": "RAG graph",
423
- "params": {},
424
  "outputs": {
425
  "output": {
 
426
  "position": "top",
427
  "type": {
428
  "type": "None"
429
- },
430
- "name": "output"
431
  }
432
- }
433
- }
 
 
 
 
 
434
  },
 
 
 
435
  "position": {
436
- "x": -817.8208895639339,
437
- "y": 1014.836542916127
438
  },
439
- "parentId": null,
440
- "width": 200.0,
441
- "height": 200.0
442
  },
443
  {
444
- "id": "Vector store 1",
445
- "type": "basic",
446
  "data": {
447
- "title": "Vector store",
448
- "params": {
449
- "name": "chromadb",
450
- "collection_name": "lynx"
451
- },
452
  "display": null,
453
  "error": null,
454
- "beingResized": false,
455
  "meta": {
456
- "params": {
457
- "collection_name": {
458
- "type": {
459
- "type": "<class 'str'>"
460
- },
461
- "default": "lynx",
462
- "name": "collection_name"
463
- },
464
- "name": {
465
- "default": "chromadb",
466
- "type": {
467
- "type": "<class 'str'>"
468
- },
469
- "name": "name"
470
- }
471
- },
472
- "type": "basic",
473
- "name": "Vector store",
474
  "outputs": {
475
  "output": {
 
 
476
  "type": {
477
  "type": "None"
478
- },
479
- "position": "top",
480
- "name": "output"
481
  }
482
  },
483
- "inputs": {}
484
- }
485
- },
486
- "position": {
487
- "x": -1053.794625339574,
488
- "y": 1347.7711940497127
489
- },
490
- "height": 227.0,
491
- "parentId": null,
492
- "width": 275.0
493
- },
494
- {
495
- "id": "Text embedder 2",
496
- "type": "basic",
497
- "data": {
498
- "title": "Text embedder",
499
- "params": {
500
- "model": "text-embedding-ada-002"
501
- },
502
- "display": null,
503
- "error": null,
504
- "meta": {
505
  "params": {
506
- "model": {
507
- "default": "text-embedding-ada-002",
508
- "type": {
509
- "type": "<class 'str'>"
510
- },
511
- "name": "model"
512
- }
513
- },
514
- "name": "Text embedder",
515
- "outputs": {
516
- "output": {
517
  "type": {
518
- "type": "None"
519
- },
520
- "position": "top",
521
- "name": "output"
522
  }
523
  },
524
- "type": "basic",
525
- "inputs": {
526
- "llm": {
527
- "type": {
528
- "type": "<class 'inspect._empty'>"
529
- },
530
- "name": "llm",
531
- "position": "bottom"
532
- }
533
- }
534
- }
535
  },
 
 
 
536
  "position": {
537
- "x": -719.98604638686,
538
- "y": 1343.5978526690794
539
  },
540
- "width": 200.0,
541
- "height": 200.0,
542
- "parentId": null
543
  },
544
  {
545
- "id": "LLM 2",
546
- "type": "basic",
547
  "data": {
548
- "title": "LLM",
549
- "params": {
550
- "name": "openai"
551
- },
552
  "display": null,
553
  "error": null,
 
554
  "meta": {
 
 
555
  "outputs": {
556
  "output": {
557
- "position": "top",
558
  "name": "output",
 
559
  "type": {
560
  "type": "None"
561
  }
562
  }
563
  },
564
- "name": "LLM",
565
- "type": "basic",
566
- "inputs": {},
567
  "params": {
568
  "name": {
569
- "default": "openai",
570
  "name": "name",
571
  "type": {
572
  "type": "<class 'str'>"
573
  }
574
  }
575
- }
576
- }
577
  },
 
 
 
578
  "position": {
579
- "x": -727.6171373682814,
580
- "y": 1649.7242636905507
581
  },
582
- "width": 200.0,
583
- "parentId": null,
584
- "height": 200.0
585
  },
586
  {
587
- "id": "Truncate history 1",
588
- "type": "basic",
589
  "data": {
590
- "title": "Truncate history",
591
- "params": {
592
- "max_tokens": 10000.0
593
- },
594
  "display": null,
595
  "error": null,
 
596
  "meta": {
 
 
597
  "outputs": {
598
  "output": {
 
 
599
  "type": {
600
  "type": "None"
601
- },
602
- "name": "output",
603
- "position": "top"
604
  }
605
  },
606
- "type": "basic",
607
  "params": {
608
- "max_tokens": {
609
- "default": 10000.0,
610
- "name": "max_tokens",
611
  "type": {
612
- "type": "<class 'int'>"
613
  }
614
  }
615
  },
616
- "name": "Truncate history",
617
- "inputs": {}
618
- }
  },
 
 
 
620
  "position": {
621
- "x": 0.08889822620079713,
622
- "y": 1044.7639853229612
623
  },
624
- "height": 200.0,
625
- "width": 200.0,
626
- "parentId": null
627
  },
628
  {
629
- "id": "Chat processor 1",
630
- "type": "basic",
631
  "data": {
632
- "title": "Chat processor",
633
- "params": {},
634
  "display": null,
635
  "error": null,
636
- "__execution_delay": null,
637
- "collapsed": true,
638
  "meta": {
639
- "name": "Chat processor",
640
  "inputs": {
641
- "processor": {
642
- "name": "processor",
643
  "position": "bottom",
644
  "type": {
645
  "type": "<class 'inspect._empty'>"
646
  }
 
 
 
 
 
 
 
647
  }
648
  },
649
- "params": {},
650
- "type": "basic",
651
  "outputs": {
652
  "output": {
 
 
653
  "type": {
654
  "type": "None"
655
- },
656
- "position": "top",
657
- "name": "output"
658
  }
659
- }
660
- }
661
  },
 
 
 
662
  "position": {
663
- "x": 182.89729246405872,
664
- "y": 778.546274223181
665
  },
666
- "parentId": null,
667
- "width": 200.0,
668
- "height": 200.0
669
  },
670
  {
671
- "id": "Mask 1",
672
- "type": "basic",
673
  "data": {
674
- "title": "Mask",
675
- "params": {
676
- "mask_pattern": "masked_email_address_{}",
677
- "name": "email",
678
679
- "regex": "([a-z0-9!#$%&'*+\\/=?^_`{|.}~-]+@(?:[a-z0-9](?:[a-z0-9-]*[a-z0-9])?\\.)+[a-z0-9](?:[a-z0-9-]*[a-z0-9])?)"
680
  },
681
- "display": null,
682
  "error": null,
 
683
  "meta": {
684
- "inputs": {},
685
- "outputs": {
686
- "output": {
687
- "position": "top",
688
- "name": "output",
689
  "type": {
690
- "type": "None"
691
  }
692
  }
693
  },
694
- "type": "basic",
695
- "name": "Mask",
696
- "params": {
697
- "name": {
698
- "default": "",
699
- "name": "name",
700
- "type": {
701
- "type": "<class 'str'>"
702
- }
703
- },
704
- "exceptions": {
705
- "name": "exceptions",
706
- "type": {
707
- "type": "<class 'str'>"
708
- },
709
- "default": ""
710
- },
711
- "regex": {
712
- "type": {
713
- "type": "<class 'str'>"
714
- },
715
- "name": "regex",
716
- "default": ""
717
- },
718
- "mask_pattern": {
719
- "default": "",
720
- "type": {
721
- "type": "<class 'str'>"
722
- },
723
- "name": "mask_pattern"
724
- }
725
- }
726
- }
727
  },
 
 
 
728
  "position": {
729
- "x": 233.69759202223884,
730
- "y": 1041.6145468043276
731
  },
732
- "height": 200.0,
733
- "parentId": null,
734
- "width": 200.0
735
  },
736
  {
737
- "id": "Mask 2",
738
- "type": "basic",
739
  "data": {
740
- "title": "Mask",
741
- "params": {
742
- "regex": "((?:(?:\\\\d{4}[- ]?){3}\\\\d{4}|\\\\d{15,16}))(?![\\\\d])",
743
- "exceptions": "",
744
- "name": "credit_card",
745
- "mask_pattern": "masked_credit_card_number_{}"
746
- },
747
  "display": null,
748
  "error": null,
 
749
  "meta": {
 
 
 
 
 
 
 
 
 
 
750
  "outputs": {
751
  "output": {
752
  "name": "output",
@@ -756,214 +683,52 @@
756
  }
757
  }
758
  },
759
- "inputs": {},
760
- "name": "Mask",
761
- "type": "basic",
762
  "params": {
763
- "exceptions": {
764
- "type": {
765
- "type": "<class 'str'>"
766
- },
767
- "default": "",
768
- "name": "exceptions"
769
- },
770
- "regex": {
771
- "default": "",
772
  "type": {
773
  "type": "<class 'str'>"
774
- },
775
- "name": "regex"
776
  },
777
- "mask_pattern": {
778
- "name": "mask_pattern",
 
779
  "type": {
780
  "type": "<class 'str'>"
781
- },
782
- "default": ""
783
  },
784
- "name": {
785
- "name": "name",
786
- "default": "",
787
  "type": {
788
  "type": "<class 'str'>"
789
  }
790
  }
791
- }
792
- }
793
- },
794
- "position": {
795
- "x": 513.2761671440603,
796
- "y": 1034.8547191984255
797
- },
798
- "width": 200.0,
799
- "parentId": null,
800
- "height": 200.0
801
- },
802
- {
803
- "id": "Test Chat API 2",
804
- "type": "basic",
805
- "data": {
806
- "title": "Test Chat API",
807
- "params": {
808
- "show_details": false
809
- },
810
- "display": null,
811
- "error": null,
812
- "collapsed": false,
813
- "__execution_delay": 0.0,
814
- "meta": {
815
- "params": {
816
- "show_details": {
817
- "default": false,
818
- "type": {
819
- "type": "<class 'bool'>"
820
- },
821
- "name": "show_details"
822
- }
823
- },
824
- "inputs": {
825
- "message": {
826
- "name": "message",
827
- "position": "left",
828
- "type": {
829
- "type": "<class 'inspect._empty'>"
830
- }
831
- },
832
- "chat_api": {
833
- "position": "bottom",
834
- "type": {
835
- "type": "<class 'inspect._empty'>"
836
- },
837
- "name": "chat_api"
838
- }
839
  },
840
- "outputs": {
841
- "output": {
842
- "position": "right",
843
- "type": {
844
- "type": "None"
845
- },
846
- "name": "output"
847
- }
848
  },
849
- "name": "Test Chat API",
850
  "type": "basic"
851
- }
 
 
 
 
 
 
 
852
  },
 
 
 
853
  "position": {
854
- "x": -57.377776548056346,
855
- "y": -16.924593985348814
856
  },
857
- "width": 376.0,
858
- "parentId": null,
859
- "height": 225.0
860
- }
861
- ],
862
- "edges": [
863
- {
864
- "id": "xy-edge__Knowledge base 1output-Chat API 1knowledge_base",
865
- "source": "Knowledge base 1",
866
- "target": "Chat API 1",
867
- "sourceHandle": "output",
868
- "targetHandle": "knowledge_base"
869
- },
870
- {
871
- "id": "xy-edge__RAG chatbot 1output-Chat API 1chatbot",
872
- "source": "RAG chatbot 1",
873
- "target": "Chat API 1",
874
- "sourceHandle": "output",
875
- "targetHandle": "chatbot"
876
- },
877
- {
878
- "id": "xy-edge__LLM 1output-RAG chatbot 1llm",
879
- "source": "LLM 1",
880
- "target": "RAG chatbot 1",
881
- "sourceHandle": "output",
882
- "targetHandle": "llm"
883
- },
884
- {
885
- "id": "xy-edge__Scenario selector 1output-RAG chatbot 1scenario_selector",
886
- "source": "Scenario selector 1",
887
- "target": "RAG chatbot 1",
888
- "sourceHandle": "output",
889
- "targetHandle": "scenario_selector"
890
- },
891
- {
892
- "id": "xy-edge__RAG graph 1output-RAG chatbot 1rag_graph",
893
- "source": "RAG graph 1",
894
- "target": "RAG chatbot 1",
895
- "sourceHandle": "output",
896
- "targetHandle": "rag_graph"
897
- },
898
- {
899
- "id": "xy-edge__Vector store 1output-RAG graph 1vector_store",
900
- "source": "Vector store 1",
901
- "target": "RAG graph 1",
902
- "sourceHandle": "output",
903
- "targetHandle": "vector_store"
904
- },
905
- {
906
- "id": "xy-edge__Text embedder 2output-RAG graph 1text_embedder",
907
- "source": "Text embedder 2",
908
- "target": "RAG graph 1",
909
- "sourceHandle": "output",
910
- "targetHandle": "text_embedder"
911
- },
912
- {
913
- "id": "xy-edge__LLM 2output-Text embedder 2llm",
914
- "source": "LLM 2",
915
- "target": "Text embedder 2",
916
- "sourceHandle": "output",
917
- "targetHandle": "llm"
918
- },
919
- {
920
- "id": "xy-edge__Truncate history 1output-Chat processor 1processor",
921
- "source": "Truncate history 1",
922
- "target": "Chat processor 1",
923
- "sourceHandle": "output",
924
- "targetHandle": "processor"
925
- },
926
- {
927
- "id": "xy-edge__Chat processor 1output-Chat API 1chat_processor",
928
- "source": "Chat processor 1",
929
- "target": "Chat API 1",
930
- "sourceHandle": "output",
931
- "targetHandle": "chat_processor"
932
- },
933
- {
934
- "id": "xy-edge__Mask 1output-Chat processor 1processor",
935
- "source": "Mask 1",
936
- "target": "Chat processor 1",
937
- "sourceHandle": "output",
938
- "targetHandle": "processor"
939
- },
940
- {
941
- "id": "xy-edge__Mask 2output-Chat processor 1processor",
942
- "source": "Mask 2",
943
- "target": "Chat processor 1",
944
- "sourceHandle": "output",
945
- "targetHandle": "processor"
946
- },
947
- {
948
- "id": "xy-edge__Input chat 1output-Test Chat API 2message",
949
- "source": "Input chat 1",
950
- "target": "Test Chat API 2",
951
- "sourceHandle": "output",
952
- "targetHandle": "message"
953
- },
954
- {
955
- "id": "xy-edge__Test Chat API 2output-View 1input",
956
- "source": "Test Chat API 2",
957
- "target": "View 1",
958
- "sourceHandle": "output",
959
- "targetHandle": "input"
960
- },
961
- {
962
- "id": "xy-edge__Chat API 1output-Test Chat API 2chat_api",
963
- "source": "Chat API 1",
964
- "target": "Test Chat API 2",
965
- "sourceHandle": "output",
966
- "targetHandle": "chat_api"
967
  }
968
  ]
969
  }
 
1
  {
2
+ "edges": [
3
+ {
4
+ "id": "Cloud-sourced File Listing 1 LynxScribe Text RAG Loader 1",
5
+ "source": "Cloud-sourced File Listing 1",
6
+ "sourceHandle": "output",
7
+ "target": "LynxScribe Text RAG Loader 1",
8
+ "targetHandle": "file_urls"
9
+ },
10
+ {
11
+ "id": "Truncate history 1 Chat processor 1",
12
+ "source": "Truncate history 1",
13
+ "sourceHandle": "output",
14
+ "target": "Chat processor 1",
15
+ "targetHandle": "processor"
16
+ },
17
+ {
18
+ "id": "Chat processor 1 LynxScribe RAG Graph Chatbot Backend 1",
19
+ "source": "Chat processor 1",
20
+ "sourceHandle": "output",
21
+ "target": "LynxScribe RAG Graph Chatbot Backend 1",
22
+ "targetHandle": "chat_processor"
23
+ },
24
+ {
25
+ "id": "Mask 1 Chat processor 1",
26
+ "source": "Mask 1",
27
+ "sourceHandle": "output",
28
+ "target": "Chat processor 1",
29
+ "targetHandle": "processor"
30
+ },
31
+ {
32
+ "id": "Input chat 1 Test Chat API 1",
33
+ "source": "Input chat 1",
34
+ "sourceHandle": "output",
35
+ "target": "Test Chat API 1",
36
+ "targetHandle": "message"
37
+ },
38
+ {
39
+ "id": "LynxScribe RAG Graph Chatbot Backend 1 Test Chat API 1",
40
+ "source": "LynxScribe RAG Graph Chatbot Backend 1",
41
+ "sourceHandle": "output",
42
+ "target": "Test Chat API 1",
43
+ "targetHandle": "chat_api"
44
+ },
45
+ {
46
+ "id": "Test Chat API 1 View 1",
47
+ "source": "Test Chat API 1",
48
+ "sourceHandle": "output",
49
+ "target": "View 1",
50
+ "targetHandle": "input"
51
+ },
52
+ {
53
+ "id": "LynxScribe Text RAG Loader 1 LynxScribe RAG Graph Chatbot Builder 1",
54
+ "source": "LynxScribe Text RAG Loader 1",
55
+ "sourceHandle": "output",
56
+ "target": "LynxScribe RAG Graph Chatbot Builder 1",
57
+ "targetHandle": "rag_graph"
58
+ },
59
+ {
60
+ "id": "LynxScribe RAG Graph Chatbot Builder 1 LynxScribe RAG Graph Chatbot Backend 1",
61
+ "source": "LynxScribe RAG Graph Chatbot Builder 1",
62
+ "sourceHandle": "output",
63
+ "target": "LynxScribe RAG Graph Chatbot Backend 1",
64
+ "targetHandle": "knowledge_base"
65
+ }
66
+ ],
67
  "env": "LynxScribe",
68
  "nodes": [
69
  {
 
 
70
  "data": {
71
+ "__execution_delay": 0.0,
72
+ "collapsed": null,
 
 
73
  "display": null,
74
  "error": null,
75
+ "input_metadata": null,
76
  "meta": {
77
  "inputs": {},
78
+ "name": "Cloud-sourced File Listing",
 
 
 
 
 
 
 
 
79
  "outputs": {
80
  "output": {
81
  "name": "output",
82
+ "position": "right",
83
  "type": {
84
  "type": "None"
85
+ }
86
+ }
87
+ },
88
+ "params": {
89
+ "accepted_file_types": {
90
+ "default": ".jpg, .jpeg, .png",
91
+ "name": "accepted_file_types",
92
+ "type": {
93
+ "type": "<class 'str'>"
94
+ }
95
+ },
96
+ "cloud_provider": {
97
+ "default": "gcp",
98
+ "name": "cloud_provider",
99
+ "type": {
100
+ "enum": [
101
+ "GCP",
102
+ "AWS",
103
+ "AZURE"
104
+ ]
105
+ }
106
+ },
107
+ "folder_URL": {
108
+ "default": "https://storage.googleapis.com/lynxkite_public_data/lynxscribe-images/image-rag-test",
109
+ "name": "folder_URL",
110
+ "type": {
111
+ "type": "<class 'str'>"
112
+ }
113
  }
114
  },
 
115
  "type": "basic"
116
  },
117
+ "params": {
118
+ "accepted_file_types": ".pickle",
119
+ "cloud_provider": "GCP",
120
+ "folder_URL": "https://storage.googleapis.com/lynxkite_public_data/lynxscribe-knowledge-graphs/lynx-chatbot"
121
+ },
122
+ "status": "done",
123
+ "title": "Cloud-sourced File Listing"
124
  },
125
+ "dragHandle": ".bg-primary",
126
+ "height": 286.0,
127
+ "id": "Cloud-sourced File Listing 1",
128
  "position": {
129
+ "x": -827.0,
130
+ "y": 382.0
131
  },
132
+ "type": "basic",
133
+ "width": 515.0
 
134
  },
135
  {
 
 
136
  "data": {
137
+ "__execution_delay": 0.0,
138
+ "collapsed": null,
139
+ "display": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
140
  "error": null,
141
+ "input_metadata": null,
142
  "meta": {
 
 
143
  "inputs": {
144
+ "file_urls": {
145
+ "name": "file_urls",
146
+ "position": "left",
147
  "type": {
148
  "type": "<class 'inspect._empty'>"
149
+ }
 
150
  }
151
  },
152
+ "name": "LynxScribe Text RAG Loader",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
153
  "outputs": {
154
  "output": {
155
+ "name": "output",
156
+ "position": "right",
157
  "type": {
158
  "type": "None"
159
+ }
 
 
160
  }
161
  },
 
162
  "params": {
163
+ "input_type": {
164
+ "default": "v1",
165
+ "name": "input_type",
166
+ "type": {
167
+ "enum": [
168
+ "V1",
169
+ "V2"
170
+ ]
171
+ }
172
+ },
173
+ "text_embedder_interface": {
174
  "default": "openai",
175
+ "name": "text_embedder_interface",
176
  "type": {
177
  "type": "<class 'str'>"
178
  }
179
+ },
180
+ "text_embedder_model_name_or_path": {
181
+ "default": "text-embedding-3-large",
182
+ "name": "text_embedder_model_name_or_path",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
183
  "type": {
184
  "type": "<class 'str'>"
185
+ }
 
 
186
  },
187
+ "vdb_collection_name": {
188
+ "default": "lynx",
189
+ "name": "vdb_collection_name",
190
  "type": {
191
  "type": "<class 'str'>"
192
+ }
193
+ },
194
+ "vdb_num_dimensions": {
195
+ "default": 3072.0,
196
+ "name": "vdb_num_dimensions",
 
 
 
 
197
  "type": {
198
+ "type": "<class 'int'>"
199
+ }
200
+ },
201
+ "vdb_provider_name": {
202
+ "default": "faiss",
203
+ "name": "vdb_provider_name",
204
+ "type": {
205
+ "type": "<class 'str'>"
206
  }
207
  }
208
  },
209
+ "type": "basic"
210
+ },
211
+ "params": {
212
+ "input_type": "V1",
213
+ "text_embedder_interface": "openai",
214
+ "text_embedder_model_name_or_path": "text-embedding-ada-002",
215
+ "vdb_collection_name": "lynx",
216
+ "vdb_num_dimensions": "1536",
217
+ "vdb_provider_name": "faiss"
218
+ },
219
+ "status": "done",
220
+ "title": "LynxScribe Text RAG Loader"
221
  },
222
+ "dragHandle": ".bg-primary",
223
+ "height": 515.0,
224
+ "id": "LynxScribe Text RAG Loader 1",
225
  "position": {
226
+ "x": -173.0,
227
+ "y": 268.0
228
  },
229
+ "type": "basic",
230
+ "width": 290.0
 
231
  },
232
  {
 
 
233
  "data": {
234
+ "__execution_delay": 0.0,
235
+ "collapsed": null,
 
 
236
  "display": null,
237
  "error": null,
238
+ "input_metadata": null,
239
  "meta": {
 
 
 
 
 
 
 
 
 
 
 
240
  "inputs": {
 
 
 
 
 
 
 
241
  "chat_processor": {
242
  "name": "chat_processor",
243
  "position": "bottom",
 
246
  }
247
  },
248
  "knowledge_base": {
249
+ "name": "knowledge_base",
 
 
250
  "position": "bottom",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
251
  "type": {
252
+ "type": "<class 'inspect._empty'>"
253
  }
254
  }
255
  },
256
+ "name": "LynxScribe RAG Graph Chatbot Backend",
257
  "outputs": {
258
  "output": {
 
259
  "name": "output",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
260
  "position": "top",
 
261
  "type": {
262
  "type": "None"
263
  }
264
  }
265
  },
266
  "params": {
267
+ "llm_interface": {
268
+ "default": "openai",
269
+ "name": "llm_interface",
270
  "type": {
271
+ "type": "<class 'str'>"
272
+ }
 
273
  },
274
+ "llm_model_name": {
275
+ "default": "gpt-4o",
276
+ "name": "llm_model_name",
277
  "type": {
278
+ "type": "<class 'str'>"
279
  }
280
  },
281
  "negative_answer": {
 
285
  "type": "<class 'str'>"
286
  }
287
  },
288
+ "retriever_limits_by_type": {
289
  "default": "{}",
290
+ "name": "retriever_limits_by_type",
291
  "type": {
292
  "type": "<class 'str'>"
293
  }
 
 
 
 
 
 
 
 
 
 
 
294
  },
295
+ "retriever_max_iterations": {
296
+ "default": 3.0,
297
+ "name": "retriever_max_iterations",
298
  "type": {
299
+ "type": "<class 'int'>"
300
  }
301
  },
302
+ "retriever_overall_chunk_limit": {
303
+ "default": 20.0,
304
+ "name": "retriever_overall_chunk_limit",
305
  "type": {
306
+ "type": "<class 'int'>"
307
+ }
308
+ },
309
+ "retriever_overall_token_limit": {
310
+ "default": 3000.0,
311
+ "name": "retriever_overall_token_limit",
312
+ "type": {
313
+ "type": "<class 'int'>"
314
+ }
315
+ },
316
+ "retriever_strict_limits": {
317
+ "default": true,
318
+ "name": "retriever_strict_limits",
319
+ "type": {
320
+ "type": "<class 'bool'>"
321
+ }
322
  }
323
+ },
324
+ "type": "basic"
325
  },
326
+ "params": {
327
+ "llm_interface": "openai",
328
+ "llm_model_name": "gpt-4o",
329
+ "negative_answer": "I'm sorry, but the data I've been trained on does not contain any information related to your question.",
330
+ "retriever_limits_by_type": "{\"information\": [1, 5], \"summary\": [0, 2], \"template_qna\": [1, 3], \"QnA question\": [0, 0]}",
331
+ "retriever_max_iterations": "3",
332
+ "retriever_overall_chunk_limit": 20.0,
333
+ "retriever_overall_token_limit": 3000.0,
334
+ "retriever_strict_limits": true
335
+ },
336
+ "status": "done",
337
+ "title": "LynxScribe RAG Graph Chatbot Backend"
338
  },
339
+ "dragHandle": ".bg-primary",
340
+ "height": 697.0,
341
+ "id": "LynxScribe RAG Graph Chatbot Backend 1",
342
  "position": {
343
+ "x": 356.69268530841373,
344
+ "y": -467.49315862719016
345
  },
346
+ "type": "basic",
347
+ "width": 821.0
 
348
  },
349
  {
 
 
350
  "data": {
 
 
351
  "display": null,
352
  "error": null,
353
+ "input_metadata": null,
354
  "meta": {
 
355
  "inputs": {
356
+ "processor": {
357
+ "name": "processor",
 
 
 
 
 
 
358
  "position": "bottom",
359
  "type": {
360
  "type": "<class 'inspect._empty'>"
361
+ }
 
362
  }
363
  },
364
+ "name": "Chat processor",
 
365
  "outputs": {
366
  "output": {
367
+ "name": "output",
368
  "position": "top",
369
  "type": {
370
  "type": "None"
371
+ }
 
372
  }
373
+ },
374
+ "params": {},
375
+ "type": "basic"
376
+ },
377
+ "params": {},
378
+ "status": "done",
379
+ "title": "Chat processor"
380
  },
381
+ "dragHandle": ".bg-primary",
382
+ "height": 220.0,
383
+ "id": "Chat processor 1",
384
  "position": {
385
+ "x": 907.3546850533578,
386
+ "y": 381.09754180073975
387
  },
388
+ "type": "basic",
389
+ "width": 387.0
 
390
  },
391
  {
 
 
392
  "data": {
 
 
 
 
 
393
  "display": null,
394
  "error": null,
395
+ "input_metadata": null,
396
  "meta": {
397
+ "inputs": {},
398
+ "name": "Truncate history",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
399
  "outputs": {
400
  "output": {
401
+ "name": "output",
402
+ "position": "top",
403
  "type": {
404
  "type": "None"
405
+ }
 
 
406
  }
407
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
408
  "params": {
409
+ "max_tokens": {
410
+ "default": 10000.0,
411
+ "name": "max_tokens",
 
 
 
 
 
 
 
 
412
  "type": {
413
+ "type": "<class 'int'>"
414
+ }
 
 
415
  }
416
  },
417
+ "type": "basic"
418
+ },
419
+ "params": {
420
+ "max_tokens": 10000.0
421
+ },
422
+ "status": "done",
423
+ "title": "Truncate history"
 
 
 
 
424
  },
425
+ "dragHandle": ".bg-primary",
426
+ "height": 200.0,
427
+ "id": "Truncate history 1",
428
  "position": {
429
+ "x": 931.4096899549071,
430
+ "y": 703.2861674410822
431
  },
432
+ "type": "basic",
433
+ "width": 200.0
 
434
  },
435
  {
 
 
436
  "data": {
437
+ "__execution_delay": 0.0,
438
+ "collapsed": false,
 
 
439
  "display": null,
440
  "error": null,
441
+ "input_metadata": null,
442
  "meta": {
443
+ "inputs": {},
444
+ "name": "Mask",
445
  "outputs": {
446
  "output": {
 
447
  "name": "output",
448
+ "position": "top",
449
  "type": {
450
  "type": "None"
451
  }
452
  }
453
  },
 
 
 
454
  "params": {
455
+ "exceptions": {
456
+ "default": "",
457
+ "name": "exceptions",
458
+ "type": {
459
+ "type": "<class 'str'>"
460
+ }
461
+ },
462
+ "mask_pattern": {
463
+ "default": "",
464
+ "name": "mask_pattern",
465
+ "type": {
466
+ "type": "<class 'str'>"
467
+ }
468
+ },
469
  "name": {
470
+ "default": "",
471
  "name": "name",
472
  "type": {
473
  "type": "<class 'str'>"
474
  }
475
+ },
476
+ "regex": {
477
+ "default": "",
478
+ "name": "regex",
479
+ "type": {
480
+ "type": "<class 'str'>"
481
+ }
482
  }
483
+ },
484
+ "type": "basic"
485
+ },
486
+ "params": {
487
488
+ "mask_pattern": "masked_email_address_{}",
489
+ "name": "email",
490
+ "regex": "([a-z0-9!#$%&'*+\\/=?^_`{|.}~-]+@(?:[a-z0-9](?:[a-z0-9-]*[a-z0-9])?\\.)+[a-z0-9](?:[a-z0-9-]*[a-z0-9])?)"
491
+ },
492
+ "status": "done",
493
+ "title": "Mask"
494
  },
495
+ "dragHandle": ".bg-primary",
496
+ "height": 366.0,
497
+ "id": "Mask 1",
498
  "position": {
499
+ "x": 1163.4170914925835,
500
+ "y": 712.6187958660655
501
  },
502
+ "type": "basic",
503
+ "width": 281.0
 
504
  },
505
  {
 
 
506
  "data": {
507
+ "__execution_delay": 0.0,
508
+ "collapsed": null,
 
 
509
  "display": null,
510
  "error": null,
511
+ "input_metadata": null,
512
  "meta": {
513
+ "inputs": {},
514
+ "name": "Input chat",
515
  "outputs": {
516
  "output": {
517
+ "name": "output",
518
+ "position": "right",
519
  "type": {
520
  "type": "None"
521
+ }
 
 
522
  }
523
  },
 
524
  "params": {
525
+ "chat": {
526
+ "default": null,
527
+ "name": "chat",
528
  "type": {
529
+ "type": "<class 'str'>"
530
  }
531
  }
532
  },
533
+ "type": "basic"
534
+ },
535
+ "params": {
536
+ "chat": "Who is the CEO of Lynx?"
537
+ },
538
+ "status": "done",
539
+ "title": "Input chat"
540
  },
541
+ "dragHandle": ".bg-primary",
542
+ "height": 198.0,
543
+ "id": "Input chat 1",
544
  "position": {
545
+ "x": -854.3584473819146,
546
+ "y": -770.2371549901112
547
  },
548
+ "type": "basic",
549
+ "width": 910.0
 
550
  },
551
  {
 
 
552
  "data": {
553
+ "__execution_delay": 0.0,
554
+ "collapsed": null,
555
  "display": null,
556
  "error": null,
557
+ "input_metadata": null,
 
558
  "meta": {
 
559
  "inputs": {
560
+ "chat_api": {
561
+ "name": "chat_api",
562
  "position": "bottom",
563
  "type": {
564
  "type": "<class 'inspect._empty'>"
565
  }
566
+ },
567
+ "message": {
568
+ "name": "message",
569
+ "position": "left",
570
+ "type": {
571
+ "type": "<class 'inspect._empty'>"
572
+ }
573
  }
574
  },
575
+ "name": "Test Chat API",
 
576
  "outputs": {
577
  "output": {
578
+ "name": "output",
579
+ "position": "right",
580
  "type": {
581
  "type": "None"
582
+ }
 
 
583
  }
584
+ },
585
+ "params": {
586
+ "show_details": {
587
+ "default": false,
588
+ "name": "show_details",
589
+ "type": {
590
+ "type": "<class 'bool'>"
591
+ }
592
+ }
593
+ },
594
+ "type": "basic"
595
+ },
596
+ "params": {
597
+ "show_details": false
598
+ },
599
+ "status": "done",
600
+ "title": "Test Chat API"
601
  },
602
+ "dragHandle": ".bg-primary",
603
+ "height": 260.0,
604
+ "id": "Test Chat API 1",
605
  "position": {
606
+ "x": 356.57819670145534,
607
+ "y": -803.3229228909706
608
  },
609
+ "type": "basic",
610
+ "width": 820.0
 
611
  },
612
  {
 
 
613
  "data": {
614
+ "display": {
615
+ "dataframes": {
616
+ "df": {
617
+ "columns": [
618
+ "answer"
619
+ ],
620
+ "data": [
621
+ [
622
+ "The CEO of Lynx Analytics is Gyorgy Lajtai. He is also a co-founder of the company and has a rich background in CRM, marketing automation, and systems."
623
+ ]
624
+ ]
625
+ }
626
+ }
627
  },
 
628
  "error": null,
629
+ "input_metadata": null,
630
  "meta": {
631
+ "inputs": {
632
+ "input": {
633
+ "name": "input",
634
+ "position": "left",
 
635
  "type": {
636
+ "type": "<class 'inspect._empty'>"
637
  }
638
  }
639
  },
640
+ "name": "View",
641
+ "outputs": {},
642
+ "params": {},
643
+ "type": "table_view"
644
+ },
645
+ "params": {},
646
+ "status": "done",
647
+ "title": "View"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
648
  },
649
+ "dragHandle": ".bg-primary",
650
+ "height": 627.0,
651
+ "id": "View 1",
652
  "position": {
653
+ "x": 1497.8623453933426,
654
+ "y": -810.6258103791108
655
  },
656
+ "type": "table_view",
657
+ "width": 995.0
 
658
  },
659
  {
 
 
660
  "data": {
661
+ "__execution_delay": 0.0,
662
+ "collapsed": null,
 
 
 
 
 
663
  "display": null,
664
  "error": null,
665
+ "input_metadata": null,
666
  "meta": {
667
+ "inputs": {
668
+ "rag_graph": {
669
+ "name": "rag_graph",
670
+ "position": "left",
671
+ "type": {
672
+ "type": "<class 'inspect._empty'>"
673
+ }
674
+ }
675
+ },
676
+ "name": "LynxScribe RAG Graph Chatbot Builder",
677
  "outputs": {
678
  "output": {
679
  "name": "output",
 
683
  }
684
  }
685
  },
 
 
 
686
  "params": {
687
+ "node_types": {
688
+ "default": "intent_cluster",
689
+ "name": "node_types",
 
 
 
 
 
 
690
  "type": {
691
  "type": "<class 'str'>"
692
+ }
 
693
  },
694
+ "scenario_file": {
695
+ "default": "uploads/lynx_chatbot_scenario_selector.yaml",
696
+ "name": "scenario_file",
697
  "type": {
698
  "type": "<class 'str'>"
699
+ }
 
700
  },
701
+ "scenario_meta_name": {
702
+ "default": "scenario_name",
703
+ "name": "scenario_meta_name",
704
  "type": {
705
  "type": "<class 'str'>"
706
  }
707
  }
 
 
 
 
708
  },
709
+ "position": {
710
+ "x": 1121.0,
711
+ "y": 813.0
 
 
 
 
 
712
  },
 
713
  "type": "basic"
714
+ },
715
+ "params": {
716
+ "node_types": "intent_cluster",
717
+ "scenario_file": "uploads/lynx_chatbot_scenario_selector.yaml",
718
+ "scenario_meta_name": ""
719
+ },
720
+ "status": "done",
721
+ "title": "LynxScribe RAG Graph Chatbot Builder"
722
  },
723
+ "dragHandle": ".bg-primary",
724
+ "height": 297.0,
725
+ "id": "LynxScribe RAG Graph Chatbot Builder 1",
726
  "position": {
727
+ "x": 328.41755532473496,
728
+ "y": 378.2277574498554
729
  },
730
+ "type": "basic",
731
+ "width": 396.0
 
 
 
732
  }
733
  ]
734
  }
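The workspace above passes `retriever_limits_by_type` to the backend node as a JSON string mapping node types to `[min, max]` limits. A minimal sketch of how such a string is parsed, mirroring the `json.loads` call in the backend op later in this diff; the reading of the two numbers as per-type minimum/maximum chunk counts is an assumption.

```python
import json

# Value copied from the "LynxScribe RAG Graph Chatbot Backend" node above.
retriever_limits_by_type = (
    '{"information": [1, 5], "summary": [0, 2], "template_qna": [1, 3], "QnA question": [0, 0]}'
)

# The backend op parses the string with json.loads before handing it to the retriever.
limits_by_type = json.loads(retriever_limits_by_type)
assert limits_by_type["summary"] == [0, 2]  # assumed meaning: [min, max] chunks of this type
```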
examples/uploads/image_description_prompts.yaml ADDED
@@ -0,0 +1,90 @@
1
+ cot_picture_descriptor:
2
+ - role: system
3
+ content: &cot_starter >
4
+ You are an advanced AI specializing in structured image descriptions using a Chain-of-Thought (CoT) approach.
5
+ Your goal is to analyze an image and return a detailed dictionary containing relevant details categorized by elements.
6
+
7
+ - role: system
8
+ content: &cot_details >
9
+ You should always return a dictionary with the following main keys:
10
+ - "image type": Identify whether the image is a "picture", "diagram", "flowchart", "advertisement", or "other".
11
+ - "overall description": A concise but clear summary of the entire image.
12
+ - "details": A dictionary containing all significant elements in the image, where:
13
+ * Each key represents a major object or entity in the image.
14
+ * Each value is a detailed description of that entity.
15
+
16
+ - role: system
17
+ content: &cot_normal_pic >
18
+ If the image is a normal picture (e.g., a scene with people, animals, landscapes, or objects in a real-world setting),
19
+ follow these steps:
20
+ 1. Identify and describe the background (e.g., sky, buildings, landscape).
21
+ 2. Identify the main action happening (e.g., a dog chasing a ball).
22
+ 3. Break down individual objects and provide a description for each, including attributes like color, size, texture, and their relationship with other objects.
23
+ In this case, the sub-dictionary under the "details" key should contain the following keys:
24
+ * "background": A description of the background elements.
25
+ * "main scene": A summary of the primary action taking place.
26
+ * Individual keys for all identified objects, each with a detailed description.
27
+ While describing the objects, be very detailed. Do not just mention a person; mention, for example: a middle-aged woman with brown curly hair, ...
28
+
29
+ - role: system
30
+ content: &cot_diagrams >
31
+ If the image is a diagram, identify key labeled components and describe their meaning.
32
+ - Describe the meaning of the diagram, and if there are axes, explain their purpose.
33
+ - Provide an interpretation of the overall meaning and takeaway from the chart, including relationships between elements if applicable.
34
+ In this case, the sub-dictionary under the "details" key should contain the following keys:
35
+ * "x-axis", "y-axis" (or variations like "y1-axis" and "y2-axis") if applicable.
36
+ * "legend": A description of the plotted data, including sources if available.
37
+ * "takeaway": A summary of the main insights derived from the chart.
38
+ * Additional structured details, such as grouped data (e.g., individual timelines in a line chart).
39
+
40
+ - role: system
41
+ content: &cot_flowcharts >
42
+ If the image is a flowchart:
43
+ - Identify the start and end points.
44
+ - List key process steps and decision nodes.
45
+ - Describe directional flows and relationships between components.
46
+ In this case, the sub-dictionary under the "details" key should contain the following keys:
47
+ * "start points": The identified starting nodes of the flowchart.
48
+ * "end points": The final outcome(s) of the flowchart.
49
+ * "detailed description": A natural language explanation of the entire flow.
50
+ * Additional keys for each process step and decision point, described in detail.
51
+
52
+ - role: system
53
+ content: &cot_ads >
54
+ If the image is an advertisement:
55
+ - Describe the main subject and any branding elements.
56
+ - Identify slogans, logos, and promotional text.
57
+ - Analyze the visual strategy used (e.g., color scheme, emotional appeal, focal points).
58
+ In this case, the sub-dictionary under the "details" key should contain the following keys:
59
+ * "advertised brand": The brand being promoted.
60
+ * "advertised product": The product or service being advertised.
61
+ * "background": The background setting of the advertisement.
62
+ * "main scene": The primary subject or action depicted.
63
+ * "used slogans": Any slogans or catchphrases appearing in the advertisement.
64
+ * "visual strategy": An analysis of the design and emotional impact.
65
+ * Additional keys for individual objects, just like in the case of normal pictures.
66
+
67
+ - role: system
68
+ content: &cot_output_example >
69
+ Example output for a normal picture:
70
+
71
+ ```json
72
+ {
73
+ "image type": "picture",
74
+ "overall description": "A peaceful rural landscape featuring a cow chained to a tree in a field with mountains in the background.",
75
+ "details": {
76
+ "background": "A large open field with patches of grass and dirt, surrounded by distant mountains under a clear blue sky.",
77
+ "main scene": "A cow chained to a tree in the middle of a grassy field.",
78
+ "cow": "A brown and white cow standing near the tree, appearing calm.",
79
+ "tree": "A sturdy oak tree with green leaves and a metal chain wrapped around its trunk.",
80
+ "mountain": "Tall, rocky mountains stretching across the horizon.",
81
+ "chain": "A shiny metal chain, slightly rusty in some places."
82
+ }
83
+ }
84
+ ```
85
+ - role: user
86
+ content:
87
+ - type: text
88
+ text: "Describe this image as you were trained to. Only output the dictionary and add nothing else."
89
+ - type: "image_url"
90
+ image_url: {image_address}
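The prompt set above is a list of chat messages; the final user message carries an `{image_address}` placeholder that has to be replaced with a concrete image URL. A minimal sketch of that step, assuming PyYAML for loading (the describer op later in this diff does the equivalent with lynxscribe's `load_config`); the image URL is hypothetical.

```python
from copy import deepcopy

import yaml

# Load the prompt set and pick the chain-of-thought picture descriptor.
with open("uploads/image_description_prompts.yaml") as f:
    prompts = yaml.safe_load(f)
messages = deepcopy(prompts["cot_picture_descriptor"])

# Replace the {image_address} placeholder in the user message with a real image URL.
image_url = "https://storage.googleapis.com/lynxkite_public_data/lynxscribe-images/image-rag-test/example.jpg"  # hypothetical
for message in messages:
    if isinstance(message["content"], list):
        for part in message["content"]:
            if "image_url" in part:
                part["image_url"] = {"url": image_url}
```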
examples/uploads/lynx_chatbot_scenario_selector.yaml ADDED
@@ -0,0 +1,302 @@
1
+ - name: general_interest
2
+ mode: retrieve_llm # Literal[retrieve_llm, retrieve_only, llm_only, fixed_answer, sticky_answer]
3
+ prompt_messages: # Answer prompts in [role, content] format, should contain {context}
4
+ - role: system # Literal[system, assistant, user, tool]
5
+ content: &role >
6
+ You are LynxScribe, a chatbot representing Lynx Analytics, a leading Singaporean analytics
7
+ company specializing in pharma, life sciences, generative AI, and graph AI. Your role is to
8
+ respond to inquiries on the Lynx Analytics website. To better understand the visitors'
9
+ needs, you may ask follow-up questions as detailed in subsequent instructions.
10
+ - role: system
11
+ content: &preferences >
12
+ Lynx Analytics specializes in a range of areas including pharma (with a focus on marketing
13
+ support), life sciences, graph AI, and generative AI solutions. When responding to inquiries
14
+ about our solutions or products, give priority to those related to generative AI (chatbots
15
+ for pharma and service providers), graph AI (graph reasoning), and pharma (research, key
16
+ opinion leaders, brand adoption ladder). Also, briefly touch upon our offerings in retail
17
+ (price AI, assort AI, promo AI) and finance (digital banking, Customer Happiness Index), as
18
+ these are areas of secondary priority. Additionally, telecommunication is worth
19
+ mentioning briefly to highlight our comprehensive range of expertise and solutions.
20
+ - role: system
21
+ content: &context >
22
+ Respond to questions solely based on the context outlined below:\n\n{context}
23
+ - role: system
24
+ content: &instr_prices >
25
+ If inquiries about pricing arise, suggest contacting Lynx Analytics for detailed
26
+ information. Additionally, emphasize that Lynx Analytics offers solutions at competitive
27
+ prices without compromising on quality.
28
+ - role: system
29
+ content: &ask_industry >
30
+ If it's not mentioned in the chat history, include a question at the end of your response
31
+ to inquire about their industry interest or employment. For example: 'May I know which
32
+ specific domain or industry you are interested in or work in?'
33
+ - role: system
34
+ content: &ask_visit_reason >
35
+ If the chat history does not reveal it, ask about their reason for visiting the website. For
36
+ instance, you might say: 'Could you share what prompted your visit to our website today?'
37
+ - role: system
38
+ content: &final_instr >
39
+ Carefully answer questions based on the provided context. Refrain from introducing new
40
+ names; use only those within your context. Respond in the language of the question. If
41
+ necessary, ask follow-up questions. Ensure your answers are clear, utilizing bullet points
42
+ where appropriate. Avoid phrases like 'According to this article' to maintain a natural
43
+ tone.
44
+ link_answer: &link # When present, formatted node link appends to answer, should contain {link}
45
+ "\n\nPlease visit <a href='{link}' target='_blank'>{link}</a> for further information."
46
+ min_similarity_score: -1 # Only need to specify if > -1 and in RETRIEVE_LLM or RETRIEVE_ONLY mode
47
+ - name: life_sciences_interest
48
+ mode: retrieve_llm
49
+ prompt_messages:
50
+ - role: system
51
+ content: *role
52
+ - role: system
53
+ content: *preferences
54
+ - role: system
55
+ content: *context
56
+ - role: system
57
+ content: *instr_prices
58
+ - role: system
59
+ content: &ask_profession >
60
+ If their job is not mentioned in the chat history, add a question at the end of your answer
61
+ about their profession. For example: 'Could you please tell me about your current profession
62
+ or occupation?'
63
+ - role: system
64
+ content: *ask_visit_reason
65
+ - role: system
66
+ content: &ask_email >
67
+ If their email is not already in the chat history, suggest that they can provide their email
68
+ address for further contact. For instance: 'Should you wish for further communication
69
+ regarding your queries, feel free to provide your email address.'
70
+ - role: system
71
+ content: *final_instr
72
+ link_answer: *link
73
+ min_similarity_score: -1
74
+ - name: finance_interest
75
+ mode: retrieve_llm
76
+ prompt_messages:
77
+ - role: system
78
+ content: *role
79
+ - role: system
80
+ content: *context
81
+ - role: system
82
+ content: *instr_prices
83
+ - role: system
84
+ content: &ask_responsibilities >
85
+ If their job or responsibilities are not detailed in the chat history, include a question
86
+ at the end of your response. For example: 'Would you mind sharing some details about the
87
+ specific responsibilities you manage in your role?'
88
+ - role: system
89
+ content: *ask_visit_reason
90
+ - role: system
91
+ content: *ask_email
92
+ - role: system
93
+ content: *final_instr
94
+ link_answer: *link
95
+ min_similarity_score: -1
96
+ - name: telco_interest
97
+ mode: retrieve_llm
98
+ prompt_messages:
99
+ - role: system
100
+ content: *role
101
+ - role: system
102
+ content: *context
103
+ - role: system
104
+ content: *instr_prices
105
+ - role: system
106
+ content: *ask_responsibilities
107
+ - role: system
108
+ content: *ask_visit_reason
109
+ - role: system
110
+ content: *ask_email
111
+ - role: system
112
+ content: *final_instr
113
+ link_answer: *link
114
+ min_similarity_score: -1
115
+ - name: retail_interest
116
+ mode: retrieve_llm
117
+ prompt_messages:
118
+ - role: system
119
+ content: *role
120
+ - role: system
121
+ content: *context
122
+ - role: system
123
+ content: *instr_prices
124
+ - role: system
125
+ content: *ask_responsibilities
126
+ - role: system
127
+ content: *ask_visit_reason
128
+ - role: system
129
+ content: *ask_email
130
+ - role: system
131
+ content: *final_instr
132
+ link_answer: *link
133
+ min_similarity_score: -1
134
+ - name: lynx_kite
135
+ mode: retrieve_llm
136
+ prompt_messages:
137
+ - role: system
138
+ content: *role
139
+ - role: system
140
+ content: *preferences
141
+ - role: system
142
+ content: *context
143
+ - role: system
144
+ content: *instr_prices
145
+ - role: system
146
+ content: *ask_industry
147
+ - role: system
148
+ content: &ask_graph >
149
+ If it's not mentioned in the chat history, include a question at the end of your response to
150
+ inquire about their specific needs related to graph analytics. For example: 'May I know
151
+ which particular graph-related problem you are looking to solve with graph analytics?'
152
+ - role: system
153
+ content: *ask_email
154
+ - role: system
155
+ content: *final_instr
156
+ link_answer: *link
157
+ min_similarity_score: -1
158
+ - name: lynx_team
159
+ mode: retrieve_llm
160
+ prompt_messages:
161
+ - role: system
162
+ content: *role
163
+ - role: system
164
+ content: *context
165
+ - role: system
166
+ content: *instr_prices
167
+ - role: system
168
+ content: *ask_visit_reason
169
+ - role: system
170
+ content: >
171
+ When they inquire about names that could refer to multiple individuals, provide the names
172
+ along with a brief description of each. Then, ask for clarification on which specific
173
+ individual they are referring to.
174
+ - role: system
175
+ content: *final_instr
176
+ link_answer: *link
177
+ min_similarity_score: -1
178
+ - name: lynx_career
179
+ mode: retrieve_llm
180
+ prompt_messages:
181
+ - role: system
182
+ content: *role
183
+ - role: system
184
+ content: *context
185
+ - role: system
186
+ content: *instr_prices
187
+ - role: system
188
+ content: *ask_responsibilities
189
+ - role: system
190
+ content: >
191
+ If it's not already mentioned in the chat history, include a question at the end of your
192
+ response to inquire about their motivation for wanting to work with us. For example: 'Could
193
+ you share what motivates you to seek a position with our team?'
194
+ - role: system
195
+ content: *ask_email
196
+ - role: system
197
+ content: *final_instr
198
+ link_answer: *link
199
+ min_similarity_score: -1
200
+ - name: lynxscribe
201
+ mode: retrieve_llm
202
+ prompt_messages:
203
+ - role: system
204
+ content: *role
205
+ - role: system
206
+ content: *preferences
207
+ - role: system
208
+ content: *context
209
+ - role: system
210
+ content: *instr_prices
211
+ - role: system
212
+ content: *ask_industry
213
+ - role: system
214
+ content: >
215
+ If the chat history does not already include this information, add a question at the end of
216
+ your response to identify their specific needs in generative AI. For example: 'Could you
217
+ please specify the problem you are aiming to address using generative AI?'
218
+ - role: system
219
+ content: *ask_email
220
+ - role: system
221
+ content: *final_instr
222
+ link_answer: *link
223
+ min_similarity_score: -1
224
+ - name: general_ds
225
+ mode: retrieve_llm
226
+ prompt_messages:
227
+ - role: system
228
+ content: *role
229
+ - role: system
230
+ content: *context
231
+ - role: system
232
+ content: *instr_prices
233
+ - role: system
234
+ content: *ask_industry
235
+ - role: system
236
+ content: *ask_visit_reason
237
+ - role: system
238
+ content: *ask_email
239
+ - role: system
240
+ content: *final_instr
241
+ link_answer: *link
242
+ min_similarity_score: -1
243
+ - name: general_graph
244
+ mode: retrieve_llm
245
+ prompt_messages:
246
+ - role: system
247
+ content: *role
248
+ - role: system
249
+ content: *preferences
250
+ - role: system
251
+ content: *context
252
+ - role: system
253
+ content: *instr_prices
254
+ - role: system
255
+ content: *ask_graph
256
+ - role: system
257
+ content: *ask_industry
258
+ - role: system
259
+ content: *ask_email
260
+ - role: system
261
+ content: *final_instr
262
+ link_answer: *link
263
+ min_similarity_score: -1
264
+ - name: other_okay
265
+ mode: retrieve_llm
266
+ prompt_messages:
267
+ - role: system
268
+ content: *role
269
+ - role: system
270
+ content: *preferences
271
+ - role: system
272
+ content: *context
273
+ - role: system
274
+ content: *instr_prices
275
+ - role: system
276
+ content: *ask_industry
277
+ - role: system
278
+ content: *ask_visit_reason
279
+ - role: system
280
+ content: *final_instr
281
+ link_answer: *link
282
+ min_similarity_score: -1
283
+ - name: contact_us
284
+ mode: retrieve_llm
285
+ prompt_messages:
286
+ - role: system
287
+ content: *role
288
+ - role: system
289
+ content: *context
290
+ - role: system
291
+ content: *instr_prices
292
+ - role: system
293
+ content: *ask_email
294
+ - role: system
295
+ content: *final_instr
296
+ link_answer: *link
297
+ min_similarity_score: -1
298
+ - name: malicious
299
+ mode: fixed_answer # Could be sticky, but if we want the user to rephrase, let's give 2nd chance
300
+ fixed_answer: >
301
+ I am sorry, but I feel you are trying to use me in the wrong way. If I am mistaken, please
302
+ try to rephrase your question.
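Each entry above becomes one `Scenario`, and the whole file is what the `LynxScribe RAG Graph Chatbot Builder` op added later in this diff feeds into a `ScenarioSelector`. A minimal sketch of that loading step, mirroring the builder op; the file path is the op's default.

```python
from lynxscribe.common.config import load_config
from lynxscribe.components.rag.rag_chatbot import Scenario, ScenarioSelector

# One Scenario per YAML entry, matched against RAG-graph nodes of the listed types.
scenarios = load_config("uploads/lynx_chatbot_scenario_selector.yaml")
scenario_selector = ScenarioSelector(
    scenarios=[Scenario(**scenario) for scenario in scenarios],
    node_types=["intent_cluster"],
)
```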
examples/uploads/organon_demo/backend-scenarios-en.yaml ADDED
@@ -0,0 +1,92 @@
1
+ - name: general_contraception_information # Must match the scenario name found in RAG graph
2
+ mode: retrieve_only # Literal[retrieve_llm, retrieve_only, llm_only, fixed_answer, sticky_answer]
3
+ min_pass_similarity_score: 0.55 # Custom value: if any answer is above, give three results
4
+ single_similarity_score: 0.86 # Custom value: if the best answer is above, give a single result
5
+ # min_similarity_score not used (stays -1.0) because it ditches all lower-score docs from results
6
+ - name: intrauterine_devices
7
+ mode: retrieve_only
8
+ min_pass_similarity_score: 0.55 # Sim Score = 2 * (1 - Distance) - 1
9
+ single_similarity_score: 0.86 # Sim Score = 2 * (1 - Distance) - 1
10
+ - name: contraceptive_injection
11
+ mode: retrieve_only
12
+ min_pass_similarity_score: 0.55
13
+ single_similarity_score: 0.86
14
+ - name: emergency_contraceptive_pills
15
+ mode: retrieve_only
16
+ min_pass_similarity_score: 0.55
17
+ single_similarity_score: 0.86
18
+ - name: contraceptive_implant
19
+ mode: retrieve_only
20
+ min_pass_similarity_score: 0.55
21
+ single_similarity_score: 0.86
22
+ - name: combined_contraceptive_pills
23
+ mode: retrieve_only
24
+ min_pass_similarity_score: 0.55
25
+ single_similarity_score: 0.86
26
+ - name: other_okay
27
+ mode: retrieve_only
28
+ min_pass_similarity_score: 0.55
29
+ single_similarity_score: 0.86
30
+ - name: own_side_effect
31
+ mode: fixed_answer
32
+ fixed_answer:
33
+ &abort_side_eff > # Anchors are added only for reference to old V1 template file
34
+ I'm not equipped to handle adverse events or other product-related queries. Your safety is
35
+ important to us, and we want to ensure you receive the appropriate support. Please report any
36
+ adverse events or concerns to our dedicated support team.
37
+ They can be reached at [email protected].
38
+ If you have any questions related to contraceptives or women's health, please feel free to ask,
39
+ and I'll provide you with the information you need.
40
+ keywords: [Mercilon, Marvelon, Implanon]
41
+ keyword_answer: &alternative_side_eff >
42
+ I'm not equipped to handle adverse events or other product-related queries. Your safety is
43
+ important to us, and we want to ensure you receive the appropriate support. Please report any
44
+ adverse events or concerns related to Organon products to our dedicated support team.
45
+ They can be reached at [email protected].
46
+ If you have any questions related to contraceptives or women's health, please feel free to ask,
47
+ and I'll provide you with the information you need.
48
+ - name: own_dosage
49
+ mode: fixed_answer
50
+ fixed_answer: &abort_dosage >
51
+ I'm not equipped to handle adverse events, dosage-related questions or other product-related
52
+ queries. Your safety is important to us, and we want to ensure you receive the appropriate
53
+ support. Please consult with the prescribing doctor about the details on how to use the
54
+ medication. For further information, please write a message to our dedicated support team.
55
+ They can be reached at [email protected].
56
+ If you have any questions related to contraceptives or women's health, please feel free to ask,
57
+ and I'll provide you with the information you need.
58
+ - name: brand_specific_information
59
+ mode: fixed_answer
60
+ fixed_answer: &brand_selection >
61
+ I appreciate your question about brand recommendations. For personalized advice related to
62
+ healthcare or specific products, it's always best to consult with a healthcare professional
63
+ who can consider your individual needs and provide tailored recommendations. They have the
64
+ expertise to guide you in the right direction.
65
+ If you have any questions related to contraceptives or women's health, please feel free to ask,
66
+ and I'll provide you with the information you need.
67
+ - name: greetings_hay
68
+ mode: fixed_answer
69
+ fixed_answer: &how_are_you_hi >
70
+ I am fine, thanks, and I hope you feel the same! Feel free to ask any contraception-related question.
71
+ - name: greetings_hi
72
+ mode: fixed_answer
73
+ fixed_answer: &say_hi >
74
+ Hi, nice to meet you! Feel free to ask any contraception-related question.
75
+ - name: emailthanks
76
+ mode: fixed_answer
77
+ fixed_answer: &email_thanks >
78
+ Thank you. Could I help with something else?
79
+ - name: thanks
80
+ mode: fixed_answer
81
+ fixed_answer: &thanks_answer >
82
+ Not at all. Could I help with something else?
83
+ - name: confirmation
84
+ mode: fixed_answer
85
+ fixed_answer: &confirmation_answer >
86
+ Thank you. Could I help with something else?
87
+ - name: malicious
88
+ mode: sticky_answer
89
+ fixed_answer: &malicious_message >
90
+ I am sorry, but I feel you are trying to use me in the wrong way.
91
+ If I am mistaken, please try to rephrase your question.
92
+ Refresh your browser if you'd like to ask more questions.
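The comments above convert vector-store distances to similarity scores as Sim Score = 2 * (1 - Distance) - 1 and compare the result to `min_pass_similarity_score` and `single_similarity_score`. A small worked sketch of that arithmetic; the thresholding function is a simplified reading of the comments, not the actual LynxScribe retrieval logic.

```python
def similarity_score(distance: float) -> float:
    # Sim Score = 2 * (1 - Distance) - 1, as noted in the comments above.
    return 2 * (1 - distance) - 1


def answer_mode(best_score: float) -> str:
    # Simplified reading of the scenario settings above, not the actual LynxScribe logic.
    if best_score >= 0.86:  # single_similarity_score
        return "single result"
    if best_score >= 0.55:  # min_pass_similarity_score
        return "top three results"
    return "no retrieved answer"


# A distance of 0.225 maps to the 0.55 "pass" threshold,
# and a distance of 0.07 maps to the 0.86 "single result" threshold.
assert abs(similarity_score(0.225) - 0.55) < 1e-9
assert abs(similarity_score(0.07) - 0.86) < 1e-9
assert answer_mode(similarity_score(0.05)) == "single result"
```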
examples/uploads/organon_demo/organon_en_copy.xlsx ADDED
Binary file (66.9 kB). View file
 
lynxkite-lynxscribe/pyproject.toml CHANGED
@@ -6,7 +6,7 @@ readme = "README.md"
6
  requires-python = ">=3.11"
7
  dependencies = [
8
  "lynxkite-core",
9
- "lynxscribe[openai] @ git+ssh://[email protected]/biggraph/lynxscribe@main",
10
  ]
11
 
12
  [tool.uv.sources]
 
6
  requires-python = ">=3.11"
7
  dependencies = [
8
  "lynxkite-core",
9
+ "lynxscribe[openai,faiss-cpu,litellm,google] @ git+ssh://[email protected]/biggraph/lynxscribe@main",
10
  ]
11
 
12
  [tool.uv.sources]
lynxkite-lynxscribe/src/lynxkite_lynxscribe/lynxscribe_ops.py CHANGED
@@ -1,12 +1,24 @@
1
  """
2
  LynxScribe configuration and testing in LynxKite.
 
3
  """
4
 
 
 
 
 
 
 
 
 
5
  import pathlib
6
  from lynxscribe.core.llm.base import get_llm_engine
7
  from lynxscribe.core.vector_store.base import get_vector_store
8
  from lynxscribe.common.config import load_config
9
  from lynxscribe.components.text.embedder import TextEmbedder
 
 
 
10
  from lynxscribe.components.rag.rag_graph import RAGGraph
11
  from lynxscribe.components.rag.knowledge_base_graph import PandasKnowledgeBaseGraph
12
  from lynxscribe.components.rag.rag_chatbot import Scenario, ScenarioSelector, RAGChatbot
@@ -17,94 +29,621 @@ from lynxscribe.components.chat.processors import (
17
  )
18
  from lynxscribe.components.chat.api import ChatAPI
19
  from lynxscribe.core.models.prompts import ChatCompletionPrompt
 
20
 
21
  from lynxkite.core import ops
22
  import json
23
  from lynxkite.core.executors import one_by_one
24
 
 
 
25
  ENV = "LynxScribe"
26
  one_by_one.register(ENV)
 
27
  op = ops.op_registration(ENV)
28
  output_on_top = ops.output_position(output="top")
29
 
30
 
31
- @output_on_top
32
- @op("Vector store")
33
- def vector_store(*, name="chromadb", collection_name="lynx"):
34
- vector_store = get_vector_store(name=name, collection_name=collection_name)
35
- return {"vector_store": vector_store}
36
 
37
 
38
- @output_on_top
39
- @op("LLM")
40
- def llm(*, name="openai"):
41
- llm = get_llm_engine(name=name)
42
- return {"llm": llm}
43
 
44
 
45
- @output_on_top
46
- @ops.input_position(llm="bottom")
47
- @op("Text embedder")
48
- def text_embedder(llm, *, model="text-embedding-ada-002"):
49
- llm = llm[0]["llm"]
50
- text_embedder = TextEmbedder(llm=llm, model=model)
51
- return {"text_embedder": text_embedder}
 
 
 
 
 
 
 
 
 
 
 
52
 
 
 
 
 
 
 
 
 
 
 
 
 
 
53
 
54
- @output_on_top
55
- @ops.input_position(vector_store="bottom", text_embedder="bottom")
56
- @op("RAG graph")
57
- def rag_graph(vector_store, text_embedder):
58
- vector_store = vector_store[0]["vector_store"]
59
- text_embedder = text_embedder[0]["text_embedder"]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
60
  rag_graph = RAGGraph(
61
  PandasKnowledgeBaseGraph(vector_store=vector_store, text_embedder=text_embedder)
62
  )
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  return {"rag_graph": rag_graph}
64
 
65
 
66
  @output_on_top
67
- @op("Scenario selector")
68
- def scenario_selector(*, scenario_file: str, node_types="intent_cluster"):
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
69
  scenarios = load_config(scenario_file)
70
  node_types = [t.strip() for t in node_types.split(",")]
71
- scenario_selector = ScenarioSelector(
72
- scenarios=[Scenario(**scenario) for scenario in scenarios],
73
- node_types=node_types,
74
- )
75
- return {"scenario_selector": scenario_selector}
76
 
 
 
77
 
78
- DEFAULT_NEGATIVE_ANSWER = "I'm sorry, but the data I've been trained on does not contain any information related to your question."
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
79
 
80
 
81
  @output_on_top
82
- @ops.input_position(rag_graph="bottom", scenario_selector="bottom", llm="bottom")
83
- @op("RAG chatbot")
84
- def rag_chatbot(
85
- rag_graph,
86
- scenario_selector,
87
- llm,
88
  *,
89
  negative_answer=DEFAULT_NEGATIVE_ANSWER,
90
- limits_by_type="{}",
91
- strict_limits=True,
92
- max_results=5,
 
 
 
 
 
93
  ):
94
- rag_graph = rag_graph[0]["rag_graph"]
95
- scenario_selector = scenario_selector[0]["scenario_selector"]
96
- llm = llm[0]["llm"]
97
- limits_by_type = json.loads(limits_by_type)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
98
  rag_chatbot = RAGChatbot(
99
  rag_graph=rag_graph,
100
  scenario_selector=scenario_selector,
101
  llm=llm,
102
  negative_answer=negative_answer,
103
- limits_by_type=limits_by_type,
104
- strict_limits=strict_limits,
105
- max_results=max_results,
 
 
 
 
 
106
  )
107
- return {"chatbot": rag_chatbot}
 
108
 
109
 
110
  @output_on_top
@@ -162,7 +701,12 @@ async def test_chat_api(message, chat_api, *, show_details=False):
162
  messages=[{"role": "user", "content": message["text"]}],
163
  )
164
  response = await chat_api.answer(request, stream=False)
165
- answer = response.choices[0].message.content
 
 
 
 
 
166
  if show_details:
167
  return {"answer": answer, **response.__dict__}
168
  else:
@@ -174,39 +718,6 @@ def input_chat(*, chat: str):
174
  return {"text": chat}
175
 
176
 
177
- @output_on_top
178
- @ops.input_position(chatbot="bottom", chat_processor="bottom", knowledge_base="bottom")
179
- @op("Chat API")
180
- def chat_api(chatbot, chat_processor, knowledge_base, *, model="gpt-4o-mini"):
181
- chatbot = chatbot[0]["chatbot"]
182
- chat_processor = chat_processor[0]["chat_processor"]
183
- knowledge_base = knowledge_base[0]
184
- c = ChatAPI(
185
- chatbot=chatbot,
186
- chat_processor=chat_processor,
187
- model=model,
188
- )
189
- if knowledge_base:
190
- c.chatbot.rag_graph.kg_base.load_v1_knowledge_base(**knowledge_base)
191
- c.chatbot.scenario_selector.check_compatibility(c.chatbot.rag_graph)
192
- return {"chat_api": c}
193
-
194
-
195
- @output_on_top
196
- @op("Knowledge base")
197
- def knowledge_base(
198
- *,
199
- nodes_path="nodes.pickle",
200
- edges_path="edges.pickle",
201
- template_cluster_path="tempclusters.pickle",
202
- ):
203
- return {
204
- "nodes_path": nodes_path,
205
- "edges_path": edges_path,
206
- "template_cluster_path": template_cluster_path,
207
- }
208
-
209
-
210
  @op("View", view="table_view")
211
  def view(input):
212
  columns = [str(c) for c in input.keys() if not str(c).startswith("_")]
@@ -230,7 +741,7 @@ async def get_chat_api(ws: str):
230
  assert path.exists(), f"Workspace {path} does not exist"
231
  ws = workspace.load(path)
232
  contexts = await ops.EXECUTORS[ENV](ws)
233
- nodes = [op for op in ws.nodes if op.data.title == "Chat API"]
234
  [node] = nodes
235
  context = contexts[node.id]
236
  return context.last_result["chat_api"]
@@ -299,3 +810,43 @@ def get_lynxscribe_workspaces():
299
  pass # Ignore files that are not valid workspaces.
300
  workspaces.sort()
301
  return workspaces
 
 
 
 
 
 
 
1
  """
2
  LynxScribe configuration and testing in LynxKite.
3
+ TODO: all these outputs should contain metadata. So the next task can check the input type, etc.
4
  """
5
 
6
+ from google.cloud import storage
7
+ from copy import deepcopy
8
+ from enum import Enum
9
+ import asyncio
10
+ import pandas as pd
11
+ import joblib
12
+ from pydantic import BaseModel, ConfigDict
13
+
14
  import pathlib
15
  from lynxscribe.core.llm.base import get_llm_engine
16
  from lynxscribe.core.vector_store.base import get_vector_store
17
  from lynxscribe.common.config import load_config
18
  from lynxscribe.components.text.embedder import TextEmbedder
19
+ from lynxscribe.core.models.embedding import Embedding
20
+ from lynxscribe.components.embedding_clustering import FclusterBasedClustering
21
+
22
  from lynxscribe.components.rag.rag_graph import RAGGraph
23
  from lynxscribe.components.rag.knowledge_base_graph import PandasKnowledgeBaseGraph
24
  from lynxscribe.components.rag.rag_chatbot import Scenario, ScenarioSelector, RAGChatbot
 
29
  )
30
  from lynxscribe.components.chat.api import ChatAPI
31
  from lynxscribe.core.models.prompts import ChatCompletionPrompt
32
+ from lynxscribe.components.rag.loaders import FAQTemplateLoader
33
 
34
  from lynxkite.core import ops
35
  import json
36
  from lynxkite.core.executors import one_by_one
37
 
38
+ DEFAULT_NEGATIVE_ANSWER = "I'm sorry, but the data I've been trained on does not contain any information related to your question."
39
+
40
  ENV = "LynxScribe"
41
  one_by_one.register(ENV)
42
+ mem = joblib.Memory("joblib-cache")
43
  op = ops.op_registration(ENV)
44
  output_on_top = ops.output_position(output="top")
45
 
46
 
47
+ # defining the cloud provider enum
48
+ class CloudProvider(Enum):
49
+ GCP = "gcp"
50
+ AWS = "aws"
51
+ AZURE = "azure"
52
 
53
 
54
+ class RAGVersion(Enum):
55
+ V1 = "v1"
56
+ V2 = "v2"
 
 
57
 
58
 
59
+ class RAGTemplate(BaseModel):
60
+ """
61
+ Model for RAG templates consisting of three tables: they are connected via scenario names.
62
+ One table (FAQs) contains scenario-denoted nodes to upsert into the knowledge base, the other
63
+ two tables serve as the configuration for the scenario selector.
64
+ Attributes:
65
+ faq_data:
66
+ Table where each row is an FAQ question, and possibly its answer pair. Will be fed into
67
+ `FAQTemplateLoader.load_nodes_and_edges()`. For configuration of this table see the
68
+ loader's init arguments.
69
+ scenario_data:
70
+ Table where each row is a Scenario, column names are thus scenario attributes. Will be
71
+ fed into `ScenarioSelector.from_data()`.
72
+ prompt_codes:
73
+ Optional helper for the scenario table, may contain prompt code mappings to real prompt
74
+ messages. It's enough then to use the codes instead of the full messages in the
75
+ scenarios table. Will be fed into `ScenarioSelector.from_data()`.
76
+ """
77
 
78
+ model_config = ConfigDict(arbitrary_types_allowed=True)
79
+
80
+ faq_data: pd.DataFrame
81
+ scenario_data: pd.DataFrame
82
+ prompt_codes: dict[str, str] = {}
83
+
84
+ @classmethod
85
+ def from_excel_path(
86
+ cls,
87
+ path: str,
88
+ faq_data_sheet_name: str,
89
+ scenario_data_sheet_name: str,
90
+ prompt_codes_sheet_name: str | None = None,
91
+ ) -> "RAGTemplate":
92
+ """Spawn a RAGTemplate from an Excel file containing the two needed (plus one optional) sheets."""
93
+
94
+ def transform_codes(prompt_codes: pd.DataFrame) -> dict[str, str]:
95
+ """Check and transform prompt codes table into a code dictionary."""
96
+ if (len_columns := len(prompt_codes.columns)) != 2:
97
+ raise ValueError(
98
+ f"Prompt codes should contain exactly 2 columns, {len_columns} found."
99
+ )
100
+ return prompt_codes.set_index(prompt_codes.columns[0])[
101
+ prompt_codes.columns[1]
102
+ ].to_dict()
103
+
104
+ return cls(
105
+ faq_data=pd.read_excel(path, sheet_name=faq_data_sheet_name),
106
+ scenario_data=pd.read_excel(path, sheet_name=scenario_data_sheet_name),
107
+ prompt_codes=transform_codes(pd.read_excel(path, sheet_name=prompt_codes_sheet_name))
108
+ if prompt_codes_sheet_name
109
+ else {},
110
+ )
111
+
112
+
113
+ @op("Cloud-sourced File Listing")
114
+ def cloud_file_loader(
115
+ *,
116
+ cloud_provider: CloudProvider = CloudProvider.GCP,
117
+ folder_URL: str = "https://storage.googleapis.com/lynxkite_public_data/lynxscribe-images/image-rag-test",
118
+ accepted_file_types: str = ".jpg, .jpeg, .png",
119
+ ):
120
+ """
121
+ Returns the list of URLs of all images in a cloud-based folder.
122
+ Currently only supports GCP storage.
123
+ """
124
+ if folder_URL.endswith("/"):
125
+ folder_URL = folder_URL[:-1]
126
+
127
+ accepted_file_types = tuple([t.strip() for t in accepted_file_types.split(",")])
128
+
129
+ if cloud_provider == CloudProvider.GCP:
130
+ client = storage.Client()
131
+ url_useful_part = folder_URL.split(".com/")[-1]
132
+ bucket_name = url_useful_part.split("/")[0]
133
+ if bucket_name == url_useful_part:
134
+ prefix = ""
135
+ else:
136
+ prefix = url_useful_part.split(bucket_name + "/")[-1]
137
+
138
+ bucket = client.bucket(bucket_name)
139
+ blobs = bucket.list_blobs(prefix=prefix)
140
+ file_urls = [blob.public_url for blob in blobs if blob.name.endswith(accepted_file_types)]
141
+ return {"file_urls": file_urls}
142
+ else:
143
+ raise ValueError(f"Cloud provider '{cloud_provider}' is not supported.")
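For the default `folder_URL`, the string handling above reduces the public URL to a bucket name and a prefix before listing blobs. The same steps in isolation, so they can be checked without a GCP client or credentials:

```python
# Same string handling as in cloud_file_loader above, applied to its default URL.
folder_URL = "https://storage.googleapis.com/lynxkite_public_data/lynxscribe-images/image-rag-test"

url_useful_part = folder_URL.split(".com/")[-1]
bucket_name = url_useful_part.split("/")[0]
prefix = url_useful_part.split(bucket_name + "/")[-1]

assert bucket_name == "lynxkite_public_data"
assert prefix == "lynxscribe-images/image-rag-test"
```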
144
+
145
+
146
+ # @output_on_top
147
+ # @op("LynxScribe RAG Graph Vector Store")
148
+ # @mem.cache
149
+ # def ls_rag_graph(
150
+ # *,
151
+ # name: str = "faiss",
152
+ # num_dimensions: int = 3072,
153
+ # collection_name: str = "lynx",
154
+ # text_embedder_interface: str = "openai",
155
+ # text_embedder_model_name_or_path: str = "text-embedding-3-large",
156
+ # # api_key_name: str = "OPENAI_API_KEY",
157
+ # ):
158
+ # """
159
+ # Returns with a vector store instance.
160
+ # """
161
+
162
+ # # getting the text embedder instance
163
+ # llm_params = {"name": text_embedder_interface}
164
+ # # if api_key_name:
165
+ # # llm_params["api_key"] = os.getenv(api_key_name)
166
+ # llm = get_llm_engine(**llm_params)
167
+ # text_embedder = TextEmbedder(llm=llm, model=text_embedder_model_name_or_path)
168
+
169
+ # # getting the vector store
170
+ # if name == "chromadb":
171
+ # vector_store = get_vector_store(name=name, collection_name=collection_name)
172
+ # elif name == "faiss":
173
+ # vector_store = get_vector_store(name=name, num_dimensions=num_dimensions)
174
+ # else:
175
+ # raise ValueError(f"Vector store name '{name}' is not supported.")
176
+
177
+ # # building up the RAG graph
178
+ # rag_graph = RAGGraph(
179
+ # PandasKnowledgeBaseGraph(vector_store=vector_store, text_embedder=text_embedder)
180
+ # )
181
+
182
+ # return {"rag_graph": rag_graph}
183
+
184
+
185
+ @op("LynxScribe Image Describer")
186
+ @mem.cache
187
+ async def ls_image_describer(
188
+ file_urls,
189
+ *,
190
+ llm_interface: str = "openai",
191
+ llm_visual_model: str = "gpt-4o",
192
+ llm_prompt_path: str = "uploads/image_description_prompts.yaml",
193
+ llm_prompt_name: str = "cot_picture_descriptor",
194
+ # api_key_name: str = "OPENAI_API_KEY",
195
+ ):
196
+ """
197
+ Returns with image descriptions from a list of image URLs.
198
 
199
+ TODO: making the inputs more flexible (e.g. accepting file locations, URLs, binaries, etc.).
200
+ the input dictionary should contain some meta info: e.g., what is in the list...
201
+ """
202
+
203
+ # handling inputs
204
+ image_urls = file_urls["file_urls"]
205
+
206
+ # loading the LLM
207
+ llm_params = {"name": llm_interface}
208
+ # if api_key_name:
209
+ # llm_params["api_key"] = os.getenv(api_key_name)
210
+ llm = get_llm_engine(**llm_params)
211
+
212
+ # preparing the prompts
213
+ prompt_base = load_config(llm_prompt_path)[llm_prompt_name]
214
+ prompt_list = []
215
+
216
+ for i in range(len(image_urls)):
217
+ image = image_urls[i]
218
+
219
+ _prompt = deepcopy(prompt_base)
220
+ for message in _prompt:
221
+ if isinstance(message["content"], list):
222
+ for _message_part in message["content"]:
223
+ if "image_url" in _message_part:
224
+ _message_part["image_url"] = {"url": image}
225
+
226
+ prompt_list.append(_prompt)
227
+
228
+ # creating the prompt objects
229
+ ch_prompt_list = [
230
+ ChatCompletionPrompt(model=llm_visual_model, messages=prompt) for prompt in prompt_list
231
+ ]
232
+
233
+ # get the image descriptions
234
+ tasks = [llm.acreate_completion(completion_prompt=_prompt) for _prompt in ch_prompt_list]
235
+ out_completions = await asyncio.gather(*tasks)
236
+ results = [
237
+ dictionary_corrector(result.choices[0].message.content) for result in out_completions
238
+ ]
239
+
240
+ # getting the image descriptions (list of dictionaries {image_url: URL, description: description})
241
+ # TODO: some result class could be a better idea (will be developed in LynxScribe)
242
+ image_descriptions = [
243
+ {"image_url": image_urls[i], "description": results[i]} for i in range(len(image_urls))
244
+ ]
245
+
246
+ return {"image_descriptions": image_descriptions}
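The value returned above pairs each image URL with the dictionary parsed from the CoT prompt added earlier in this diff. A sketch of the assumed shape; the URL and description values are illustrative, not real model output.

```python
# Assumed shape of the "image_descriptions" output; values are illustrative only.
image_descriptions = [
    {
        "image_url": "https://storage.googleapis.com/lynxkite_public_data/lynxscribe-images/image-rag-test/cow.jpg",  # hypothetical
        "description": {
            "image type": "picture",
            "overall description": "A cow chained to a tree in a grassy field.",
            "details": {
                "background": "Open field with mountains in the distance.",
                "main scene": "A cow standing next to a tree.",
            },
        },
    }
]
```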
247
+
248
+
249
+ @op("LynxScribe Image RAG Builder")
250
+ @mem.cache
251
+ async def ls_image_rag_builder(
252
+ image_descriptions,
253
+ *,
254
+ vdb_provider_name: str = "faiss",
255
+ vdb_num_dimensions: int = 3072,
256
+ vdb_collection_name: str = "lynx",
257
+ text_embedder_interface: str = "openai",
258
+ text_embedder_model_name_or_path: str = "text-embedding-3-large",
259
+ # api_key_name: str = "OPENAI_API_KEY",
260
+ ):
261
+ """
262
+ Based on image descriptions, and embedding/VDB parameters,
263
+ the function builds up an image RAG graph, where the nodes are the
264
+ descriptions of the images (and of all image objects).
265
+
266
+ In a later phase, synthetic questions and "named entities" will also
267
+ be added to the graph.
268
+ """
269
+
270
+ # handling inputs
271
+ image_descriptions = image_descriptions["image_descriptions"]
272
+
273
+ # Building up the empty RAG graph
274
+
275
+ # a) Define LLM interface and get a text embedder
276
+ llm_params = {"name": text_embedder_interface}
277
+ # if api_key_name:
278
+ # llm_params["api_key"] = os.getenv(api_key_name)
279
+ llm = get_llm_engine(**llm_params)
280
+ text_embedder = TextEmbedder(llm=llm, model=text_embedder_model_name_or_path)
281
+
282
+ # b) getting the vector store
283
+ # TODO: vdb_provider_name should be ENUM, and other parameters should appear accordingly
284
+ if vdb_provider_name == "chromadb":
285
+ vector_store = get_vector_store(name=vdb_provider_name, collection_name=vdb_collection_name)
286
+ elif vdb_provider_name == "faiss":
287
+ vector_store = get_vector_store(name=vdb_provider_name, num_dimensions=vdb_num_dimensions)
288
+ else:
289
+ raise ValueError(f"Vector store name '{vdb_provider_name}' is not supported.")
290
+
291
+ # c) building up the RAG graph
292
  rag_graph = RAGGraph(
293
  PandasKnowledgeBaseGraph(vector_store=vector_store, text_embedder=text_embedder)
294
  )
295
+
296
+ dict_list_df = []
297
+ for image_description_tuple in image_descriptions:
298
+ image_url = image_description_tuple["image_url"]
299
+ image_description = image_description_tuple["description"]
300
+
301
+ if "overall description" in image_description:
302
+ dict_list_df.append(
303
+ {
304
+ "image_url": image_url,
305
+ "description": image_description["overall description"],
306
+ "source": "overall description",
307
+ }
308
+ )
309
+
310
+ if "details" in image_description:
311
+ for dkey in image_description["details"].keys():
312
+ text = f"The picture's description is: {image_description['overall description']}\n\nThe description of the {dkey} is: {image_description['details'][dkey]}"
313
+ dict_list_df.append(
314
+ {"image_url": image_url, "description": text, "source": "details"}
315
+ )
316
+
317
+ pdf_descriptions = pd.DataFrame(dict_list_df)
318
+ pdf_descriptions["embedding_values"] = await text_embedder.acreate_embedding(
319
+ pdf_descriptions["description"].to_list()
320
+ )
321
+ pdf_descriptions["id"] = "im_" + pdf_descriptions.index.astype(str)
322
+
323
+ # adding the embeddings to the RAG graph with metadata
324
+ pdf_descriptions["embedding"] = pdf_descriptions.apply(
325
+ lambda row: Embedding(
326
+ id=row["id"],
327
+ value=row["embedding_values"],
328
+ metadata={
329
+ "image_url": row["image_url"],
330
+ "image_part": row["source"],
331
+ "type": "image_description",
332
+ },
333
+ document=row["description"],
334
+ ),
335
+ axis=1,
336
+ )
337
+ embedding_list = pdf_descriptions["embedding"].tolist()
338
+
339
+ # adding the embeddings to the RAG graph
340
+ rag_graph.kg_base.vector_store.upsert(embedding_list)
341
+
342
+ # # saving the RAG graph
343
+ # rag_graph.kg_base.save(image_rag_out_path)
344
+
345
+ return {"rag_graph": rag_graph}
346
+
347
+
348
+ @op("LynxScribe RAG Graph Saver")
349
+ def ls_save_rag_graph(
350
+ rag_graph,
351
+ *,
352
+ image_rag_out_path: str = "image_test_rag_graph.pickle",
353
+ ):
354
+ """
355
+ Saves the RAG graph to a pickle file.
356
+ """
357
+
358
+ # reading inputs
359
+ rag_graph = rag_graph[0]["rag_graph"]
360
+
361
+ rag_graph.kg_base.save(image_rag_out_path)
362
+ return None
363
+
364
+
365
+ @ops.input_position(rag_graph="bottom")
366
+ @op("LynxScribe Image RAG Query")
367
+ async def search_context(rag_graph, text, *, top_k=3):
368
+ message = text["text"]
369
+ rag_graph = rag_graph[0]["rag_graph"]
370
+
371
+ # get all similarities
372
+ emb_similarities = await rag_graph.search_context(
373
+ message, max_results=top_k, unique_metadata_key="image_url"
374
+ )
375
+
376
+ # get the image urls, scores and descriptions
377
+ result_list = []
378
+
379
+ for emb_sim in emb_similarities:
380
+ image_url = emb_sim.embedding.metadata["image_url"]
381
+ score = emb_sim.score
382
+ description = emb_sim.embedding.document
383
+ result_list.append({"image_url": image_url, "score": score, "description": description})
384
+
385
+ return {"embedding_similarities": result_list}
386
+
387
+
388
+ @op("LynxScribe Image Result Viewer", view="image")
389
+ def view_image(embedding_similarities):
390
+ """
391
+ Plotting the TOP images (from embedding similarities).
392
+
393
+ TODO: later on, the user can scroll the images and send feedbacks
394
+ """
395
+ embedding_similarities = embedding_similarities["embedding_similarities"]
396
+ return embedding_similarities[0]["image_url"]
397
+
398
+
399
+ @op("LynxScribe Text RAG Loader")
400
+ @mem.cache
401
+ def ls_text_rag_loader(
402
+ file_urls,
403
+ *,
404
+ input_type: RAGVersion = RAGVersion.V1,
405
+ vdb_provider_name: str = "faiss",
406
+ vdb_num_dimensions: int = 3072,
407
+ vdb_collection_name: str = "lynx",
408
+ text_embedder_interface: str = "openai",
409
+ text_embedder_model_name_or_path: str = "text-embedding-3-large",
410
+ # api_key_name: str = "OPENAI_API_KEY",
411
+ ):
412
+ """
413
+ Loading a text-based RAG graph from saved files (getting pandas readable links).
414
+ """
415
+
416
+ # handling inputs
417
+ file_urls = file_urls["file_urls"]
418
+
419
+ # getting the text embedder instance
420
+ llm_params = {"name": text_embedder_interface}
421
+ # if api_key_name:
422
+ # llm_params["api_key"] = os.getenv(api_key_name)
423
+ llm = get_llm_engine(**llm_params)
424
+ text_embedder = TextEmbedder(llm=llm, model=text_embedder_model_name_or_path)
425
+
426
+ # getting the vector store
427
+ if vdb_provider_name == "chromadb":
428
+ vector_store = get_vector_store(name=vdb_provider_name, collection_name=vdb_collection_name)
429
+ elif vdb_provider_name == "faiss":
430
+ vector_store = get_vector_store(name=vdb_provider_name, num_dimensions=vdb_num_dimensions)
431
+ else:
432
+ raise ValueError(f"Vector store name '{vdb_provider_name}' is not supported.")
433
+
434
+ # building up the RAG graph
435
+ rag_graph = RAGGraph(
436
+ PandasKnowledgeBaseGraph(vector_store=vector_store, text_embedder=text_embedder)
437
+ )
438
+
439
+ # loading the knowledge base (temporary + TODO: adding v2)
440
+ if input_type == RAGVersion.V1:
441
+ node_file = [f for f in file_urls if "nodes.p" in f][0]
442
+ edge_file = [f for f in file_urls if "edges.p" in f][0]
443
+ tempcluster_file = [f for f in file_urls if "clusters.p" in f][0]
444
+ rag_graph.kg_base.load_v1_knowledge_base(
445
+ nodes_path=node_file,
446
+ edges_path=edge_file,
447
+ template_cluster_path=tempcluster_file,
448
+ )
449
+ elif input_type == RAGVersion.V2:
450
+ raise ValueError("Currently only v1 input type is supported.")
451
+ else:
452
+ raise ValueError(f"Input type '{input_type}' is not supported.")
453
+
454
+ return {"rag_graph": rag_graph}
455
+
456
+
457
+ @op("LynxScribe FAQ to RAG")
458
+ @mem.cache
459
+ async def ls_faq_to_rag(
460
+ *,
461
+ faq_excel_path: str = "",
462
+ vdb_provider_name: str = "faiss",
463
+ vdb_num_dimensions: int = 3072,
464
+ vdb_collection_name: str = "lynx",
465
+ text_embedder_interface: str = "openai",
466
+ text_embedder_model_name_or_path: str = "text-embedding-3-large",
467
+ scenario_cluster_distance_pct: int = 30,
468
+ ):
469
+ """
470
+ Loading a text-based RAG graph from saved files (getting pandas readable links).
471
+ """
472
+
473
+ # getting the text embedder instance
474
+ llm_params = {"name": text_embedder_interface}
475
+ llm = get_llm_engine(**llm_params)
476
+ text_embedder = TextEmbedder(llm=llm, model=text_embedder_model_name_or_path)
477
+
478
+ # getting the vector store
479
+ if vdb_provider_name == "chromadb":
480
+ vector_store = get_vector_store(name=vdb_provider_name, collection_name=vdb_collection_name)
481
+ elif vdb_provider_name == "faiss":
482
+ vector_store = get_vector_store(name=vdb_provider_name, num_dimensions=vdb_num_dimensions)
483
+ else:
484
+ raise ValueError(f"Vector store name '{vdb_provider_name}' is not supported.")
485
+
486
+ # building up the RAG graph
487
+ rag_graph = RAGGraph(
488
+ PandasKnowledgeBaseGraph(vector_store=vector_store, text_embedder=text_embedder)
489
+ )
490
+
491
+ # loading the knowledge base from the FAQ file
492
+ rag_template = RAGTemplate.from_excel_path(
493
+ path=faq_excel_path,
494
+ faq_data_sheet_name="scenario_examples",
495
+ scenario_data_sheet_name="scenario_scripts",
496
+ prompt_codes_sheet_name="prompt_dictionary",
497
+ )
498
+
499
+ faq_loader_params = {
500
+ "id_column": "scenario_example_ID",
501
+ "timestamp_column": "last_modified_timestamp",
502
+ "validity_column": "valid_flg",
503
+ "question_type_contents_id": ["faq_question", "faq_question", "q_{id}"],
504
+ "answer_type_contents_id": ["faq_answer", "{faq_question}\n\n{faq_answer}", "a_{id}"],
505
+ "question_to_answer_edge_type_weight": ["qna", 1.0],
506
+ }
507
+
508
+ nodes, edges = FAQTemplateLoader(**faq_loader_params).load_nodes_and_edges(
509
+ rag_template.faq_data
510
+ )
511
+
512
+ await rag_graph.kg_base.upsert_nodes(*nodes)
513
+ rag_graph.kg_base.upsert_edges(edges)
514
+
515
+ # Generating scenario clusters
516
+ question_ids = [_id for _id in nodes[0] if _id.startswith("q_")]
517
+ stored_embeddings = rag_graph.kg_base.vector_store.get(
518
+ question_ids, include=["embeddings", "metadatas"]
519
+ )
520
+ embedding_vals = pd.Series([_emb.value for _emb in stored_embeddings], index=question_ids)
521
+ labels = pd.Series(
522
+ [_emb.metadata["scenario_name"] for _emb in stored_embeddings], index=question_ids
523
+ )
524
+ temp_cls = FclusterBasedClustering(distance_percentile=scenario_cluster_distance_pct)
525
+ temp_cls.fit(embedding_vals, labels)
526
+ df_tempclusters = temp_cls.get_cluster_centers()
527
+
528
+ # Adding the scenario clusters to the RAG Graph
529
+ df_tempclusters["template_id"] = "t_" + df_tempclusters.index.astype(str)
530
+ df_tempclusters["embedding"] = df_tempclusters.apply(
531
+ lambda row: Embedding(
532
+ id=row["template_id"],
533
+ value=row["cluster_center"],
534
+ metadata={"scenario_name": row["control_label"], "type": "intent_cluster"},
535
+ ),
536
+ axis=1,
537
+ )
538
+ embedding_list = df_tempclusters["embedding"].tolist()
539
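+ # The cluster centers are stored as "intent_cluster" embeddings so the scenario selector can match against them.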
+ rag_graph.kg_base.vector_store.upsert(embedding_list)
540
+
541
  return {"rag_graph": rag_graph}
542
 
543
 
544
  @output_on_top
545
+ @op("LynxScribe RAG Graph Chatbot Builder")
546
+ def ls_rag_chatbot_builder(
547
+ rag_graph,
548
+ *,
549
+ scenario_file: str = "uploads/lynx_chatbot_scenario_selector.yaml",
550
+ node_types: str = "intent_cluster",
551
+ scenario_meta_name: str = "",
552
+ ):
553
+ """
554
+ Builds a RAG Graph-based chatbot knowledge base: the loaded RAG graph combined
555
+ with a scenario selector.
556
+
557
+ TODO: Later, the scenario selector could be built synthetically (or
558
+ semi-automatically) from the input documents, not just from the scenario
559
+ YAML file.
560
+ """
561
+
562
  scenarios = load_config(scenario_file)
563
  node_types = [t.strip() for t in node_types.split(",")]
564
 
565
+ # handling inputs
566
+ rag_graph = rag_graph["rag_graph"]
567
 
568
+ parameters = {
569
+ "scenarios": [Scenario(**scenario) for scenario in scenarios],
570
+ "node_types": node_types,
571
+ }
572
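+ # If a metadata field name is given, scenario names are read from that field of each node.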
+ if len(scenario_meta_name) > 0:
573
+ parameters["get_scenario_name"] = lambda node: node.metadata[scenario_meta_name]
574
+
575
+ # building the scenario selector from the loaded scenarios
576
+ scenario_selector = ScenarioSelector(**parameters)
577
+
578
+ # TODO: later we should unify this "knowledge base" object across the functions;
580
+ # it could always be an input of a RAG chatbot, but also of other apps.
580
+ return {
581
+ "knowledge_base": {
582
+ "rag_graph": rag_graph,
583
+ "scenario_selector": scenario_selector,
584
+ }
585
+ }
586
 
587
 
588
  @output_on_top
589
+ @ops.input_position(knowledge_base="bottom", chat_processor="bottom")
590
+ @op("LynxScribe RAG Graph Chatbot Backend")
591
+ def ls_rag_chatbot_backend(
592
+ knowledge_base,
593
+ chat_processor,
 
594
  *,
595
  negative_answer=DEFAULT_NEGATIVE_ANSWER,
596
+ retriever_limits_by_type="{}",
597
+ retriever_strict_limits=True,
598
+ retriever_overall_chunk_limit=20,
599
+ retriever_overall_token_limit=3000,
600
+ retriever_max_iterations=3,
601
+ llm_interface: str = "openai",
602
+ llm_model_name: str = "gpt-4o",
603
+ # api_key_name: str = "OPENAI_API_KEY",
604
  ):
605
+ """
606
+ Returns a chatbot back-end (a ChatAPI instance wrapping the RAG chatbot).
607
+ """
608
+
609
+ # handling inputs
610
+ rag_graph = knowledge_base[0]["knowledge_base"]["rag_graph"]
611
+ scenario_selector = knowledge_base[0]["knowledge_base"]["scenario_selector"]
612
+ chat_processor = chat_processor[0]["chat_processor"]
613
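+ # retriever_limits_by_type arrives as a JSON string mapping node types to chunk limits, e.g. '{"faq_answer": 5}' (illustrative value only).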
+ limits_by_type = json.loads(retriever_limits_by_type)
614
+
615
+ # connecting to the LLM
616
+ llm_params = {"name": llm_interface}
617
+ # if api_key_name:
618
+ # llm_params["api_key"] = os.getenv(api_key_name)
619
+ llm = get_llm_engine(**llm_params)
620
+
621
+ # setting the parameters
622
+ params = {
623
+ "limits_by_type": limits_by_type,
624
+ "strict_limits": retriever_strict_limits,
625
+ "max_results": retriever_overall_chunk_limit,
626
+ "token_limit": retriever_overall_token_limit,
627
+ "max_iterations": retriever_max_iterations,
628
+ }
629
+
630
+ # generating the RAG Chatbot
631
  rag_chatbot = RAGChatbot(
632
  rag_graph=rag_graph,
633
  scenario_selector=scenario_selector,
634
  llm=llm,
635
  negative_answer=negative_answer,
636
+ **params,
637
+ )
638
+
639
+ # generating the chatbot back-end
640
+ c = ChatAPI(
641
+ chatbot=rag_chatbot,
642
+ chat_processor=chat_processor,
643
+ model=llm_model_name,
644
  )
645
+
646
+ return {"chat_api": c}
647
 
648
 
649
  @output_on_top
 
701
  messages=[{"role": "user", "content": message["text"]}],
702
  )
703
  response = await chat_api.answer(request, stream=False)
704
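+ # If the chatbot returned no answer, fall back to listing the retrieved FAQ sources instead.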
+ if len(response.choices) == 0:
705
+ answer = "The following FAQ items are similar to the question:\n"
706
+ for item in response.sources:
707
+ answer += f"------------------------------------------------------ \n{item.body}\n\n"
708
+ else:
709
+ answer = response.choices[0].message.content
710
  if show_details:
711
  return {"answer": answer, **response.__dict__}
712
  else:
 
718
  return {"text": chat}
719
 
720
 
721
  @op("View", view="table_view")
722
  def view(input):
723
  columns = [str(c) for c in input.keys() if not str(c).startswith("_")]
 
741
  assert path.exists(), f"Workspace {path} does not exist"
742
  ws = workspace.load(path)
743
  contexts = await ops.EXECUTORS[ENV](ws)
744
+ nodes = [op for op in ws.nodes if op.data.title == "LynxScribe RAG Graph Chatbot Backend"]
745
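+ # Exactly one backend node is expected in the workspace; its last result holds the chat API.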
  [node] = nodes
746
  context = contexts[node.id]
747
  return context.last_result["chat_api"]
 
810
  pass # Ignore files that are not valid workspaces.
811
  workspaces.sort()
812
  return workspaces
813
+
814
+
815
+ def dictionary_corrector(dict_string: str, expected_keys: list | None = None) -> dict:
816
+ """
817
+ Processes LLM outputs where the LLM returns a dictionary as a string. It optionally
818
+ cross-checks the parsed dictionary against the expected keys and returns a dictionary with the
819
+ expected keys and their values ('unknown' for keys that are missing). If parsing fails, it returns
820
+ a dictionary with every expected key set to 'error' (or an empty dictionary if no expected keys were given).
821
+
822
+ When no expected keys are given, the parsed dictionary is returned as-is, including any extra key-value pairs.
823
+ """
824
+
825
+ out_dict = {}
826
+
827
+ if len(dict_string) == 0:
828
+ return out_dict
829
+
830
+ # strip any text before the first "{" and after the last "}"
831
+ dstring_prc = dict_string
832
+ if dstring_prc[0] != "{":
833
+ dstring_prc = "{" + "{".join(dstring_prc.split("{")[1:])
834
+ if dstring_prc[-1] != "}":
835
+ dstring_prc = "}".join(dstring_prc.split("}")[:-1]) + "}"
836
+
837
+ try:
838
+ trf_dict = json.loads(dstring_prc)
839
+ if expected_keys:
840
+ for _key in expected_keys:
841
+ if _key in trf_dict:
842
+ out_dict[_key] = trf_dict[_key]
843
+ else:
844
+ out_dict[_key] = "unknown"
845
+ else:
846
+ out_dict = trf_dict
847
+ except Exception:
848
+ if expected_keys:
849
+ for _key in expected_keys:
850
+ out_dict[_key] = "error"
851
+
852
+ return out_dict
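+
+ # Illustrative example (not part of the workspace):
+ # dictionary_corrector('Sure! {"lang": "en", "tone": "formal"}', ["lang", "intent"])
+ # -> {"lang": "en", "intent": "unknown"} (surrounding text stripped; missing expected keys default to "unknown")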