from langchain_ollama import OllamaLLM
from langchain_huggingface import HuggingFaceEmbeddings
import streamlit as st

@st.cache_resource
def initialize_llm(model_name, temperature, top_p, max_tokens):
    # Configure the LLM with the requested sampling parameters
    llm = OllamaLLM(
        model=model_name,
        base_url="https://deepak7376-ollama-server.hf.space",
        temperature=temperature,  # Controls randomness (0 = deterministic, 1 = max randomness)
        num_predict=max_tokens,   # Ollama's name for the output-token cap; OllamaLLM has no max_tokens field
        top_p=top_p,              # Nucleus sampling for controlling diversity
    )
    return llm

@st.cache_resource
def initialize_embeddings():
    # Load a lightweight sentence-transformers model for text embeddings
    embeddings = HuggingFaceEmbeddings(model_name="all-MiniLM-L6-v2")
    return embeddings
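
# --- Usage sketch (an assumption, not part of the original file): one plausible
# way to wire these cached helpers into the Streamlit page. The widget labels,
# default values, and the "deepseek-r1" default model are illustrative guesses.
model_name = st.sidebar.text_input("Model", value="deepseek-r1")
temperature = st.sidebar.slider("Temperature", 0.0, 1.0, 0.7)
top_p = st.sidebar.slider("Top-p", 0.0, 1.0, 0.9)
max_tokens = st.sidebar.number_input("Max tokens", min_value=16, value=512)

llm = initialize_llm(model_name, temperature, top_p, max_tokens)
embeddings = initialize_embeddings()

prompt = st.text_input("Ask the model something")
if prompt:
    # OllamaLLM.invoke takes a string prompt and returns the generated text
    st.write(llm.invoke(prompt))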