AI-RESEARCHER-2024 committed on
Commit
adac3f1
·
verified ·
1 Parent(s): 975d8aa

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -9
app.py CHANGED
@@ -25,6 +25,7 @@ class RAGInterface:
25
  self.llm = Llama.from_pretrained(
26
  repo_id="bartowski/Llama-3.2-1B-Instruct-GGUF",
27
  filename="Llama-3.2-1B-Instruct-Q8_0.gguf",
 
28
  )
29
 
30
  # Define RAG prompt template
@@ -42,7 +43,7 @@ class RAGInterface:
42
  """
43
  self.prompt = PromptTemplate.from_template(self.template)
44
 
45
- def respond(self, message, history, system_message, max_tokens, temperature):
46
  # Build messages list
47
  messages = [{"role": "system", "content": system_message}]
48
  for user_msg, assistant_msg in history:
@@ -160,14 +161,14 @@ class RAGInterface:
160
  label="System Message",
161
  elem_classes="control-panel"
162
  ),
163
- gr.Slider(
164
- minimum=1,
165
- maximum=2048,
166
- value=512,
167
- step=1,
168
- label="Max New Tokens",
169
- elem_classes="control-panel"
170
- ),
171
  gr.Slider(
172
  minimum=0.1,
173
  maximum=1.0,
 
25
  self.llm = Llama.from_pretrained(
26
  repo_id="bartowski/Llama-3.2-1B-Instruct-GGUF",
27
  filename="Llama-3.2-1B-Instruct-Q8_0.gguf",
28
+ n_ctx=2048
29
  )
30
 
31
  # Define RAG prompt template
 
43
  """
44
  self.prompt = PromptTemplate.from_template(self.template)
45
 
46
+ def respond(self, message, history, system_message, temperature,max_tokens=2048):
47
  # Build messages list
48
  messages = [{"role": "system", "content": system_message}]
49
  for user_msg, assistant_msg in history:
 
161
  label="System Message",
162
  elem_classes="control-panel"
163
  ),
164
+ # gr.Slider(
165
+ # minimum=1,
166
+ # maximum=2048,
167
+ # value=512,
168
+ # step=1,
169
+ # label="Max New Tokens",
170
+ # elem_classes="control-panel"
171
+ # ),
172
  gr.Slider(
173
  minimum=0.1,
174
  maximum=1.0,