Update app.py
Browse files
app.py
CHANGED
@@ -75,7 +75,7 @@ def retrieved_info(query, rag_model = rag_model, generating_model = model):
|
|
75 |
# Generating answer using gemma model
|
76 |
tokenizer = AutoTokenizer.from_pretrained("HuggingFaceH4/zephyr-7b-beta")
|
77 |
input_ids = tokenizer(generation_model_input, return_tensors='pt').to(device)
|
78 |
-
output = generating_model.generate(input_ids, max_new_tokens =
|
79 |
|
80 |
return tokenizer.decode(output[0])
|
81 |
|
@@ -116,7 +116,7 @@ demo = gr.ChatInterface(
|
|
116 |
type = 'messages',
|
117 |
additional_inputs=[
|
118 |
gr.Textbox(value="You are a helpful and friendly assistant.", label="System message"),
|
119 |
-
gr.Slider(minimum=1, maximum=2048, value=
|
120 |
gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
|
121 |
gr.Slider(
|
122 |
minimum=0.1,
|
|
|
75 |
# Generating answer using gemma model
|
76 |
tokenizer = AutoTokenizer.from_pretrained("HuggingFaceH4/zephyr-7b-beta")
|
77 |
input_ids = tokenizer(generation_model_input, return_tensors='pt').to(device)
|
78 |
+
output = generating_model.generate(input_ids, max_new_tokens = 256)
|
79 |
|
80 |
return tokenizer.decode(output[0])
|
81 |
|
|
|
116 |
type = 'messages',
|
117 |
additional_inputs=[
|
118 |
gr.Textbox(value="You are a helpful and friendly assistant.", label="System message"),
|
119 |
+
gr.Slider(minimum=1, maximum=2048, value=256, step=1, label="Max new tokens"),
|
120 |
gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
|
121 |
gr.Slider(
|
122 |
minimum=0.1,
|