Spaces:

dar-tau
/

run_inference

Sleeping

dar-tau committed on Jun 8, 2024

Commit

b80761a

verified ·

1 Parent(s): 4333b51

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,12 +4,14 @@ import spaces
 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
-model_name = "teknium/OpenHermes-2.5-Mistral-7B"
 token = os.environ['hf_token']
 pipe = pipeline("text-generation", model=model_name, device="cuda")
 system_prompt = '''You are given an input text for a chat interface. Propose auto-completion to the text. You have several roles:
 - Fight under-specification: if the user does not provide sufficient context, propose them a set of relevant suggestions.
 - Complete text: The text provided to you is in the making. If you have a good idea for how to complete - make suggestions.
@@ -24,7 +26,7 @@ def generate(text):
         {'role': 'system', 'content': system_prompt},
         {'role': 'user', 'content': text}
     ]
-    return pipe(messages)
 if __name__ == "__main__":

 from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
+model_name = "TheBloke/OpenHermes-2.5-Mistral-7B-GGUF"
 token = os.environ['hf_token']
 pipe = pipeline("text-generation", model=model_name, device="cuda")
+generate_kwargs = {'max_new_tokens': 20}
 system_prompt = '''You are given an input text for a chat interface. Propose auto-completion to the text. You have several roles:
 - Fight under-specification: if the user does not provide sufficient context, propose them a set of relevant suggestions.
 - Complete text: The text provided to you is in the making. If you have a good idea for how to complete - make suggestions.
         {'role': 'system', 'content': system_prompt},
         {'role': 'user', 'content': text}
     ]
+    return pipe(messages, generate_kwargs=generate_kwargs)
 if __name__ == "__main__":