dar-tau committed on
Commit
a6550e6
1 Parent(s): e8236ff

Update configs.py

Browse files
Files changed (1) hide show
  1. configs.py +3 -2
configs.py CHANGED
@@ -17,8 +17,9 @@ model_info = {
17
  'LLAMA2-7B': dict(model_path='meta-llama/Llama-2-7b-chat-hf', token=os.environ['hf_token'],
18
  original_prompt_template='<s>{prompt}',
19
  interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
20
- layers_format=llama_layers_format), # , load_in_8bit=True
21
- 'LLAMA2-13B': dict(model_path='meta-llama/Llama-2-13b-chat-hf', token=os.environ['hf_token'],
 
22
  original_prompt_template='<s>{prompt}',
23
  interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
24
  layers_format=llama_layers_format),
 
17
  'LLAMA2-7B': dict(model_path='meta-llama/Llama-2-7b-chat-hf', token=os.environ['hf_token'],
18
  original_prompt_template='<s>{prompt}',
19
  interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
20
+ layers_format=llama_layers_format),
21
+ 'LLAMA2-13B': dict(model_path='meta-llama/Llama-2-13b-chat-hf',
22
+ token=os.environ['hf_token'], device_map='cuda', load_in_8bit=True,
23
  original_prompt_template='<s>{prompt}',
24
  interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
25
  layers_format=llama_layers_format),