Update configs.py
Browse files — configs.py (+1 line added, −1 line removed)
configs.py
CHANGED
@@ -35,7 +35,7 @@ model_info = {
|
|
35 |
),
|
36 |
'CodeLLAMA 70B Instruct (Experimental)': dict(model_path='TheBloke/CodeLlama-70B-Instruct-GPTQ',
|
37 |
token=os.environ['hf_token'],
|
38 |
-                                                     wait_with_hidden_states=True, dont_cuda=True, device_map='cuda', disable_exllama=True,
|
39 |
original_prompt_template='<s>{prompt}',
|
40 |
interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
|
41 |
layers_format=llama_layers_format
|
|
|
35 |
),
|
36 |
'CodeLLAMA 70B Instruct (Experimental)': dict(model_path='TheBloke/CodeLlama-70B-Instruct-GPTQ',
|
37 |
token=os.environ['hf_token'],
|
38 |
+                                                     wait_with_hidden_states=True, dont_cuda=True, device_map='cuda', # disable_exllama=True,
|
39 |
original_prompt_template='<s>{prompt}',
|
40 |
interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
|
41 |
layers_format=llama_layers_format
|