Update configs.py
Browse files - configs.py +2 -1
configs.py
CHANGED
@@ -34,7 +34,8 @@ model_info = {
|
|
34 |
layers_format=llama_layers_format
|
35 |
),
|
36 |
'CodeLLAMA 70B Instruct (Experimental)': dict(model_path='TheBloke/CodeLlama-70B-Instruct-GPTQ',
|
37 |
-
token=os.environ['hf_token'],
|
|
|
38 |
original_prompt_template='<s>{prompt}',
|
39 |
interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
|
40 |
layers_format=llama_layers_format
|
|
|
34 |
layers_format=llama_layers_format
|
35 |
),
|
36 |
'CodeLLAMA 70B Instruct (Experimental)': dict(model_path='TheBloke/CodeLlama-70B-Instruct-GPTQ',
|
37 |
+
token=os.environ['hf_token'],
|
38 |
+
wait_with_hidden_states=True, dont_cuda=True, device_map='cuda',
|
39 |
original_prompt_template='<s>{prompt}',
|
40 |
interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
|
41 |
layers_format=llama_layers_format
|