dar-tau committed on
Commit
11779fd
·
verified ·
1 Parent(s): 4306d57

Update configs.py

Browse files
Files changed (1) hide show
  1. configs.py +2 -1
configs.py CHANGED
@@ -34,7 +34,8 @@ model_info = {
34
  layers_format=llama_layers_format
35
  ),
36
  'CodeLLAMA 70B Instruct (Experimental)': dict(model_path='TheBloke/CodeLlama-70B-Instruct-GPTQ',
37
- token=os.environ['hf_token'], wait_with_hidden_states=True,
 
38
  original_prompt_template='<s>{prompt}',
39
  interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
40
  layers_format=llama_layers_format
 
34
  layers_format=llama_layers_format
35
  ),
36
  'CodeLLAMA 70B Instruct (Experimental)': dict(model_path='TheBloke/CodeLlama-70B-Instruct-GPTQ',
37
+ token=os.environ['hf_token'],
38
+ wait_with_hidden_states=True, dont_cuda=True, device_map='cuda',
39
  original_prompt_template='<s>{prompt}',
40
  interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
41
  layers_format=llama_layers_format