sharpenb's picture
97cdadb3b6bb61f5b9d892deef7ae097b0627f1dd804f21cdceb0c4e24ea8d03
ee23848 verified
raw
history blame
928 Bytes
{
"api_key": null,
"verify_url": "http://johnrachwan.pythonanywhere.com",
"smash_config": {
"pruners": "None",
"factorizers": "None",
"quantizers": "['llm-int8']",
"compilers": "None",
"task": "text_text_generation",
"device": "cuda",
"cache_dir": "/ceph/hdd/staff/charpent/.cache/models2nwis9i1",
"batch_size": 1,
"model_name": "h2oai/h2ogpt-gm-oasst1-en-2048-falcon-7b-v3",
"pruning_ratio": 0.0,
"n_quantization_bits": 8,
"output_deviation": 0.005,
"max_batch_size": 1,
"qtype_weight": "torch.qint8",
"qtype_activation": "torch.quint8",
"qobserver": "<class 'torch.ao.quantization.observer.MinMaxObserver'>",
"qscheme": "torch.per_tensor_symmetric",
"qconfig": "x86",
"group_size": 128,
"damp_percent": 0.1,
"save_load_fn": "bitsandbytes"
}
}