cortexso
/

test-internlm3-8b-instruct-gguf

Inference Endpoints

Model card Files Files and versions Community

test-internlm3-8b-instruct-gguf / model.yml

jan-hq's picture

Upload model.yml with huggingface_hub

2d0b5a0 verified 15 days ago

history blame contribute delete

927 Bytes

	# BEGIN GENERAL GGUF METADATA
	id: test-internlm3-8b-instruct-gguf
	model: test-internlm3-8b-instruct-gguf
	name: test-internlm3-8b-instruct-gguf
	version: 1
	# END GENERAL GGUF METADATA

	# BEGIN INFERENCE PARAMETERS
	# BEGIN REQUIRED
	stop:
	- <\|im_end\|>
	- </s>
	# END REQUIRED

	# BEGIN OPTIONAL
	stream: true
	top_p: 0.9
	temperature: 0.7
	frequency_penalty: 0
	presence_penalty: 0
	max_tokens: 4096
	seed: -1
	dynatemp_range: 0
	dynatemp_exponent: 1
	top_k: 40
	min_p: 0.05
	tfs_z: 1
	typ_p: 1
	repeat_last_n: 64
	repeat_penalty: 1
	mirostat: false
	mirostat_tau: 5
	mirostat_eta: 0.100000001
	penalize_nl: false
	ignore_eos: false
	n_probs: 0
	min_keep: 0
	# END OPTIONAL
	# END INFERENCE PARAMETERS

	# BEGIN MODEL LOAD PARAMETERS
	# BEGIN REQUIRED
	engine: llama-cpp
	prompt_template: <\|im_start\|>system\n{system_message}<\|im_end\|>\n<\|im_start\|>user\n{prompt}<\|im_end\|>\n<\|im_start\|>assistant
	ctx_len: 4096
	ngl: 34
	# END REQUIRED
	# END MODEL LOAD PARAMETERS