nitky
/

Swallow-70b-NVE-RP

Text Generation

text-generation-inference

Inference Endpoints

Model card Files Files and versions Community

Swallow-70b-NVE-RP / mergekit_config.yml

nitky's picture

Upload 22 files

281fa5a verified 11 months ago

history blame contribute delete

1.24 kB

	models:
	- model: tokyotech-llm/Swallow-70b-NVE-instruct-hf
	# no parameters necessary for base model
	- model: GOAT-AI/GOAT-70B-Storytelling # storytelling
	parameters:
	density: 1
	weight: 0.25
	- model: dreamgen/opus-v0.5-70b # creative roleplay
	parameters:
	density: 1
	weight: 0.25
	merge_method: dare_ties
	base_model: tokyotech-llm/Swallow-70b-NVE-instruct-hf
	dtype: bfloat16
	name: Swallow-70b-NVE-RP-base
	---
	models:
	- model: tokyotech-llm/Swallow-70b-NVE-instruct-hf
	# no parameters necessary for base model
	- model: Doctor-Shotgun/lzlv-limarpv3-l2-70b # roleplay configuration
	parameters:
	density: 1
	weight: 0.25
	merge_method: dare_ties
	base_model: tokyotech-llm/Swallow-70b-NVE-instruct-hf
	dtype: bfloat16
	name: Swallow-70b-NVE-RP-flavor
	---
	slices:
	- sources:
	- model: Swallow-70b-NVE-RP-base
	layer_range: [0, 80]
	- model: Swallow-70b-NVE-RP-flavor
	layer_range: [0, 80]
	merge_method: slerp
	base_model: Swallow-70b-NVE-RP-base
	parameters:
	t:
	- filter: self_attn
	value: [0, 0.5, 0.3, 0.7, 1]
	- filter: mlp
	value: [1, 0.5, 0.7, 0.3, 0]
	- value: 0.5 # fallback for rest of tensors
	dtype: bfloat16
	name: Swallow-70b-NVE-RP