Spaces:

KBaba7
/

Quantization-LLM

Running

Quantization-LLM / llama.cpp /src /llama-sampling.h

Upload 7646 files

a1a4268 verified 14 days ago

754 Bytes

	#pragma once

	// TODO: rename llama-sampling.h/.cpp to llama-sampler.h/.cpp ?

	#include "llama.h"

	#include <vector>

	struct llama_vocab;
	struct llama_grammar;

	// sampler chain

	// State for a chain of samplers: the chain parameters, the samplers held by
	// the chain, and two counters grouped under "timing".
	// NOTE(review): member order may be relied on by brace-initialization in the
	// implementation file — confirm before reordering or adding members.
	struct llama_sampler_chain {
	// parameters of the chain (type is not declared in this header; presumably from llama.h)
	llama_sampler_chain_params params;

	// the samplers that make up the chain, held as raw pointers
	// NOTE(review): who frees these pointers is not visible here — confirm in the .cpp
	std::vector<struct llama_sampler *> samplers;

	// timing
	// (both counters are `mutable`, so they can be modified through a const chain)

	// presumably the accumulated sampling time in microseconds, per the `_us` suffix — TODO confirm
	mutable int64_t t_sample_us;

	// presumably the number of sampling calls counted so far — TODO confirm
	mutable int32_t n_sample;
	};

	// Declares an initializer that returns a `llama_sampler *` built from explicit
	// DRY parameters, with the sequence breakers supplied as token sequences
	// (`std::vector<llama_token>`) rather than as text.
	// NOTE(review): the `_testing` suffix suggests this entry point exists for
	// tests — confirm against the definition and its callers.
	//
	// Parameters (meanings inferred from names; the definition is not in this header):
	//   context_size       - presumably the context length the sampler is sized for — TODO confirm
	//   dry_multiplier     - presumably the DRY penalty multiplier — TODO confirm
	//   dry_base           - presumably the DRY penalty base — TODO confirm
	//   dry_allowed_length - presumably the repetition length allowed before penalizing — TODO confirm
	//   dry_penalty_last_n - presumably how many recent tokens are considered — TODO confirm
	//   seq_breakers       - sequence breakers, each given as a vector of tokens; taken by const reference
	//
	// Returns a pointer to a `llama_sampler`.
	// NOTE(review): ownership of the returned pointer is not visible here — confirm.
	struct llama_sampler * llama_sampler_init_dry_testing(
	int32_t context_size,
	float dry_multiplier,
	float dry_base,
	int32_t dry_allowed_length,
	int32_t dry_penalty_last_n,
	const std::vector<std::vector<llama_token>>& seq_breakers);