Lazyhope/python-clone-detection

Feature Extraction

text-embeddings-inference

Inference Endpoints

Model card | Files and versions | Community

python-clone-detection / tokenizer_config.json

Lazyhope's picture

Add pipeline for clone detection

d0e1e46 about 2 years ago

history blame contribute delete

1.52 kB

	{
	"add_prefix_space": false,
	"bos_token": {
	"__type": "AddedToken",
	"content": "<s>",
	"lstrip": false,
	"normalized": true,
	"rstrip": false,
	"single_word": false
	},
	"cls_token": {
	"__type": "AddedToken",
	"content": "<s>",
	"lstrip": false,
	"normalized": true,
	"rstrip": false,
	"single_word": false
	},
	"eos_token": {
	"__type": "AddedToken",
	"content": "</s>",
	"lstrip": false,
	"normalized": true,
	"rstrip": false,
	"single_word": false
	},
	"errors": "replace",
	"mask_token": {
	"__type": "AddedToken",
	"content": "<mask>",
	"lstrip": true,
	"normalized": true,
	"rstrip": false,
	"single_word": false
	},
	"model_max_length": 512,
	"name_or_path": "Lazyhope/python-clone-detection",
	"pad_token": {
	"__type": "AddedToken",
	"content": "<pad>",
	"lstrip": false,
	"normalized": true,
	"rstrip": false,
	"single_word": false
	},
	"sep_token": {
	"__type": "AddedToken",
	"content": "</s>",
	"lstrip": false,
	"normalized": true,
	"rstrip": false,
	"single_word": false
	},
	"special_tokens_map_file": "/root/autodl-tmp/.cache/models--microsoft--graphcodebert-base/snapshots/2b0488a7bb0eefc7041f1bb2cad1ab26b0da269d/special_tokens_map.json",
	"tokenizer_class": "RobertaTokenizer",
	"trim_offsets": true,
	"unk_token": {
	"__type": "AddedToken",
	"content": "<unk>",
	"lstrip": false,
	"normalized": true,
	"rstrip": false,
	"single_word": false
	}
	}