lleticiasilvaa committed (verified)
Commit fa517b3 · 1 Parent(s): e077a9e

Training in progress, step 1250

README.md CHANGED
@@ -1,7 +1,7 @@
 ---
 base_model: stabilityai/stable-code-instruct-3b
 library_name: transformers
-model_name: StableCode-text2SQL-alias-indentacao
+model_name: StableCode-text2SQL-withoutquantization
 tags:
 - generated_from_trainer
 - trl
@@ -9,7 +9,7 @@ tags:
 licence: license
 ---
 
-# Model Card for StableCode-text2SQL-alias-indentacao
+# Model Card for StableCode-text2SQL-withoutquantization
 
 This model is a fine-tuned version of [stabilityai/stable-code-instruct-3b](https://huggingface.co/stabilityai/stable-code-instruct-3b).
 It has been trained using [TRL](https://github.com/huggingface/trl).
@@ -20,24 +20,25 @@ It has been trained using [TRL](https://github.com/huggingface/trl).
 from transformers import pipeline
 
 question = "If you had a time machine, but could only go to the past or the future once and never return, which would you choose and why?"
-generator = pipeline("text-generation", model="lleticiasilvaa/StableCode-text2SQL-alias-indentacao", device="cuda")
+generator = pipeline("text-generation", model="lleticiasilvaa/StableCode-text2SQL-withoutquantization", device="cuda")
 output = generator([{"role": "user", "content": question}], max_new_tokens=128, return_full_text=False)[0]
 print(output["generated_text"])
 ```
 
 ## Training procedure
 
+
 
 
 This model was trained with SFT.
 
 ### Framework versions
 
-- TRL: 0.12.0
-- Transformers: 4.46.2
-- Pytorch: 2.5.0+cu121
-- Datasets: 3.1.0
-- Tokenizers: 0.20.3
+- TRL: 0.13.0
+- Transformers: 4.47.1
+- Pytorch: 2.5.1+cu121
+- Datasets: 3.2.0
+- Tokenizers: 0.21.0
 
 ## Citations
 
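The repository itself stores a LoRA adapter (see the adapter_config.json and adapter_model.safetensors changes below), so the pipeline snippet in the card relies on the Transformers/PEFT integration to pull the base model and attach the adapter automatically. For orientation, an equivalent explicit load might look like the sketch below; the dtype/device settings and the example question are assumptions, not values taken from this repo.

```python
# Sketch: loading the adapter explicitly on top of the base model with PEFT.
# dtype/device choices and the example question are assumptions, not values from this repo.
import torch
from peft import PeftModel
from transformers import AutoModelForCausalLM, AutoTokenizer

base = AutoModelForCausalLM.from_pretrained(
    "stabilityai/stable-code-instruct-3b",
    torch_dtype=torch.bfloat16,
    device_map="auto",
)
model = PeftModel.from_pretrained(base, "lleticiasilvaa/StableCode-text2SQL-withoutquantization")
tokenizer = AutoTokenizer.from_pretrained("lleticiasilvaa/StableCode-text2SQL-withoutquantization")

messages = [{"role": "user", "content": "List the names of all customers in the 'clients' table."}]
inputs = tokenizer.apply_chat_template(messages, add_generation_prompt=True, return_tensors="pt").to(model.device)
output = model.generate(inputs, max_new_tokens=128)
print(tokenizer.decode(output[0][inputs.shape[-1]:], skip_special_tokens=True))
```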
adapter_config.json CHANGED
@@ -6,6 +6,8 @@
   },
   "base_model_name_or_path": "stabilityai/stable-code-instruct-3b",
   "bias": "none",
+  "eva_config": null,
+  "exclude_modules": null,
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
@@ -14,6 +16,7 @@
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 128,
+  "lora_bias": false,
   "lora_dropout": 0.1,
   "megatron_config": null,
   "megatron_core": "megatron.core",
@@ -23,13 +26,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "q_proj",
-    "o_proj",
-    "v_proj",
     "k_proj",
-    "up_proj",
+    "down_proj",
+    "v_proj",
+    "o_proj",
     "gate_proj",
-    "down_proj"
+    "q_proj",
+    "up_proj"
   ],
   "task_type": null,
   "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7ab32c23cca063b93ae2b88c96355b5cc260795d91ee4cf1b08c5f5bb776b507
+oid sha256:0f9c750d51f6519dc289b70fa45af7dd6c73dd07f65d521798ef808e1ef90c24
 size 400616360
logs/events.out.tfevents.1735923028.1356149f6382.358.0 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:8f024c1e2d4631c2b2cba7a7cd69bf12510b023147029fc09c0bd2b4d298bd5c
+size 10670
logs/events.out.tfevents.1736189043.154f07f7b0d9.1770.0 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:411d2371102f8c8e78ffb5b7931c855affd4e6ceb77b4226bf5ed42c248f1da0
+size 10325
logs/events.out.tfevents.1736193007.154f07f7b0d9.1770.1 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:2f9c14789027d905f61df5a045ef15dceff49a4a059ff1afaf2251bf2fb8dc73
+size 6341
logs/events.out.tfevents.1736193779.154f07f7b0d9.1770.2 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:76fe71fc6491fcac0f506994f9ac674e695e3ac8e16942355319b76cd060841f
+size 6467
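The added logs/events.out.tfevents.* files are TensorBoard event logs, stored here as Git LFS pointers. Assuming the repo is cloned with LFS so the actual binaries are present, the scalars they contain can be read as in this sketch; the tag names depend on what the trainer logged.

```python
# Sketch: reading scalar metrics from one of the TensorBoard event files added above.
# Assumes the file was fetched via Git LFS (otherwise only a small pointer stub is present).
from tensorboard.backend.event_processing.event_accumulator import EventAccumulator

acc = EventAccumulator("logs/events.out.tfevents.1736189043.154f07f7b0d9.1770.0")
acc.Reload()
for tag in acc.Tags()["scalars"]:      # e.g. "train/loss", depending on what was logged
    for event in acc.Scalars(tag):
        print(tag, event.step, event.value)
```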
tokenizer_config.json CHANGED
@@ -384,6 +384,7 @@
   "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = 'You are a helpful assistant.' %}{% endif %}{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% for message in loop_messages %}{% if loop.index0 == 0 %}{{'<|im_start|>system\n' + system_message + '<|im_end|>\n'}}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
   "clean_up_tokenization_spaces": true,
   "eos_token": "<|endoftext|>",
+  "extra_special_tokens": {},
   "map_device": "auto",
   "model_max_length": 4096,
   "pad_token": "<|endoftext|>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:da3dedd34988f1200d6dd0bdca9a10b85e9fdb9d16cf44025625c8ff185de71a
+oid sha256:37d85e10062490083f3df78142b22b936ee4c10ad7bb1c35d68c6a9743be03a9
 size 5560
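training_args.bin is not human-readable: the Trainer serializes its TrainingArguments (here most likely TRL's SFTConfig) with torch.save. A sketch for inspecting it locally is below; the concrete hyperparameter values are not visible anywhere in this commit.

```python
# Sketch: inspecting the serialized training arguments.
# The file is a pickled TrainingArguments/SFTConfig object, so weights_only=False is needed
# on recent PyTorch versions; the concrete values are not shown anywhere in this commit.
import torch

args = torch.load("training_args.bin", weights_only=False)
print(type(args).__name__)
print(args.learning_rate, args.per_device_train_batch_size, args.num_train_epochs)
```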