curseofknowledge committed on
Commit
af96b41
·
verified ·
1 Parent(s): 6cb5b42

Training in progress, epoch 1

Browse files
README.md CHANGED
@@ -4,8 +4,8 @@ library_name: transformers
4
  model_name: gemma-text-to-sql
5
  tags:
6
  - generated_from_trainer
7
- - trl
8
  - sft
 
9
  licence: license
10
  ---
11
 
@@ -34,11 +34,11 @@ This model was trained with SFT.
34
 
35
  ### Framework versions
36
 
37
- - TRL: 0.18.1
38
- - Transformers: 4.52.4
39
- - Pytorch: 2.7.0+cu118
40
- - Datasets: 3.6.0
41
- - Tokenizers: 0.21.1
42
 
43
  ## Citations
44
 
 
4
  model_name: gemma-text-to-sql
5
  tags:
6
  - generated_from_trainer
 
7
  - sft
8
+ - trl
9
  licence: license
10
  ---
11
 
 
34
 
35
  ### Framework versions
36
 
37
+ - TRL: 0.19.1
38
+ - Transformers: 4.53.2
39
+ - Pytorch: 2.7.1+cu118
40
+ - Datasets: 4.0.0
41
+ - Tokenizers: 0.21.2
42
 
43
  ## Citations
44
 
adapter_config.json CHANGED
@@ -20,20 +20,22 @@
20
  "megatron_core": "megatron.core",
21
  "modules_to_save": null,
22
  "peft_type": "LORA",
 
23
  "r": 16,
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
  "o_proj",
28
- "down_proj",
29
  "k_proj",
30
  "up_proj",
31
- "v_proj",
32
  "q_proj",
33
- "gate_proj"
 
 
34
  ],
35
  "task_type": "CAUSAL_LM",
36
  "trainable_token_indices": null,
37
  "use_dora": false,
 
38
  "use_rslora": false
39
  }
 
20
  "megatron_core": "megatron.core",
21
  "modules_to_save": null,
22
  "peft_type": "LORA",
23
+ "qalora_group_size": 16,
24
  "r": 16,
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
  "o_proj",
 
29
  "k_proj",
30
  "up_proj",
 
31
  "q_proj",
32
+ "gate_proj",
33
+ "v_proj",
34
+ "down_proj"
35
  ],
36
  "task_type": "CAUSAL_LM",
37
  "trainable_token_indices": null,
38
  "use_dora": false,
39
+ "use_qalora": false,
40
  "use_rslora": false
41
  }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9566f3cfb7db387835c8302a42348a3523acc0e874dfc125125c9d62321abffb
3
  size 52231312
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:991e98d6dd5ae8e900786b786f86a27f6dd9997fd2d396bfa074c70a04c184bc
3
  size 52231312
runs/Jul19_03-03-05_DESKTOP-NKD4QD0/events.out.tfevents.1752883387.DESKTOP-NKD4QD0.15504.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9228dca491b6791fa5d5e5a0be0979e49eb88286006417347e3d85722bc62cf
3
+ size 6898
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae60ed5b58c845f6b4a063623062db18eca22dda99aeb0c7aae3690bcbc52374
3
- size 6097
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d183d4dc9532af96d8f32f89272661e4d9d08773227b09d74445c6c524c1c698
3
+ size 6225