mirajnair committed on
Commit
324ee82
·
verified ·
1 Parent(s): a7f6cd2

update model

Browse files
Files changed (3) hide show
  1. config.json +35 -9
  2. generation_config.json +1 -1
  3. model.safetensors +2 -2
config.json CHANGED
@@ -1,21 +1,47 @@
1
  {
2
  "activation_function": "gelu",
3
  "architectures": [
4
- "GPT2LMHeadModel"
5
  ],
6
  "attn_pdrop": 0.1,
7
  "bos_token_id": "None",
8
  "embd_pdrop": 0.1,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9
  "eos_token_id": "None",
10
  "initializer_range": 0.02,
11
  "layer_norm_epsilon": 1e-05,
12
- "model_type": "gpt2",
13
- "n_ctx": 32,
14
- "n_embd": 192,
15
- "n_head": 6,
16
  "n_inner": null,
17
- "n_layer": 6,
18
- "n_positions": 32,
19
  "reorder_and_upcast_attn": false,
20
  "resid_pdrop": 0.1,
21
  "scale_attn_by_inverse_layer_idx": false,
@@ -26,7 +52,7 @@
26
  "summary_type": "cls_index",
27
  "summary_use_proj": true,
28
  "torch_dtype": "float32",
29
- "transformers_version": "4.50.3",
30
  "use_cache": true,
31
- "vocab_size": 5
32
  }
 
1
  {
2
  "activation_function": "gelu",
3
  "architectures": [
4
+ "CustomGPT2LMHeadModel"
5
  ],
6
  "attn_pdrop": 0.1,
7
  "bos_token_id": "None",
8
  "embd_pdrop": 0.1,
9
+ "embedding": {
10
+ "block_digit_ids": [
11
+ 3,
12
+ 4,
13
+ 5,
14
+ 6,
15
+ 7,
16
+ 8,
17
+ 9,
18
+ 10,
19
+ 11,
20
+ 12,
21
+ 13,
22
+ 14,
23
+ 15,
24
+ 16,
25
+ 17,
26
+ 18
27
+ ],
28
+ "data_offset": 2,
29
+ "embedding_type": "block",
30
+ "fixed_pos_ntk_alpha": 1.0,
31
+ "fixed_pos_scaling": 0.1,
32
+ "fixed_pos_theta": 10000.0,
33
+ "padding_digit_id": 1
34
+ },
35
  "eos_token_id": "None",
36
  "initializer_range": 0.02,
37
  "layer_norm_epsilon": 1e-05,
38
+ "model_type": "custom-gpt2",
39
+ "n_ctx": 16,
40
+ "n_embd": 256,
41
+ "n_head": 4,
42
  "n_inner": null,
43
+ "n_layer": 8,
44
+ "n_positions": 16,
45
  "reorder_and_upcast_attn": false,
46
  "resid_pdrop": 0.1,
47
  "scale_attn_by_inverse_layer_idx": false,
 
52
  "summary_type": "cls_index",
53
  "summary_use_proj": true,
54
  "torch_dtype": "float32",
55
+ "transformers_version": "4.51.3",
56
  "use_cache": true,
57
+ "vocab_size": 20
58
  }
generation_config.json CHANGED
@@ -2,5 +2,5 @@
2
  "_from_model_config": true,
3
  "bos_token_id": "None",
4
  "eos_token_id": "None",
5
- "transformers_version": "4.50.3"
6
  }
 
2
  "_from_model_config": true,
3
  "bos_token_id": "None",
4
  "eos_token_id": "None",
5
+ "transformers_version": "4.51.3"
6
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c651d15716b4237f87cb9ee879d27f2ccd73145b15be04d82df1a086dc1f174b
3
- size 10714080
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8f1c83a8248ebedb863d9aedc693fd81b69e4115df05e6a0d11dcd40f2e473b
3
+ size 25321112