riczhou committed on
Commit
2c0b4bb
·
verified ·
1 Parent(s): c84aeac

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "<image_soft_token>": 262144
3
+ }
mlc-chat-config.json ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "gemma3",
4
+ "quantization": "q4f16_1",
5
+ "model_config": {
6
+ "text_config": {
7
+ "hidden_size": 2560,
8
+ "intermediate_size": 10240,
9
+ "num_hidden_layers": 34,
10
+ "attention_bias": false,
11
+ "num_attention_heads": 8,
12
+ "num_key_value_heads": 4,
13
+ "head_dim": 256,
14
+ "rms_norm_eps": 1e-06,
15
+ "hidden_activation": "gelu_pytorch_tanh",
16
+ "position_embedding_base": 10000,
17
+ "context_window_size": 8192,
18
+ "prefill_chunk_size": 8192,
19
+ "query_pre_attn_scalar": 256,
20
+ "sliding_window": 1024,
21
+ "kwargs": {
22
+ "model_type": "gemma3_text",
23
+ "rope_scaling": {
24
+ "factor": 8.0,
25
+ "rope_type": "linear"
26
+ }
27
+ }
28
+ },
29
+ "vocab_size": 262208,
30
+ "tensor_parallel_shards": 1,
31
+ "max_batch_size": 128,
32
+ "context_window_size": 8192,
33
+ "sliding_window_size": -1,
34
+ "prefill_chunk_size": 8192,
35
+ "is_text_model": false
36
+ },
37
+ "vocab_size": 262208,
38
+ "context_window_size": 8192,
39
+ "sliding_window_size": -1,
40
+ "prefill_chunk_size": 8192,
41
+ "attention_sink_size": -1,
42
+ "tensor_parallel_shards": 1,
43
+ "pipeline_parallel_stages": 1,
44
+ "temperature": 1.0,
45
+ "presence_penalty": 0.0,
46
+ "frequency_penalty": 0.0,
47
+ "repetition_penalty": 1.0,
48
+ "top_p": 0.95,
49
+ "tokenizer_files": [
50
+ "tokenizer.model",
51
+ "tokenizer.json",
52
+ "added_tokens.json",
53
+ "tokenizer_config.json"
54
+ ],
55
+ "tokenizer_info": {
56
+ "token_postproc_method": "byte_fallback",
57
+ "prepend_space_in_encode": false,
58
+ "strip_space_in_decode": false
59
+ },
60
+ "conv_template": {
61
+ "name": "gemma_instruction",
62
+ "system_template": "{system_message}",
63
+ "system_message": "",
64
+ "system_prefix_token_ids": [
65
+ 2
66
+ ],
67
+ "add_role_after_system_message": true,
68
+ "roles": {
69
+ "user": "<start_of_turn>user",
70
+ "assistant": "<start_of_turn>model"
71
+ },
72
+ "role_templates": {
73
+ "user": "{user_message}",
74
+ "assistant": "{assistant_message}",
75
+ "tool": "{tool_message}"
76
+ },
77
+ "messages": [],
78
+ "seps": [
79
+ "<end_of_turn>\n"
80
+ ],
81
+ "role_content_sep": "\n",
82
+ "role_empty_sep": "\n",
83
+ "stop_str": [
84
+ "<end_of_turn>"
85
+ ],
86
+ "stop_token_ids": [
87
+ 1,
88
+ 106
89
+ ],
90
+ "function_string": "",
91
+ "use_function_calling": false
92
+ },
93
+ "pad_token_id": 0,
94
+ "bos_token_id": 2,
95
+ "eos_token_id": [
96
+ 1,
97
+ 106
98
+ ]
99
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64b9377e53483b31b52dc5a7ad5105f532afca51c9f70146500940badb38b008
3
+ size 335626240
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:077386c2310c69b5fd7b8627cf07afcb4394749057380e75313e4c2912e69f97
3
+ size 41953280
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9615ce8263227812883354e51b09d3584e98f0a17f5ce346fe280c66c2e9e195
3
+ size 26214400
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7b117c37f0b4eb3f7c4730b9a87e6d7ab0164f9a767bbfb086b5d94af620136
3
+ size 26891264
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:729831ddad012136eb241c02efad89d2d47571176590a3ced235c9382ca5ec21
3
+ size 26214400
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9831a42cc171e77b11be23ccad2f9b3d99885322a8bb801aa6739c661841ebb
3
+ size 26214400
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d82b74d1f0b177ee265dc013f31b33d954455d0f6613cc70238d2ca6007cd97e
3
+ size 31638016
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:241879aeff87150a818e1d366fb61918afb99ea0f91565153f870a2caf281c69
3
+ size 26214400
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50fba2fba3e0e61883ada494aec1ee07ea3f6fe90695aa8b6f78b21583114754
3
+ size 32790016
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0fe51ef07404cab1b3e41d7a567f8bb046e6890d896fbf5256cfc1b3afa190d
3
+ size 26214400
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9fc1b533a79649876683cd72e678573256d57bcfdbd8dff1f2b09a212cefd48
3
+ size 28370944
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f594e792931a1df7e94dd8237e980e6778e31e182c491688e561d38ddf33345
3
+ size 26214400
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96e5eaf4c89e6cfe3af072669079e6f800058e7f9a8c180cbfa521a01e2a5e71
3
+ size 26214400
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9392b3eb8fd6ca541b32bd118684d585e1a4f933624fcda0992290c45033bb68
3
+ size 26891264
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fd24c20ce993f21aadc57b3fedfae22d3bb6ba0f46ca308fe8bb3c25ef7d239
3
+ size 26214400
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d499f8f4a87d8e9f7444dfc2153549f3a37d6cc7cb266f0370fbf994c4b5065
3
+ size 26891264
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:279ae680fe1d0ceb4b13141b49b9565f087e0c5fb39e1beb22bdb516277d823d
3
+ size 26214400
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:041672e567cf1137166d6ed07180b80b9dae82092871473043d2ebfaaa83edc7
3
+ size 26891264
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48d13ab2d7f5bc5e17fb43249e237072d3a201af48d0de57e6c63272d01cf191
3
+ size 26214400
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:124ab303430edeef5702478a8575a99c52cc440724eb31ac41278d83fec47304
3
+ size 26891264
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:997374ca8a6bd4aecf0529eb7de19337a08e92d336ea0817d7c9f8bb4a22acef
3
+ size 26214400
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e65a65acf21087edb10315262110c5679c28de840e7f79ef15a3154b27eed33
3
+ size 26891264
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5bc9544515ac33d10dfe095f53c205363a20302935043fb2a509b66b3fb3acc
3
+ size 26214400
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fed856efbfd82d2f8137c913d2780eefec383f73c3f87dee7654ead042faa65
3
+ size 26896384
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c24e7e004910fbbeea0b3cc373d7a38b7bab33d012dfcf93c0da951365204fa
3
+ size 26891264
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b04afef4476bb1ba68fa109ae4c6e104b25f38cc7a9b1463d1850331edee2ae
3
+ size 26214400
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91191511f94b5286f3abaa5aa7c598b88eda669ab68133b0abcc2f44a61e12f7
3
+ size 32804352
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3de07c219f06dac99e1fb9ada367fd7074961f7e3a425a05ac56d849731c8c43
3
+ size 26214400
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b83b8fff38c42c27a207a36cbd321cd8a2f13191a430fb487492e659ab60731
3
+ size 31315456
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0067d71d4c6aaddcea5b972bd11d3534026c324eed7ca34cf05582d3767289e7
3
+ size 26214400
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31f05caf856e1a2ba6cdeca75759da42015b51c4174636bb55330708961941d8
3
+ size 31320064
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e4388361341623dfb7afa5044c5881392c2bba83edc9d8481a6079973c27efd
3
+ size 26214400
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee7092a9a5c53910d868b63d1a9f40f0ec512258a71be2cba1b5fcf590d1ff3c
3
+ size 26891264
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44c2d24a550b1e3ac404962f70507eab89378112725a79528f2da253f279d290
3
+ size 26214400
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1bd3ed0d249cec00a11cbd2cab7ba059bf2b8190f7854d064b07ceba7ac0167
3
+ size 26214400
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4086f39453c000b5f1e0c582a6c47439533da2c24290428e227ac920bcf85ab4
3
+ size 26891264
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73cd112767c61389c910e4270e5edaab0f25ba1dcd8283a5084ec7862f0335f5
3
+ size 26214400
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:864dcf8bb2850d7b7f6c38c1c94411dbee2ea58e28a512293fbd0f0958820d0a
3
+ size 26891264
params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e93b0e21dacae3b16635edf2a492a3a6ac9c0dd3fab27120dfc3268bd655044f
3
+ size 26214400
params_shard_44.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b11f9854ea436c68c430c6d29bfdea4ddccc4439f97f48ff91f889c46da5154
3
+ size 26891264
params_shard_45.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9c6330e54761f2363c95cd88d246abe0cdcc4a4a25b54f429a7c42ea2d43ad0
3
+ size 26214400
params_shard_46.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5fe584f5e6afe256879da1574842accabf939b91981a42f88287276bf2ffb50
3
+ size 26891264
params_shard_47.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ff2a4257929d7c04cc202f921b59184b761dc1d158f7be9a99e0f8fa539d5c0
3
+ size 26214400
params_shard_48.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b80da3cb56d4f44de4ea43568569a3c08af3a49891b89eb6f3e71abe7ffcca7f
3
+ size 26891264
params_shard_49.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69fb31813342f5d87f442c344177879bab1c49e3a1e48feaf729e89168717f0e
3
+ size 26214400
params_shard_5.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfe137aaa2b7bbadbd6a16f0de9b8c875a0980b0db28f110ae0b12f4b616101d
3
+ size 26891264