riczhou committed on
Commit
2b2fab4
·
verified ·
1 Parent(s): 82c6ace

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "<image_soft_token>": 262144
3
+ }
mlc-chat-config.json ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "gemma3",
4
+ "quantization": "q4f16_1",
5
+ "model_config": {
6
+ "text_config": {
7
+ "hidden_size": 3840,
8
+ "intermediate_size": 15360,
9
+ "num_hidden_layers": 48,
10
+ "attention_bias": false,
11
+ "num_attention_heads": 16,
12
+ "num_key_value_heads": 8,
13
+ "head_dim": 256,
14
+ "rms_norm_eps": 1e-06,
15
+ "hidden_activation": "gelu_pytorch_tanh",
16
+ "position_embedding_base": 10000,
17
+ "context_window_size": 8192,
18
+ "prefill_chunk_size": 8192,
19
+ "query_pre_attn_scalar": 256,
20
+ "sliding_window": 1024,
21
+ "kwargs": {
22
+ "model_type": "gemma3_text",
23
+ "rope_scaling": {
24
+ "factor": 8.0,
25
+ "rope_type": "linear"
26
+ }
27
+ }
28
+ },
29
+ "vocab_size": 262208,
30
+ "tensor_parallel_shards": 1,
31
+ "max_batch_size": 128,
32
+ "context_window_size": 8192,
33
+ "sliding_window_size": -1,
34
+ "prefill_chunk_size": 8192,
35
+ "is_text_model": false
36
+ },
37
+ "vocab_size": 262208,
38
+ "context_window_size": 8192,
39
+ "sliding_window_size": -1,
40
+ "prefill_chunk_size": 8192,
41
+ "attention_sink_size": -1,
42
+ "tensor_parallel_shards": 1,
43
+ "pipeline_parallel_stages": 1,
44
+ "temperature": 1.0,
45
+ "presence_penalty": 0.0,
46
+ "frequency_penalty": 0.0,
47
+ "repetition_penalty": 1.0,
48
+ "top_p": 0.95,
49
+ "tokenizer_files": [
50
+ "tokenizer.model",
51
+ "tokenizer.json",
52
+ "added_tokens.json",
53
+ "tokenizer_config.json"
54
+ ],
55
+ "tokenizer_info": {
56
+ "token_postproc_method": "byte_fallback",
57
+ "prepend_space_in_encode": false,
58
+ "strip_space_in_decode": false
59
+ },
60
+ "conv_template": {
61
+ "name": "gemma_instruction",
62
+ "system_template": "{system_message}",
63
+ "system_message": "",
64
+ "system_prefix_token_ids": [
65
+ 2
66
+ ],
67
+ "add_role_after_system_message": true,
68
+ "roles": {
69
+ "user": "<start_of_turn>user",
70
+ "assistant": "<start_of_turn>model"
71
+ },
72
+ "role_templates": {
73
+ "user": "{user_message}",
74
+ "assistant": "{assistant_message}",
75
+ "tool": "{tool_message}"
76
+ },
77
+ "messages": [],
78
+ "seps": [
79
+ "<end_of_turn>\n"
80
+ ],
81
+ "role_content_sep": "\n",
82
+ "role_empty_sep": "\n",
83
+ "stop_str": [
84
+ "<end_of_turn>"
85
+ ],
86
+ "stop_token_ids": [
87
+ 1,
88
+ 106
89
+ ],
90
+ "function_string": "",
91
+ "use_function_calling": false
92
+ },
93
+ "pad_token_id": 0,
94
+ "bos_token_id": 2,
95
+ "eos_token_id": [
96
+ 1,
97
+ 106
98
+ ]
99
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b18fe7ba93eb4d604465d51a2f5f6b43b621164c7b759c28650cf30e61452750
3
+ size 503439360
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ff13b6b8b28a18abd3b7f7a41b24d3dae0a6a414928970d5313b454bfa736a3
3
+ size 62929920
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b12d0f110db8a53c9e7f324b4a0254a4b2b96121d05bba0bd2a595892dfb3048
3
+ size 28785664
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18066322de58eaecf8ceebbbc2462bb09f83dd2cc8d64436afa2abf2ac4f7746
3
+ size 33447424
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee67d185ed2356b236900a3bc9cef1b12d9098fc845c6011b09dfaef441d2586
3
+ size 29990400
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6f1ce926229d1db8af96c54ee4c16192a6ac51270632c6233e8d770c0fb2385
3
+ size 58982400
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e0c72a543ac975597de03b057a09f78bf904b340bb19584ad1e5d5d30de1f98
3
+ size 33201664
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b7cb4f322d982fca6e9f4709bfa313106204f633f1599b5e58afc35f1e53051
3
+ size 29491200
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e4093cedc5b452f1ced924866ec9035762fd297a2945a504b598f358366dcba1
3
+ size 58982400
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e65cb8163624e702e22b21b8a164868070adfadabd6520a68af27f15b1f08e7b
3
+ size 28785664
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ed91bea95d27d21b098203565fc3806296fb1b0d1a4b692f47f4dd7a9a73d89
3
+ size 29491200
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54718192f9b317e163d2bf93b2fe3c580022b1c61a4593eba44c6d8f3486c26a
3
+ size 58982400
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4de5d2ba99dca91cc7a8047412a1775258c6a202a6e666c7ca343378d36e38e7
3
+ size 28785152
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f9b146494ec391013cb08932992e37019f5254eb53d403133805fe792d9454a
3
+ size 29491200
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd8890577995abf0de97860dd2b67efafb1b3ceece5b26957f6ab1e502d7ff74
3
+ size 29491200
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afb2784be0449af9e5c5ebb98eb5433a123cb1ff0ae62c897b0d7da2ff0299e1
3
+ size 58982400
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26411bb2a165df0cbbc4d9852be6954cb8b8436d07daee82bad803d30dc6f017
3
+ size 33209344
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f499595e7d49fa16426304f649ee0e3598f8a8655e9b5e9e54b680353c98089
3
+ size 29491200
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6a588f82c45ce9ab4659fc296ae7cda6d44f155de72edd4cacc5ea56d01c18d
3
+ size 58982400
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3aea08c537dde3b35c7d57c7693c37e13d8797dc05ca5fc92f546f8914dae4ad
3
+ size 30236672
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25b7739dbf8faa22d14d90bef7c9ab0472006e6e452bc3cc12c4bcad093d4460
3
+ size 33447424
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05d3b8886922e01f3fd25f29842f8cfc8aa92c230f1a7825f36380d080efdf80
3
+ size 29990400
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6110750aa339e1bc24dc1304930362d6f6d4eca0847731045efd07dd0729fbbf
3
+ size 58982400
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2846579aa904ee0d335cd91ecb0a96d968db08c0c38fa1db1be5f20b2e5659e3
3
+ size 33201664
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efab9391d009a2e529ad3b4d3e1d47644845f5e3bebbfdf4e22a580dfbd952af
3
+ size 58982400
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6341586e7aa0816bd295aad6b568166898cf6f43eb485b023bfebdd54b0e173
3
+ size 58982400
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a9fa8f20076aa47fd29074348f40ef751ef9b5fa6fa4a3ebbe64e458b1e05b0
3
+ size 32932864
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d00bd0a9ec36f1486a0c5e3f04c0a394e3ce4db4662e28afc91311614a8c18a5
3
+ size 29491200
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7df36d996a9e583180c14002886ba1b0d60c952a8116d598edfad7114e58e587
3
+ size 29491200
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8be35fc9169c2325f6058479f8cef46aa69c77c71cf9a56bf8683dd214e6085
3
+ size 58982400
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d4234f07840e7f719a8904d0762b7565330acb21f421ef23dad9fcbecb0b200
3
+ size 33485824
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c23c88d12b002dd5f36ce1890ec7f00131bd838e6ca2643cdc42193227cdd552
3
+ size 29491200
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9c6c7b754f4641103eb82b4afd8455dbdd546051fe2c647e86e1f72ee00191d
3
+ size 58982400
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8651e1dbf449fcb432e1b7435910fad07d3b6e8f8a6948893b5db4b66aef148
3
+ size 28785152
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a41d3c8cd5a63eedfdf796e3eaefbb9e3e739d9f82b6082a69f221ec93df8edf
3
+ size 29491200
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8f4dd09e12ed64b10b4697e1b1b84ccf029e102d6e0117b5d0f501cf780afbe
3
+ size 28785152
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:906e67bca1e154842a3f55dcbe8b458e402f0a585809f46b545d8e877fa230d5
3
+ size 58982400
params_shard_131.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04de447be4ffbf2cc6ae55b83c82154f107d93302d58d8ee9f7355d71a0ebc8b
3
+ size 33209344
params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:212605f2eec0c134c8c5743df5b834b2ce9a570e6f633711b15c20a83c87679a
3
+ size 29491200
params_shard_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b30be5471d4290abcfe6f4c9012e11fb8f1273a51104b861416f0b0798143e7
3
+ size 58982400
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea0370b723b0acb1323c9233d066a6bef94cebd45fb843acacd3d066b287d019
3
+ size 30236672
params_shard_135.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e686bd3256edf17795614d0aa83403f286bfd4ace8dca6530189b9eb368a4d81
3
+ size 33447424
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f320010ecc8699ba6f17625f10edebc5971c1f294c17ed965a68377806ca2b08
3
+ size 29990400
params_shard_137.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14a2a14ac3fda18f4196af27656fe99196c78c4c4cb53470ea3e45c4f1d40a94
3
+ size 58982400
params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a68e701f96493b523b56fdd5e0a504e8802590e1a07aee10ad061d18d2133812
3
+ size 33201664
params_shard_139.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b3ec87ba4b6ebab375c49cf66df2416c10882dec6370df49927ec821a3a1945
3
+ size 29491200