willopcbeta committed on
Commit
b356791
·
verified ·
1 Parent(s): 4b94af6

Upload 50 files

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
mlc-chat-config.json ADDED
@@ -0,0 +1,84 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "gemma2",
4
+ "quantization": "q4f32_1",
5
+ "model_config": {
6
+ "hidden_size": 2304,
7
+ "intermediate_size": 9216,
8
+ "attention_bias": false,
9
+ "num_attention_heads": 8,
10
+ "num_key_value_heads": 4,
11
+ "head_dim": 256,
12
+ "num_hidden_layers": 26,
13
+ "rms_norm_eps": 1e-06,
14
+ "vocab_size": 256000,
15
+ "hidden_activation": "gelu_pytorch_tanh",
16
+ "position_embedding_base": 10000.0,
17
+ "context_window_size": 4096,
18
+ "prefill_chunk_size": 4096,
19
+ "tensor_parallel_shards": 1,
20
+ "max_batch_size": 128,
21
+ "attn_logit_softcapping": 50.0,
22
+ "final_logit_softcapping": 30.0,
23
+ "query_pre_attn_scalar": 224,
24
+ "sliding_window": 4096
25
+ },
26
+ "vocab_size": 256000,
27
+ "context_window_size": 4096,
28
+ "sliding_window_size": -1,
29
+ "prefill_chunk_size": 4096,
30
+ "attention_sink_size": -1,
31
+ "tensor_parallel_shards": 1,
32
+ "pipeline_parallel_stages": 1,
33
+ "temperature": 1.0,
34
+ "presence_penalty": 0.0,
35
+ "frequency_penalty": 0.0,
36
+ "repetition_penalty": 1.0,
37
+ "top_p": 1.0,
38
+ "tokenizer_files": [
39
+ "tokenizer.model",
40
+ "tokenizer.json",
41
+ "tokenizer_config.json"
42
+ ],
43
+ "tokenizer_info": {
44
+ "token_postproc_method": "byte_fallback",
45
+ "prepend_space_in_encode": false,
46
+ "strip_space_in_decode": false
47
+ },
48
+ "conv_template": {
49
+ "name": "gemma_instruction",
50
+ "system_template": "{system_message}",
51
+ "system_message": "",
52
+ "system_prefix_token_ids": [
53
+ 2
54
+ ],
55
+ "add_role_after_system_message": true,
56
+ "roles": {
57
+ "user": "<start_of_turn>user",
58
+ "assistant": "<start_of_turn>model"
59
+ },
60
+ "role_templates": {
61
+ "user": "{user_message}",
62
+ "assistant": "{assistant_message}",
63
+ "tool": "{tool_message}"
64
+ },
65
+ "messages": [],
66
+ "seps": [
67
+ "<end_of_turn>\n"
68
+ ],
69
+ "role_content_sep": "\n",
70
+ "role_empty_sep": "\n",
71
+ "stop_str": [
72
+ "<end_of_turn>"
73
+ ],
74
+ "stop_token_ids": [
75
+ 1,
76
+ 107
77
+ ],
78
+ "function_string": "",
79
+ "use_function_calling": false
80
+ },
81
+ "pad_token_id": 0,
82
+ "bos_token_id": 2,
83
+ "eos_token_id": 1
84
+ }
ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9b43e33b7e2ce6df4d05647c76d8b4c44e3dd510087a9453ef200bc9fba0612
3
+ size 294912000
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83531e44766c063ef2d8275954c2558d77dc58e7804e642a06b995702e676490
3
+ size 36864000
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ab747b90c3ea26dd5a1b9a5a9235264eaebe3e4150264b0bbc00123e1b89157
3
+ size 33214464
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17622b67062bbae61ce3b4cfd63bdc5bcecefbd1cafe921c39b79fe24f1a71ff
3
+ size 33177600
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1047e18cc4e0e2d461a6ddab7c763e5667574ffcd1ababea3335f8a5b3b2eadd
3
+ size 21233664
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ba556f91a7ba7819ffa1eb7328208829373c04dc6a06d1b414f73314b1ebbd3
3
+ size 33214464
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:126cc854f1c2c70c62539162248ee0c27a6c40fb7e388cdb5f52cbc7c8edfb1e
3
+ size 33177600
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dbae3694219920bb7fcb2362be865a3ecb49505b41a1b4eb13a303e200b69b6
3
+ size 21233664
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63766b56fd061b049fee0ef8aa9edc23590bf30b2bcf9c7a9617a866aa03a389
3
+ size 33214464
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff715b1e3748653c53656f6b1a8ae8208b65ecbf8980a4fc2e7f3acd9eae5137
3
+ size 33177600
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:769eb052090fcad757bbe13f1c8d98f5389090d1ca76e8e7a65c08fdd3da632b
3
+ size 21233664
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57daeae836f74837213f9dfe1464171c21168297819c854a01f3ff68a2a79218
3
+ size 33214464
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f066e08ad385253415a3ed84ec600d9fddf031850b4c39361eb2610cdd4438aa
3
+ size 33182208
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:858559f568c05c14fbb17fad2d2365bbeb1edf05d2c01470cdabde660af0a83d
3
+ size 33177600
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b071afd77a652cda7f4b63ca39ecf042dda244787212ad81d18bc3a0615dcbd
3
+ size 21233664
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b507980363b8823ca170fe03ac42fce07d10e334fc8d8c0678162f8bc1a804e6
3
+ size 33214464
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:145bb4711f80a21aa9c1a02344bd155c9dc0b596875c0a303f476a22e0689dec
3
+ size 33177600
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6c78adc7e15c0daadfea29398b683d866ec6cfc7d39892e312ddb662f18f4e3
3
+ size 21233664
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ac32398ff7454fafcd673d8c172bb536375e65a6ef06613d9a414976391011f
3
+ size 33214464
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b68feab3ff904388f5ce3ad1907d21897e862f99a91746ed4d2a2974418cf64
3
+ size 33177600
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc41ba58b79908cbe2548cd81025e752b01c6316c8c41d9c7f0a4e7182974c86
3
+ size 31864320
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0303ed7ab3d6da008bb7ea96415b4d273eb8488439330634e9bf3f1a9baa3226
3
+ size 21233664
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff8fb82b07213b40d6ae479b9dc43b8655c0d3058b0dc225396d13044757708f
3
+ size 33200640
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26752994cbb0c9caa670d0c016b1aadf65648fb87fc112c5e3eed24e975dc20f
3
+ size 21233664
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b613af83b6288cc52837974ad58f85610c540dd81879178be60c2bb2f2d01faa
3
+ size 33177600
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e88d2bcccd09f93cec4996a415a893839d2480644f65cb1b469a58ff98504a16
3
+ size 21233664
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4da375bb80892074c8caf7226c119f019aeaf8927a655a0284543bea6691896c
3
+ size 33214464
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66ae3b6f2290aef19e415fcfdf57f5c7b518352bce68b5f275f476625adcaaec
3
+ size 33177600
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebfa1b1abbb619ed09dbb07985e5df7696f05dccc2c29a3908977ccd104ddb0f
3
+ size 21233664
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e196b995ddff0b515bcc48a04a49908a86aaa5c1b23bad9d50c7134d5cf0e248
3
+ size 33214464
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ef967a4b57be34eec2c473fe5368fa8a9a74e0c02acdf12fa2bddcf72a4a9c5
3
+ size 33177600
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddb2f8cf4d4fcc5d31d86f32a8815f12accd43f9eb51183c46fff7b86dc01e83
3
+ size 21233664
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc8e27904262b07cc9e87ba4427d64bc4c8a6ada6cbf4e484a885ddd4c6ab6a8
3
+ size 33214464
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6460ddd46486312f6bd2b2cd8581196fc1b6417dfb56a82005a6b35e94a66b37
3
+ size 21233664
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80cd240a75af027b84a987b71075caeab64bbbd0e3cbc01b9b1642823f344d7c
3
+ size 33214464
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:331ccd29b891513caefc425ce5179832eea41d00580790c524c086dc819ad29c
3
+ size 31882752
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:44c8098b23a69c1e043765c0b8aa74be841640726b5a958e443a4843a31fb3a0
3
+ size 2658816
params_shard_5.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e80a75bfa0b4add500f34dd34874b9279b15b30f3d0271c0e2696238cf7be7f
3
+ size 33177600
params_shard_6.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f11bad48cd19240f517339320ca82d8af651d9f4128422ad3f2631041b5f1fe4
3
+ size 21233664
params_shard_7.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2393ab6bd225764a8e66e3ab57008e37166965606cc4fcbfe93183086fea9fac
3
+ size 33214464
params_shard_8.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3cfb41f22c67f4a98efc367dd2cff1541c224aa30f887148b504e3a15c6989f
3
+ size 33177600
params_shard_9.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0476ce2eeb1302029572570dd608cceaee85331643786b926becc36710b461a4
3
+ size 21233664
tensor-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
tensor-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c36fea8c2ad69ed08c6180b465a70bf23e9bde2453632f9d3ba827383154def
3
+ size 34362885
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6969e64047744a44bb3abfb5c50f8de0f7ed8b571d5444426ef931f651d1a0ef
3
+ size 4241111