Initial commit
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- logs.txt +0 -0
- mlc-chat-config.json +71 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_14.bin +3 -0
- params_shard_15.bin +3 -0
- params_shard_16.bin +3 -0
- params_shard_17.bin +3 -0
- params_shard_18.bin +3 -0
- params_shard_19.bin +3 -0
- params_shard_2.bin +3 -0
- params_shard_20.bin +3 -0
- params_shard_21.bin +3 -0
- params_shard_22.bin +3 -0
- params_shard_23.bin +3 -0
- params_shard_24.bin +3 -0
- params_shard_25.bin +3 -0
- params_shard_26.bin +3 -0
- params_shard_27.bin +3 -0
- params_shard_28.bin +3 -0
- params_shard_29.bin +3 -0
- params_shard_3.bin +3 -0
- params_shard_30.bin +3 -0
- params_shard_31.bin +3 -0
- params_shard_32.bin +3 -0
- params_shard_33.bin +3 -0
- params_shard_34.bin +3 -0
- params_shard_35.bin +3 -0
- params_shard_36.bin +3 -0
logs.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,71 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"model_type": "llama",
|
3 |
+
"quantization": "q4f32_1",
|
4 |
+
"model_config": {
|
5 |
+
"hidden_size": 4096,
|
6 |
+
"intermediate_size": 11008,
|
7 |
+
"num_attention_heads": 32,
|
8 |
+
"num_hidden_layers": 32,
|
9 |
+
"rms_norm_eps": 1e-05,
|
10 |
+
"vocab_size": 32016,
|
11 |
+
"position_embedding_base": 1000000,
|
12 |
+
"context_window_size": 16384,
|
13 |
+
"prefill_chunk_size": 16384,
|
14 |
+
"num_key_value_heads": 32,
|
15 |
+
"head_dim": 128,
|
16 |
+
"tensor_parallel_shards": 1,
|
17 |
+
"max_batch_size": 80
|
18 |
+
},
|
19 |
+
"vocab_size": 32016,
|
20 |
+
"context_window_size": 16384,
|
21 |
+
"sliding_window_size": -1,
|
22 |
+
"prefill_chunk_size": 16384,
|
23 |
+
"attention_sink_size": -1,
|
24 |
+
"tensor_parallel_shards": 1,
|
25 |
+
"mean_gen_len": 128,
|
26 |
+
"max_gen_len": 512,
|
27 |
+
"shift_fill_factor": 0.3,
|
28 |
+
"temperature": 0.7,
|
29 |
+
"presence_penalty": 0.0,
|
30 |
+
"frequency_penalty": 0.0,
|
31 |
+
"repetition_penalty": 1.0,
|
32 |
+
"top_p": 0.95,
|
33 |
+
"conv_template": {
|
34 |
+
"name": "llama-2",
|
35 |
+
"system_template": "[INST] <<SYS>>\n{system_message}\n<</SYS>>\n\n ",
|
36 |
+
"system_message": "You are a helpful, respectful and honest assistant.",
|
37 |
+
"roles": {
|
38 |
+
"user": "[INST]",
|
39 |
+
"assistant": "[/INST]",
|
40 |
+
"tool": "[INST]"
|
41 |
+
},
|
42 |
+
"role_templates": {
|
43 |
+
"user": "{user_message}",
|
44 |
+
"assistant": "{assistant_message}",
|
45 |
+
"tool": "{tool_message}"
|
46 |
+
},
|
47 |
+
"messages": [],
|
48 |
+
"seps": [
|
49 |
+
" "
|
50 |
+
],
|
51 |
+
"role_content_sep": " ",
|
52 |
+
"role_empty_sep": " ",
|
53 |
+
"stop_str": [
|
54 |
+
"[INST]"
|
55 |
+
],
|
56 |
+
"stop_token_ids": [
|
57 |
+
2
|
58 |
+
],
|
59 |
+
"function_string": "",
|
60 |
+
"use_function_calling": false
|
61 |
+
},
|
62 |
+
"pad_token_id": 0,
|
63 |
+
"bos_token_id": 1,
|
64 |
+
"eos_token_id": 2,
|
65 |
+
"tokenizer_files": [
|
66 |
+
"tokenizer.model",
|
67 |
+
"tokenizer.json",
|
68 |
+
"tokenizer_config.json"
|
69 |
+
],
|
70 |
+
"version": "0.1.0"
|
71 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:70e0f1ebdf829283a00ad81e3889ae4fe07a53f7fcf07091a9ebd5fd7bd560f4
|
3 |
+
size 65952960
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91dc38990040f7303b54403b0d38696243f757bd9efec7d1b9a5b5e1b1ece6de
|
3 |
+
size 65952960
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c5d97c54845cbdf23bf123e0b5e5016ce20dad0a00a3373584ac10a0548f2ff
|
3 |
+
size 45352960
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:907cf15511d7b150e2d6eaf0fc7b9b9c7aa1e6adb607987af181944b0fe4f0f2
|
3 |
+
size 25313280
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ae42d2be8294986a158f1a5786327f0d90460d25275ba13c55181e8b53cf1c1
|
3 |
+
size 45352960
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c25fca5b4e8fbf5d9027928722ebdc70a37ca8aec5b53ff145936f85de5af9d8
|
3 |
+
size 22609920
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71c7b6f3f080d57289e4b33752ffe26859620beffa3ba8e1ecc221ed2c460fc5
|
3 |
+
size 32450560
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:487f0d6ae06d5e9a344c5ac13ebb12db88d3bbeae95368e9a7faf196f4951f32
|
3 |
+
size 30113792
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30d322673c5d5a18c8071c00b354d18745a7b26574003728afb2bed272dbd586
|
3 |
+
size 45352960
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b20a03c10d60a3d2a1153fe1e7afa3a7dfeb5a1ef778ce9c5f8c7c3ead4b928d
|
3 |
+
size 22609920
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e359c1898323065c7115ef90dfb46cb35e29343a489af12592544900d5ab1ec1
|
3 |
+
size 25313280
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cf508f7323be7db43685aa5371c02bb7cd8b8ca98befc506e0b1e73175c265d
|
3 |
+
size 45352960
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c735c62fae6637269c319e73537d027fd03516efb465f03f419d0720ba963374
|
3 |
+
size 22609920
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e41be3d2e4ec992f5cad292c728b825738359794f28962f68e0474b56b3af513
|
3 |
+
size 30446592
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3ded31ea8ffc93f2c2fe72c5babb0772b156bb465d55732e60d6d9015af3a59
|
3 |
+
size 32450560
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef3ad9f3a384b1317c618707d8be5da5f799aa3d0322f8c58e15343452f24b17
|
3 |
+
size 30113792
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e375af3e65ec3cb5e10dbe94ddc3eac15bbfcfa5e7687f114d47f78d469dd30
|
3 |
+
size 45352960
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cae347dab3a6b70a3da9875f905210ffdc570686362289f69e51a429d873574e
|
3 |
+
size 22609920
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a06f4ff9803bd764fb2b3ffa321437f9aa1439bb4ee78e773db682c41a954b6
|
3 |
+
size 16086016
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d0ebd61d20fbde28291f92cd83fbd4c1843e7bd85f4c39fc19ac3bb4aac84d2
|
3 |
+
size 25313280
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1bf6182c3bc7418e85cc1f3c53ee066cca48bf10157e6612fdc38492965ff677
|
3 |
+
size 31945728
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed9da828d2f8d29b6f8c24412bb31bcdf35d6f00004b0e5721406a07d564002d
|
3 |
+
size 45352960
|
params_shard_15.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d9d496f43593a8d512c891e69f11448b35855337c173e912dab07bca45762b59
|
3 |
+
size 22609920
|
params_shard_16.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24f306baeb6d35c43b7c41b3c52c641b5f198c940cbd4b677637820db6b87612
|
3 |
+
size 25313280
|
params_shard_17.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71f18e573ae5e2f003f13658ed3d0eeb437ba215a798dcfc5f916755d06a73b5
|
3 |
+
size 45352960
|
params_shard_18.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5dff9a4a2530d114b6741f15c0f9cf84ccb41ab5523bddb63a5e49b80d4e19dc
|
3 |
+
size 22609920
|
params_shard_19.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb5c9a369e9933c5bd95ff97c373f9881f59816c671aa465562fe7dfea917311
|
3 |
+
size 32450560
|
params_shard_2.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:317eb19ffd1ede0bb4f7779f20151741a49c07bdf849bce88e03fd2ba618d5e4
|
3 |
+
size 25313280
|
params_shard_20.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad7d5f9189d2ba2e938952e51ed3a5ebfdadbf334a571b53d19c5e5221b25bca
|
3 |
+
size 30113792
|
params_shard_21.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c6fff8606e579e6e4d5c6361eec050cbcce148a84b5265b1195a7221866c9d7
|
3 |
+
size 45352960
|
params_shard_22.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07d3a050f5fc5217ca06b384cd60d8dc937b95335d03b12a028ffef564e74799
|
3 |
+
size 22609920
|
params_shard_23.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6c2118743fea35ab3afa1e9b277e31a2e299b5eb3cf339f44c57d42cac5cd7b
|
3 |
+
size 25313280
|
params_shard_24.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95784a88661df7a87b99f15b85134dcbec4c7e811f295b2d95ad3b896aad8063
|
3 |
+
size 45352960
|
params_shard_25.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbd98e2c02a9a67b96c8773e41becfd967d0475aabceadd6e107ea71c7a18387
|
3 |
+
size 22609920
|
params_shard_26.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fd990307125c023a399ee5ade26fd99f1ad63c08c7a8a8cf29e97d72ab4804b
|
3 |
+
size 32450560
|
params_shard_27.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7712ace6abedf9e37f7b9b5c342f20724616886d3f643ce2ff11d12c08e1705
|
3 |
+
size 30113792
|
params_shard_28.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b27a0cce72d60b773eef80b66447095f22e896b16ac74cc49073a47ee818e34
|
3 |
+
size 45352960
|
params_shard_29.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6cc424f74706adfeffa83066b0abf7f8bebcf372db1a130d977a93d82bad5f02
|
3 |
+
size 22609920
|
params_shard_3.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad5f844b3d1214ecc0934ac4e85919aff808bb857d92e883859582ce011941a8
|
3 |
+
size 45352960
|
params_shard_30.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06b032d3fdc71e9b0ad522af56ea8304659f8e890e00f7d2d2b281adc2381cc9
|
3 |
+
size 25313280
|
params_shard_31.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a6aca6614c7b2ce5ec959776224d6c2ab131e97c0747a72cd09a1ddaff2ccef
|
3 |
+
size 45352960
|
params_shard_32.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44d9091ab532739d0f5df464f820464df2aeb8e6de1a475feedea9a2cdaa3540
|
3 |
+
size 22609920
|
params_shard_33.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6bb852586f76fae6bb4181315cad3c308aedc6c9bddc431e7f83479fb3f974d8
|
3 |
+
size 32450560
|
params_shard_34.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecb66423e225652890f964de96f897d3041c7528cb5bf0c654713121ccac19fc
|
3 |
+
size 30113792
|
params_shard_35.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07bb41736da3977461272f77c922b9df80cffc818c8b8c80b1015e6262c9fa08
|
3 |
+
size 45352960
|
params_shard_36.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a0fda84c800a10028f5149dcb32c5ec82598f2d24b931f8501fef12f2c42b8e
|
3 |
+
size 22609920
|