upload auto_round format
Browse files
Signed-off-by: n1ck-guo <[email protected]>
config.json
CHANGED
@@ -19,11 +19,11 @@
|
|
19 |
"quantization_config": {
|
20 |
"amp": true,
|
21 |
"autoround_version": "0.4.2",
|
|
|
22 |
"batch_size": 8,
|
23 |
"bits": 2,
|
24 |
-
"damp_percent": 0.01,
|
25 |
"data_type": "int",
|
26 |
-
"
|
27 |
"enable_minmax_tuning": true,
|
28 |
"enable_norm_bias_tuning": false,
|
29 |
"enable_quanted_input": true,
|
@@ -34,12 +34,11 @@
|
|
34 |
"lr": 0.0005,
|
35 |
"minmax_lr": 0.0005,
|
36 |
"nsamples": 1024,
|
37 |
-
"quant_method": "
|
38 |
"scale_dtype": "torch.float16",
|
39 |
"seqlen": 2048,
|
40 |
"sym": true,
|
41 |
-
"to_quant_block_names": null
|
42 |
-
"true_sequential": false
|
43 |
},
|
44 |
"rms_norm_eps": 1e-06,
|
45 |
"rope_scaling": null,
|
|
|
19 |
"quantization_config": {
|
20 |
"amp": true,
|
21 |
"autoround_version": "0.4.2",
|
22 |
+
"backend": "auto_round:gptq:exllamav2",
|
23 |
"batch_size": 8,
|
24 |
"bits": 2,
|
|
|
25 |
"data_type": "int",
|
26 |
+
"dataset": "NeelNanda/pile-10k",
|
27 |
"enable_minmax_tuning": true,
|
28 |
"enable_norm_bias_tuning": false,
|
29 |
"enable_quanted_input": true,
|
|
|
34 |
"lr": 0.0005,
|
35 |
"minmax_lr": 0.0005,
|
36 |
"nsamples": 1024,
|
37 |
+
"quant_method": "intel/auto-round",
|
38 |
"scale_dtype": "torch.float16",
|
39 |
"seqlen": 2048,
|
40 |
"sym": true,
|
41 |
+
"to_quant_block_names": null
|
|
|
42 |
},
|
43 |
"rms_norm_eps": 1e-06,
|
44 |
"rope_scaling": null,
|
model-00001-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4997831816
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:704b52b6074a16c10bab88925c6c8df9f8a774ec87cd21e68e7cd2cf1b2c8769
|
3 |
size 4997831816
|
model-00002-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4943608520
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df9498984817f3ffccc4885b53129e73ad32496dd1ab7bf56148131818ad3aab
|
3 |
size 4943608520
|
model-00003-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4943727032
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18e864a5c47671dee16ddefad23ebdce2cd6dad6dd16733b06d8849497c97543
|
3 |
size 4943727032
|
model-00004-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4943727024
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7613e3932ba7c44e825db22f8d6dc2dd81bcd23ff5275f9efd27287d17448968
|
3 |
size 4943727024
|
model-00005-of-00006.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2713862656
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b51b7d191285acf680909cb6a521cab4e19c092b12c1318cde5bb3a05fdd6e38
|
3 |
size 2713862656
|