n1ck-guo committed on
Commit
1b1a336
·
1 Parent(s): e25bed0

upload auto_round format

Browse files

Signed-off-by: n1ck-guo <[email protected]>

config.json CHANGED
@@ -19,11 +19,11 @@
19
  "quantization_config": {
20
  "amp": true,
21
  "autoround_version": "0.4.2",
 
22
  "batch_size": 8,
23
  "bits": 2,
24
- "damp_percent": 0.01,
25
  "data_type": "int",
26
- "desc_act": false,
27
  "enable_minmax_tuning": true,
28
  "enable_norm_bias_tuning": false,
29
  "enable_quanted_input": true,
@@ -34,12 +34,11 @@
34
  "lr": 0.0005,
35
  "minmax_lr": 0.0005,
36
  "nsamples": 1024,
37
- "quant_method": "gptq",
38
  "scale_dtype": "torch.float16",
39
  "seqlen": 2048,
40
  "sym": true,
41
- "to_quant_block_names": null,
42
- "true_sequential": false
43
  },
44
  "rms_norm_eps": 1e-06,
45
  "rope_scaling": null,
 
19
  "quantization_config": {
20
  "amp": true,
21
  "autoround_version": "0.4.2",
22
+ "backend": "auto_round:gptq:exllamav2",
23
  "batch_size": 8,
24
  "bits": 2,
 
25
  "data_type": "int",
26
+ "dataset": "NeelNanda/pile-10k",
27
  "enable_minmax_tuning": true,
28
  "enable_norm_bias_tuning": false,
29
  "enable_quanted_input": true,
 
34
  "lr": 0.0005,
35
  "minmax_lr": 0.0005,
36
  "nsamples": 1024,
37
+ "quant_method": "intel/auto-round",
38
  "scale_dtype": "torch.float16",
39
  "seqlen": 2048,
40
  "sym": true,
41
+ "to_quant_block_names": null
 
42
  },
43
  "rms_norm_eps": 1e-06,
44
  "rope_scaling": null,
model-00001-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2397d8397bb52d5256453f9305babe26337048de676ca715830c7093ff61836f
3
  size 4997831816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:704b52b6074a16c10bab88925c6c8df9f8a774ec87cd21e68e7cd2cf1b2c8769
3
  size 4997831816
model-00002-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e0a5e68a8d9cbd5798f6b952ff0c4ee879629f08bd73fbafdd0f06bdeed02b2e
3
  size 4943608520
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df9498984817f3ffccc4885b53129e73ad32496dd1ab7bf56148131818ad3aab
3
  size 4943608520
model-00003-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bafbd7cfc6c96122263cca61694c8fa5b0aa5490b5efda94b70b63b975c4dc4c
3
  size 4943727032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18e864a5c47671dee16ddefad23ebdce2cd6dad6dd16733b06d8849497c97543
3
  size 4943727032
model-00004-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:df77ba4efd8d8d3a47ebd32c36f19b3e4f91e2fa454e0afb73a38cadd9d39a57
3
  size 4943727024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7613e3932ba7c44e825db22f8d6dc2dd81bcd23ff5275f9efd27287d17448968
3
  size 4943727024
model-00005-of-00006.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26dd7eb3beed75238cf0090c5287be83889375527f20fca1d24ee43f9170fbc0
3
  size 2713862656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b51b7d191285acf680909cb6a521cab4e19c092b12c1318cde5bb3a05fdd6e38
3
  size 2713862656