Shubhra Pandit
committed on
Commit
·
1252068
1
Parent(s):
3c12e8e
Update model files
Browse files
- config.json +6 -7
- model-00001-of-00037.safetensors +2 -2
- model-00002-of-00037.safetensors +2 -2
- model-00003-of-00037.safetensors +2 -2
- model-00004-of-00037.safetensors +2 -2
- model-00005-of-00037.safetensors +2 -2
- model-00006-of-00037.safetensors +2 -2
- model-00007-of-00037.safetensors +2 -2
- model-00008-of-00037.safetensors +2 -2
- model-00009-of-00037.safetensors +2 -2
- model-00010-of-00037.safetensors +2 -2
- model-00011-of-00037.safetensors +2 -2
- model-00012-of-00037.safetensors +2 -2
- model-00013-of-00037.safetensors +2 -2
- model-00014-of-00037.safetensors +2 -2
- model-00015-of-00037.safetensors +2 -2
- model-00016-of-00037.safetensors +2 -2
- model-00017-of-00037.safetensors +2 -2
- model-00018-of-00037.safetensors +2 -2
- model-00019-of-00037.safetensors +2 -2
- model-00020-of-00037.safetensors +2 -2
- model-00021-of-00037.safetensors +2 -2
- model-00022-of-00037.safetensors +2 -2
- model-00023-of-00037.safetensors +2 -2
- model-00024-of-00037.safetensors +2 -2
- model-00025-of-00037.safetensors +2 -2
- model-00026-of-00037.safetensors +2 -2
- model-00027-of-00037.safetensors +2 -2
- model-00028-of-00037.safetensors +2 -2
- model-00029-of-00037.safetensors +2 -2
- model-00030-of-00037.safetensors +2 -2
- model-00031-of-00037.safetensors +2 -2
- model-00032-of-00037.safetensors +2 -2
- model-00033-of-00037.safetensors +2 -2
- model-00034-of-00037.safetensors +2 -2
- model-00035-of-00037.safetensors +2 -2
- model-00036-of-00037.safetensors +2 -2
- model-00037-of-00037.safetensors +2 -2
- model.safetensors.index.json +2 -2
- recipe.yaml +2 -21
config.json
CHANGED
|
@@ -45,20 +45,19 @@
|
|
| 45 |
"dynamic": false,
|
| 46 |
"group_size": 128,
|
| 47 |
"num_bits": 4,
|
| 48 |
-
"observer": "
|
| 49 |
"observer_kwargs": {},
|
|
|
|
| 50 |
"strategy": "group",
|
| 51 |
"symmetric": true,
|
| 52 |
-
"type": "int"
|
|
|
|
| 53 |
}
|
| 54 |
}
|
| 55 |
},
|
| 56 |
"format": "pack-quantized",
|
| 57 |
"global_compression_ratio": null,
|
| 58 |
"ignore": [
|
| 59 |
-
"model.layers.0.mlp.gate_proj",
|
| 60 |
-
"model.layers.1.mlp.gate_proj",
|
| 61 |
-
"model.layers.2.mlp.gate_proj",
|
| 62 |
"lm_head"
|
| 63 |
],
|
| 64 |
"kv_cache_scheme": null,
|
|
@@ -66,7 +65,7 @@
|
|
| 66 |
"quantization_status": "compressed",
|
| 67 |
"sparsity_config": {},
|
| 68 |
"transform_config": {},
|
| 69 |
-
"version": "0.12.3.dev31+gb019b89"
|
| 70 |
},
|
| 71 |
"rms_norm_eps": 1e-05,
|
| 72 |
"rope_scaling": null,
|
|
@@ -78,4 +77,4 @@
|
|
| 78 |
"use_cache": true,
|
| 79 |
"use_qk_norm": true,
|
| 80 |
"vocab_size": 151552
|
| 81 |
-
}
|
|
|
|
| 45 |
"dynamic": false,
|
| 46 |
"group_size": 128,
|
| 47 |
"num_bits": 4,
|
| 48 |
+
"observer": "minmax",
|
| 49 |
"observer_kwargs": {},
|
| 50 |
+
"scale_dtype": null,
|
| 51 |
"strategy": "group",
|
| 52 |
"symmetric": true,
|
| 53 |
+
"type": "int",
|
| 54 |
+
"zp_dtype": null
|
| 55 |
}
|
| 56 |
}
|
| 57 |
},
|
| 58 |
"format": "pack-quantized",
|
| 59 |
"global_compression_ratio": null,
|
| 60 |
"ignore": [
|
|
|
|
|
|
|
|
|
|
| 61 |
"lm_head"
|
| 62 |
],
|
| 63 |
"kv_cache_scheme": null,
|
|
|
|
| 65 |
"quantization_status": "compressed",
|
| 66 |
"sparsity_config": {},
|
| 67 |
"transform_config": {},
|
| 68 |
+
"version": "0.12.3.dev31+gb019b89.d20251216"
|
| 69 |
},
|
| 70 |
"rms_norm_eps": 1e-05,
|
| 71 |
"rope_scaling": null,
|
|
|
|
| 77 |
"use_cache": true,
|
| 78 |
"use_qk_norm": true,
|
| 79 |
"vocab_size": 151552
|
| 80 |
+
}
|
model-00001-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e7b2bcc69816d48bdf35fc64f0355b5104e0039d2178f61fea8989d81904e08b
|
| 3 |
+
size 4999471048
|
model-00002-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46321ac0ede036ce4363703692b38cf7a1164c0fecd1f1ea41bd8b110b7f7035
|
| 3 |
+
size 4998300240
|
model-00003-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9fcce1e7dc93e4ddf79e0684b6d94257e7fee546b13d33c0f96d83621461b9cc
|
| 3 |
+
size 4997280760
|
model-00004-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:347052e23801adabcaaadf48c808804b5c868f72e0f776887ed1a2f23418b343
|
| 3 |
+
size 4998302816
|
model-00005-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dbaab130517ff7b7fedd42af62fd6cdd6b88739294969eb99691a019c1c0e262
|
| 3 |
+
size 4997284480
|
model-00006-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0b4624f63de0ac57136e51790888142cf0f18cbcfca2bd390c24dff8fe16e0ec
|
| 3 |
+
size 4998303640
|
model-00007-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:41e511f237b34f919c8d8c1e75698f5c0317609ce80f4d03efd5cec05e436d68
|
| 3 |
+
size 4997284600
|
model-00008-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bee8d3202c0b6d75ae927c72bee9c02174a0647048777d0635373b0162000c09
|
| 3 |
+
size 4998303528
|
model-00009-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f5ab9b2860d51dfee53cf3f424cf16ca04ea25d72147fa2c881121ac3074d3db
|
| 3 |
+
size 4997284712
|
model-00010-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ff44f85b410734972e8d41daf537f8753a406d4bf9b67293240e1497fa659e1d
|
| 3 |
+
size 4998303456
|
model-00011-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b9faac7e2992e1f17e4e573960387ffd4dd0a50a4fceb3087c8c13b5feea549e
|
| 3 |
+
size 4997284832
|
model-00012-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a60f99d2c26c6d7e0db0a87286b6114802e4210621dc12228c989a0246924db
|
| 3 |
+
size 4998303408
|
model-00013-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cbebf09bc507e43395cb106bccec978ea6c57801071d80b440406815d97f69a
|
| 3 |
+
size 4998303984
|
model-00014-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b62048e5ffc061a30e255a236501d6b0764c6c3b7020572991d1b938e059f20
|
| 3 |
+
size 4997284256
|
model-00015-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ffc9ad660a751c10bb1e5700193b93f90d962e0d127c3a6daf233085f6f65ab
|
| 3 |
+
size 4998303864
|
model-00016-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c35043bff000286afaa7cdfd607a8739f9ce53340d843e532b7ec85aafc1109
|
| 3 |
+
size 4997284376
|
model-00017-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0a9a820ac78fdde795c4378f4a43032e02e2beebd32a8f859318c418fc9a0219
|
| 3 |
+
size 4998303752
|
model-00018-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d7a918bd5c40b5a130fafe54347f8b9d26151a960dc1ed542175ad288f4c4cc1
|
| 3 |
+
size 4997284488
|
model-00019-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8aa286e5975611d52cd58fd0ade3eb2dc44c093815c858191fe7e60751896055
|
| 3 |
+
size 4998303632
|
model-00020-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d4379ba66ab0bd562e37599a3213a6184eb6e31b43de32267e042925f5d4ecab
|
| 3 |
+
size 4997284608
|
model-00021-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e279032f627c1646cf4ff24bf6f4ebdacbc3c147663a6e592db52a448e48b423
|
| 3 |
+
size 4998303520
|
model-00022-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dcb2941674fbd161c14f510e37a85cf8ce030d7a6088294c9d6e17e39756c682
|
| 3 |
+
size 4997284720
|
model-00023-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:485dc1746278e5b7aaa9ddec6807aec2261c2838c1d0f2331252879a8ba57fa4
|
| 3 |
+
size 4998303456
|
model-00024-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a3f9d5e2419c2d569b65ed0e6c648a3c28a237ec86ba4360b054dbcef045bcb
|
| 3 |
+
size 4997284840
|
model-00025-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08d77fe6861ba4226da422d61bdf27d9dcc3b77acaf3592721dcbabadc6fe008
|
| 3 |
+
size 4998303400
|
model-00026-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c9773b3cf0311d3b645412370e26df556a5811c2c98395b88bee587926e8b8cb
|
| 3 |
+
size 4998303976
|
model-00027-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45b4b57734d3bfaa2006c7f591365312a92deac3703b11c486545702b09a3840
|
| 3 |
+
size 4997284264
|
model-00028-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:02ab6a0fe1da903f69ea8c51e8657560036eabf2b22c07293d03696f83b6f815
|
| 3 |
+
size 4998303856
|
model-00029-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:25e9cd3dc3feb967804ac140f6a9062e675326dd4e855a13e6116a018a30f721
|
| 3 |
+
size 4997284384
|
model-00030-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca401ce3e94a62ec419536857c3a0dd2a22d6fe50ff8ed02d9406e2df87af07b
|
| 3 |
+
size 4998303744
|
model-00031-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8e9cc10ccc62c247a84d544a204d5a6a081afab2b57c310a34ee315224828f26
|
| 3 |
+
size 4997284496
|
model-00032-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:72f8455a39b70d36c9a9a8f5aa700b6336af558bf08494870031bd5fb0504732
|
| 3 |
+
size 4998303624
|
model-00033-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec641831537c5b883d06c4c6e42b32104d0ff96c385b30791ae8212d6fd4f2f4
|
| 3 |
+
size 4997284616
|
model-00034-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2add5e53c6269a7e04d5918faf90ae7729e8e441948c2d653abd4590b7ab83c2
|
| 3 |
+
size 4998303504
|
model-00035-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb3338fa36ad496b86950f6109c22d04b308845f5d75f8fd40fdc9ebd3de3456
|
| 3 |
+
size 4997284736
|
model-00036-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:251a1db220cead58fa9f7efe15ead5a8e22f1a6063446d3d03d4d63186038d9a
|
| 3 |
+
size 4998303456
|
model-00037-of-00037.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1216c4476e72be10cf7313494b311053789133c54afbe2835d47c7931548aae8
|
| 3 |
+
size 4419730336
|
model.safetensors.index.json
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e82645b7359e97d49c9a0918a4d765dee570aafb41168b1a8aedeaf9b1db898f
|
| 3 |
+
size 12668756
|
recipe.yaml
CHANGED
|
@@ -1,28 +1,9 @@
|
|
| 1 |
default_stage:
|
| 2 |
default_modifiers:
|
| 3 |
GPTQModifier:
|
| 4 |
-
config_groups:
|
| 5 |
-
group_0:
|
| 6 |
-
targets: [Linear]
|
| 7 |
-
weights:
|
| 8 |
-
num_bits: 4
|
| 9 |
-
type: int
|
| 10 |
-
symmetric: true
|
| 11 |
-
group_size: 128
|
| 12 |
-
strategy: group
|
| 13 |
-
block_structure: null
|
| 14 |
-
dynamic: false
|
| 15 |
-
actorder: !!python/object/apply:compressed_tensors.quantization.quant_args.ActivationOrdering [
|
| 16 |
-
static]
|
| 17 |
-
scale_dtype: null
|
| 18 |
-
zp_dtype: null
|
| 19 |
-
observer: memoryless_minmax
|
| 20 |
-
observer_kwargs: {}
|
| 21 |
-
input_activations: null
|
| 22 |
-
output_activations: null
|
| 23 |
-
format: null
|
| 24 |
targets: [Linear]
|
| 25 |
-
ignore: [lm_head
|
|
|
|
| 26 |
block_size: 128
|
| 27 |
dampening_frac: 0.01
|
| 28 |
actorder: static
|
|
|
|
| 1 |
default_stage:
|
| 2 |
default_modifiers:
|
| 3 |
GPTQModifier:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4 |
targets: [Linear]
|
| 5 |
+
ignore: [lm_head]
|
| 6 |
+
scheme: W4A16
|
| 7 |
block_size: 128
|
| 8 |
dampening_frac: 0.01
|
| 9 |
actorder: static
|