File size: 2,171 Bytes
e9e21d9 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 |
{
"producer": {
"name": "modelopt",
"version": "0.35.1"
},
"quantization": {
"quant_algo": "NVFP4",
"kv_cache_quant_algo": null,
"group_size": 16,
"exclude_modules": [
"head",
"layers.0.attn*",
"layers.1.attn*",
"layers.10.attn*",
"layers.11.attn*",
"layers.12.attn*",
"layers.13.attn*",
"layers.14.attn*",
"layers.15.attn*",
"layers.16.attn*",
"layers.17.attn*",
"layers.18.attn*",
"layers.19.attn*",
"layers.2.attn*",
"layers.20.attn*",
"layers.21.attn*",
"layers.22.attn*",
"layers.23.attn*",
"layers.24.attn*",
"layers.25.attn*",
"layers.26.attn*",
"layers.27.attn*",
"layers.28.attn*",
"layers.29.attn*",
"layers.3.attn*",
"layers.30.attn*",
"layers.31.attn*",
"layers.32.attn*",
"layers.33.attn*",
"layers.34.attn*",
"layers.35.attn*",
"layers.36.attn*",
"layers.37.attn*",
"layers.38.attn*",
"layers.39.attn*",
"layers.4.attn*",
"layers.40.attn*",
"layers.41.attn*",
"layers.42.attn*",
"layers.43.attn*",
"layers.44.attn*",
"layers.45.attn*",
"layers.46.attn*",
"layers.47.attn*",
"layers.48.attn*",
"layers.49.attn*",
"layers.5.attn*",
"layers.50.attn*",
"layers.51.attn*",
"layers.52.attn*",
"layers.53.attn*",
"layers.54.attn*",
"layers.55.attn*",
"layers.56.attn*",
"layers.57.attn*",
"layers.58.attn*",
"layers.59.attn*",
"layers.6.attn*",
"layers.60.attn*",
"layers.7.attn*",
"layers.8.attn*",
"layers.9.attn*",
"layers.61*"
]
}
} |