ronantakizawa committed on
Commit
83bf26a
·
verified ·
1 Parent(s): 3b9ff18

Add quantization configuration metadata

Browse files
Files changed (1) hide show
  1. quantization_config.json +22 -0
quantization_config.json ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "quant_method": "gptq",
3
+ "bits": 4,
4
+ "group_size": 128,
5
+ "desc_act": true,
6
+ "sym": true,
7
+ "dataset": "lmms-lab/flickr30k",
8
+ "calibration_samples": 256,
9
+ "model_seqlen": 2048,
10
+ "block_name_to_quantize": "LlamaDecoderLayer",
11
+ "module_name_preceding_first_block": [
12
+ "model.vision_model",
13
+ "model.connector"
14
+ ],
15
+ "quantization_tool": "llm-compressor",
16
+ "preserved_components": [
17
+ "vision_model",
18
+ "vision_tower",
19
+ "connector",
20
+ "lm_head"
21
+ ]
22
+ }