Thomaschtl committed on
Commit
898e755
·
verified ·
1 Parent(s): 0f6fc6d

Upload quantization_info.json with huggingface_hub

Browse files
Files changed (1) hide show
  1. quantization_info.json +19 -0
quantization_info.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_name": "luca-deandrea/MNLP_M3_mcqa_model",
3
+ "quantization_method": "bitsandbytes",
4
+ "config_name": "bnb_4bit_nf4",
5
+ "description": "4-bit NF4 with double quantization",
6
+ "expected_compression": "~8x",
7
+ "quantization_config": {
8
+ "load_in_4bit": true,
9
+ "load_in_8bit": false,
10
+ "bnb_4bit_quant_type": "nf4",
11
+ "bnb_4bit_use_double_quant": true,
12
+ "bnb_4bit_compute_dtype": "torch.bfloat16",
13
+ "llm_int8_threshold": 6.0
14
+ },
15
+ "timestamp": "2025-06-10 21:31:13",
16
+ "loading_time_seconds": 10.503286600112915,
17
+ "memory_usage_gb": 0.5012297630310059,
18
+ "test_generation": "Hello, I am a 16-year-old girl. I have"
19
+ }