Thomaschtl
/

4bit_fp4

+{
+  "model_name": "Qwen/Qwen3-0.6B-Base",
+  "quantization_method": "bitsandbytes",
+  "config_name": "bnb_4bit_fp4",
+  "description": "4-bit FP4 with double quantization",
+  "expected_compression": "~8x",
+  "quantization_config": {
+    "load_in_4bit": true,
+    "load_in_8bit": false,
+    "bnb_4bit_quant_type": "fp4",
+    "bnb_4bit_use_double_quant": true,
+    "bnb_4bit_compute_dtype": "torch.float16",
+    "llm_int8_threshold": 6.0
+  },
+  "timestamp": "2025-06-10 21:17:24",
+  "loading_time_seconds": 4.421220541000366,
+  "memory_usage_gb": 0.5096735954284668,
+  "test_generation": "Hello, I am a student in the field of computer science and I"
+}