Delete .ipynb_checkpoints

Browse files

Files changed (2) hide show

.ipynb_checkpoints/README-checkpoint.md +0 -15
.ipynb_checkpoints/config-checkpoint.json +0 -114

.ipynb_checkpoints/README-checkpoint.md DELETED Viewed

@@ -1,15 +0,0 @@
----
-license: apache-2.0
-base_model:
-- allenai/Olmo-3-7B-Think
-tags:
-- llmcompressor
----
-This is [allenai/Olmo-3-7B-Think](https://huggingface.co/allenai/Olmo-3-7B-Think) quantized with [LLM Compressor](https://github.com/vllm-project/llm-compressor) using SmoothQuant (W8A8). The model is compatible with vLLM (tested with v0.11.2). Tested on an RTX 4090.
-- **Developed by:** [The Kaitchup](https://kaitchup.substack.com/)
-- **License:** Apache 2.0
-## How to Support My Work
-Subscribe to [The Kaitchup](https://kaitchup.substack.com/subscribe). Subscriptions help me a lot to keep quantizing and evaluating models for free. Alternatively, you can "[buy me a kofi](https://ko-fi.com/bnjmn_marie)".

.ipynb_checkpoints/config-checkpoint.json DELETED Viewed

@@ -1,114 +0,0 @@
-{
-  "architectures": [
-    "Olmo3ForCausalLM"
-  ],
-  "attention_bias": false,
-  "attention_dropout": 0.0,
-  "dtype": "bfloat16",
-  "eos_token_id": 100257,
-  "hidden_act": "silu",
-  "hidden_size": 4096,
-  "initializer_range": 0.02,
-  "intermediate_size": 11008,
-  "layer_types": [
-    "sliding_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "full_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "full_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "full_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "full_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "full_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "full_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "full_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "sliding_attention",
-    "full_attention"
-  ],
-  "max_position_embeddings": 65536,
-  "model_type": "olmo3",
-  "num_attention_heads": 32,
-  "num_hidden_layers": 32,
-  "num_key_value_heads": 32,
-  "pad_token_id": 100277,
-  "quantization_config": {
-    "config_groups": {
-      "group_0": {
-        "format": "int-quantized",
-        "input_activations": {
-          "actorder": null,
-          "block_structure": null,
-          "dynamic": true,
-          "group_size": null,
-          "num_bits": 8,
-          "observer": null,
-          "observer_kwargs": {},
-          "strategy": "token",
-          "symmetric": true,
-          "type": "int"
-        },
-        "output_activations": null,
-        "targets": [
-          "Linear"
-        ],
-        "weights": {
-          "actorder": null,
-          "block_structure": null,
-          "dynamic": false,
-          "group_size": null,
-          "num_bits": 8,
-          "observer": "minmax",
-          "observer_kwargs": {},
-          "strategy": "channel",
-          "symmetric": true,
-          "type": "int"
-        }
-      }
-    },
-    "format": "int-quantized",
-    "global_compression_ratio": null,
-    "ignore": [
-      "lm_head"
-    ],
-    "kv_cache_scheme": null,
-    "quant_method": "compressed-tensors",
-    "quantization_status": "compressed",
-    "sparsity_config": {},
-    "transform_config": {},
-    "version": "0.12.3.a20251114"
-  },
-  "rms_norm_eps": 1e-06,
-  "rope_scaling": {
-    "attention_factor": 1.2079441541679836,
-    "beta_fast": 32,
-    "beta_slow": 1,
-    "factor": 8.0,
-    "original_max_position_embeddings": 8192,
-    "rope_type": "yarn"
-  },
-  "rope_theta": 500000,
-  "sliding_window": 4096,
-  "tie_word_embeddings": false,
-  "transformers_version": "4.57.3",
-  "use_cache": false,
-  "vocab_size": 100278
-}