diff --git a/metadata.json b/metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..990dd96f91d99211157cca0e1ba3ed2f1d6a3682 --- /dev/null +++ b/metadata.json @@ -0,0 +1,1148 @@ +{ + "model_type": "llama", + "num_layers": 224, + "precisions": [ + "FP8_Dynamic", + "FP8_Block", + "NVFP4" + ], + "precision_configs": { + "FP8_Dynamic": { + "effective_bits": 8.0, + "num_bits": 8, + "strategy": "channel" + }, + "FP8_Block": { + "effective_bits": 8.0, + "num_bits": 8, + "strategy": "block" + }, + "NVFP4": { + "effective_bits": 4.0, + "num_bits": 4, + "strategy": "tensor_group" + } + }, + "layer_paths": { + "model.layers.0.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.0.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.0.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.0.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.0.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.0.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.0.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.0.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.0.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.0.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.0.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.0.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.0.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.0.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.0.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.0.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.0.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.0.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.0.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.0.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.0.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.0.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.0.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.0.mlp.up_proj/NVFP4.pth" + }, + "model.layers.0.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.0.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.0.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.0.mlp.down_proj/NVFP4.pth" + }, + "model.layers.1.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.1.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.1.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.1.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.1.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.1.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.1.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.1.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.1.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.1.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.1.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.1.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.1.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.1.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.1.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.1.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.1.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.1.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.1.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.1.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.1.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.1.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.1.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.1.mlp.up_proj/NVFP4.pth" + }, + "model.layers.1.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.1.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.1.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.1.mlp.down_proj/NVFP4.pth" + }, + "model.layers.2.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.2.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.2.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.2.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.2.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.2.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.2.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.2.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.2.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.2.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.2.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.2.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.2.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.2.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.2.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.2.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.2.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.2.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.2.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.2.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.2.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.2.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.2.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.2.mlp.up_proj/NVFP4.pth" + }, + "model.layers.2.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.2.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.2.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.2.mlp.down_proj/NVFP4.pth" + }, + "model.layers.3.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.3.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.3.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.3.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.3.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.3.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.3.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.3.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.3.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.3.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.3.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.3.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.3.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.3.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.3.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.3.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.3.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.3.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.3.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.3.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.3.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.3.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.3.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.3.mlp.up_proj/NVFP4.pth" + }, + "model.layers.3.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.3.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.3.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.3.mlp.down_proj/NVFP4.pth" + }, + "model.layers.4.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.4.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.4.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.4.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.4.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.4.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.4.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.4.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.4.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.4.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.4.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.4.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.4.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.4.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.4.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.4.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.4.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.4.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.4.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.4.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.4.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.4.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.4.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.4.mlp.up_proj/NVFP4.pth" + }, + "model.layers.4.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.4.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.4.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.4.mlp.down_proj/NVFP4.pth" + }, + "model.layers.5.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.5.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.5.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.5.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.5.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.5.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.5.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.5.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.5.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.5.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.5.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.5.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.5.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.5.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.5.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.5.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.5.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.5.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.5.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.5.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.5.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.5.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.5.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.5.mlp.up_proj/NVFP4.pth" + }, + "model.layers.5.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.5.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.5.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.5.mlp.down_proj/NVFP4.pth" + }, + "model.layers.6.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.6.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.6.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.6.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.6.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.6.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.6.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.6.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.6.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.6.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.6.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.6.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.6.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.6.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.6.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.6.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.6.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.6.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.6.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.6.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.6.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.6.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.6.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.6.mlp.up_proj/NVFP4.pth" + }, + "model.layers.6.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.6.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.6.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.6.mlp.down_proj/NVFP4.pth" + }, + "model.layers.7.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.7.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.7.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.7.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.7.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.7.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.7.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.7.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.7.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.7.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.7.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.7.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.7.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.7.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.7.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.7.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.7.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.7.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.7.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.7.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.7.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.7.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.7.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.7.mlp.up_proj/NVFP4.pth" + }, + "model.layers.7.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.7.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.7.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.7.mlp.down_proj/NVFP4.pth" + }, + "model.layers.8.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.8.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.8.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.8.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.8.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.8.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.8.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.8.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.8.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.8.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.8.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.8.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.8.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.8.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.8.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.8.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.8.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.8.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.8.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.8.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.8.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.8.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.8.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.8.mlp.up_proj/NVFP4.pth" + }, + "model.layers.8.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.8.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.8.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.8.mlp.down_proj/NVFP4.pth" + }, + "model.layers.9.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.9.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.9.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.9.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.9.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.9.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.9.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.9.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.9.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.9.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.9.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.9.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.9.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.9.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.9.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.9.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.9.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.9.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.9.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.9.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.9.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.9.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.9.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.9.mlp.up_proj/NVFP4.pth" + }, + "model.layers.9.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.9.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.9.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.9.mlp.down_proj/NVFP4.pth" + }, + "model.layers.10.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.10.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.10.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.10.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.10.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.10.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.10.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.10.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.10.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.10.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.10.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.10.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.10.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.10.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.10.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.10.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.10.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.10.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.10.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.10.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.10.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.10.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.10.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.10.mlp.up_proj/NVFP4.pth" + }, + "model.layers.10.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.10.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.10.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.10.mlp.down_proj/NVFP4.pth" + }, + "model.layers.11.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.11.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.11.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.11.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.11.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.11.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.11.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.11.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.11.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.11.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.11.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.11.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.11.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.11.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.11.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.11.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.11.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.11.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.11.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.11.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.11.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.11.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.11.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.11.mlp.up_proj/NVFP4.pth" + }, + "model.layers.11.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.11.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.11.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.11.mlp.down_proj/NVFP4.pth" + }, + "model.layers.12.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.12.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.12.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.12.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.12.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.12.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.12.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.12.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.12.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.12.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.12.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.12.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.12.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.12.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.12.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.12.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.12.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.12.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.12.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.12.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.12.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.12.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.12.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.12.mlp.up_proj/NVFP4.pth" + }, + "model.layers.12.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.12.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.12.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.12.mlp.down_proj/NVFP4.pth" + }, + "model.layers.13.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.13.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.13.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.13.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.13.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.13.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.13.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.13.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.13.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.13.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.13.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.13.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.13.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.13.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.13.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.13.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.13.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.13.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.13.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.13.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.13.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.13.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.13.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.13.mlp.up_proj/NVFP4.pth" + }, + "model.layers.13.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.13.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.13.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.13.mlp.down_proj/NVFP4.pth" + }, + "model.layers.14.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.14.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.14.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.14.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.14.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.14.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.14.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.14.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.14.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.14.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.14.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.14.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.14.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.14.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.14.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.14.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.14.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.14.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.14.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.14.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.14.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.14.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.14.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.14.mlp.up_proj/NVFP4.pth" + }, + "model.layers.14.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.14.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.14.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.14.mlp.down_proj/NVFP4.pth" + }, + "model.layers.15.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.15.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.15.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.15.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.15.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.15.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.15.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.15.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.15.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.15.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.15.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.15.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.15.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.15.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.15.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.15.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.15.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.15.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.15.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.15.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.15.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.15.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.15.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.15.mlp.up_proj/NVFP4.pth" + }, + "model.layers.15.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.15.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.15.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.15.mlp.down_proj/NVFP4.pth" + }, + "model.layers.16.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.16.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.16.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.16.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.16.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.16.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.16.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.16.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.16.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.16.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.16.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.16.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.16.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.16.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.16.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.16.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.16.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.16.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.16.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.16.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.16.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.16.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.16.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.16.mlp.up_proj/NVFP4.pth" + }, + "model.layers.16.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.16.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.16.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.16.mlp.down_proj/NVFP4.pth" + }, + "model.layers.17.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.17.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.17.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.17.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.17.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.17.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.17.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.17.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.17.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.17.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.17.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.17.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.17.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.17.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.17.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.17.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.17.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.17.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.17.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.17.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.17.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.17.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.17.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.17.mlp.up_proj/NVFP4.pth" + }, + "model.layers.17.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.17.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.17.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.17.mlp.down_proj/NVFP4.pth" + }, + "model.layers.18.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.18.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.18.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.18.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.18.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.18.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.18.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.18.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.18.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.18.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.18.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.18.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.18.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.18.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.18.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.18.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.18.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.18.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.18.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.18.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.18.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.18.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.18.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.18.mlp.up_proj/NVFP4.pth" + }, + "model.layers.18.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.18.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.18.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.18.mlp.down_proj/NVFP4.pth" + }, + "model.layers.19.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.19.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.19.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.19.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.19.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.19.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.19.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.19.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.19.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.19.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.19.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.19.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.19.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.19.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.19.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.19.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.19.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.19.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.19.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.19.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.19.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.19.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.19.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.19.mlp.up_proj/NVFP4.pth" + }, + "model.layers.19.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.19.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.19.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.19.mlp.down_proj/NVFP4.pth" + }, + "model.layers.20.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.20.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.20.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.20.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.20.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.20.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.20.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.20.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.20.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.20.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.20.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.20.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.20.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.20.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.20.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.20.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.20.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.20.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.20.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.20.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.20.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.20.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.20.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.20.mlp.up_proj/NVFP4.pth" + }, + "model.layers.20.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.20.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.20.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.20.mlp.down_proj/NVFP4.pth" + }, + "model.layers.21.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.21.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.21.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.21.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.21.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.21.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.21.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.21.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.21.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.21.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.21.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.21.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.21.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.21.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.21.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.21.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.21.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.21.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.21.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.21.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.21.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.21.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.21.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.21.mlp.up_proj/NVFP4.pth" + }, + "model.layers.21.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.21.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.21.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.21.mlp.down_proj/NVFP4.pth" + }, + "model.layers.22.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.22.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.22.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.22.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.22.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.22.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.22.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.22.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.22.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.22.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.22.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.22.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.22.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.22.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.22.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.22.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.22.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.22.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.22.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.22.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.22.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.22.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.22.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.22.mlp.up_proj/NVFP4.pth" + }, + "model.layers.22.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.22.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.22.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.22.mlp.down_proj/NVFP4.pth" + }, + "model.layers.23.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.23.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.23.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.23.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.23.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.23.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.23.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.23.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.23.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.23.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.23.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.23.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.23.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.23.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.23.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.23.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.23.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.23.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.23.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.23.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.23.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.23.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.23.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.23.mlp.up_proj/NVFP4.pth" + }, + "model.layers.23.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.23.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.23.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.23.mlp.down_proj/NVFP4.pth" + }, + "model.layers.24.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.24.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.24.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.24.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.24.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.24.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.24.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.24.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.24.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.24.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.24.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.24.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.24.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.24.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.24.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.24.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.24.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.24.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.24.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.24.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.24.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.24.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.24.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.24.mlp.up_proj/NVFP4.pth" + }, + "model.layers.24.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.24.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.24.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.24.mlp.down_proj/NVFP4.pth" + }, + "model.layers.25.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.25.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.25.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.25.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.25.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.25.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.25.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.25.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.25.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.25.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.25.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.25.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.25.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.25.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.25.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.25.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.25.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.25.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.25.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.25.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.25.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.25.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.25.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.25.mlp.up_proj/NVFP4.pth" + }, + "model.layers.25.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.25.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.25.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.25.mlp.down_proj/NVFP4.pth" + }, + "model.layers.26.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.26.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.26.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.26.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.26.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.26.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.26.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.26.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.26.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.26.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.26.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.26.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.26.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.26.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.26.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.26.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.26.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.26.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.26.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.26.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.26.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.26.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.26.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.26.mlp.up_proj/NVFP4.pth" + }, + "model.layers.26.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.26.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.26.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.26.mlp.down_proj/NVFP4.pth" + }, + "model.layers.27.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.27.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.27.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.27.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.27.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.27.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.27.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.27.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.27.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.27.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.27.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.27.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.27.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.27.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.27.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.27.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.27.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.27.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.27.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.27.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.27.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.27.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.27.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.27.mlp.up_proj/NVFP4.pth" + }, + "model.layers.27.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.27.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.27.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.27.mlp.down_proj/NVFP4.pth" + }, + "model.layers.28.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.28.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.28.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.28.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.28.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.28.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.28.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.28.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.28.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.28.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.28.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.28.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.28.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.28.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.28.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.28.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.28.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.28.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.28.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.28.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.28.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.28.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.28.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.28.mlp.up_proj/NVFP4.pth" + }, + "model.layers.28.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.28.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.28.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.28.mlp.down_proj/NVFP4.pth" + }, + "model.layers.29.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.29.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.29.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.29.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.29.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.29.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.29.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.29.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.29.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.29.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.29.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.29.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.29.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.29.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.29.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.29.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.29.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.29.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.29.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.29.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.29.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.29.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.29.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.29.mlp.up_proj/NVFP4.pth" + }, + "model.layers.29.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.29.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.29.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.29.mlp.down_proj/NVFP4.pth" + }, + "model.layers.30.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.30.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.30.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.30.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.30.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.30.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.30.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.30.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.30.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.30.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.30.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.30.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.30.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.30.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.30.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.30.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.30.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.30.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.30.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.30.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.30.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.30.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.30.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.30.mlp.up_proj/NVFP4.pth" + }, + "model.layers.30.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.30.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.30.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.30.mlp.down_proj/NVFP4.pth" + }, + "model.layers.31.self_attn.q_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.31.self_attn.q_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.31.self_attn.q_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.31.self_attn.q_proj/NVFP4.pth" + }, + "model.layers.31.self_attn.k_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.31.self_attn.k_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.31.self_attn.k_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.31.self_attn.k_proj/NVFP4.pth" + }, + "model.layers.31.self_attn.v_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.31.self_attn.v_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.31.self_attn.v_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.31.self_attn.v_proj/NVFP4.pth" + }, + "model.layers.31.self_attn.o_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.31.self_attn.o_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.31.self_attn.o_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.31.self_attn.o_proj/NVFP4.pth" + }, + "model.layers.31.mlp.gate_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.31.mlp.gate_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.31.mlp.gate_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.31.mlp.gate_proj/NVFP4.pth" + }, + "model.layers.31.mlp.up_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.31.mlp.up_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.31.mlp.up_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.31.mlp.up_proj/NVFP4.pth" + }, + "model.layers.31.mlp.down_proj": { + "FP8_Dynamic": "quantized_layers/model.layers.31.mlp.down_proj/FP8_Dynamic.pth", + "FP8_Block": "quantized_layers/model.layers.31.mlp.down_proj/FP8_Block.pth", + "NVFP4": "quantized_layers/model.layers.31.mlp.down_proj/NVFP4.pth" + } + } +} \ No newline at end of file diff --git a/model.layers.0.mlp.down_proj/FP8_Block.pth b/model.layers.0.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..8ec89053ec6bc95e3be4bd1d49b4d84d9b03ff5d --- /dev/null +++ b/model.layers.0.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39a5b2065a072a24494f7230e390a4e775adb84cb6655cba6eddd1a5486d11b5 +size 117442359 diff --git a/model.layers.0.mlp.down_proj/FP8_Dynamic.pth b/model.layers.0.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..114dec2ed71ecfd073f03bc1b2d355b5a2eb4c77 --- /dev/null +++ b/model.layers.0.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58405ec430978bbe2082b7569c8377c06af37f9ebf4fba8800202271348a8613 +size 117442373 diff --git a/model.layers.0.mlp.down_proj/NVFP4.pth b/model.layers.0.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..d1cc3f823b9493d2a6ec7b4dc744138d56fde497 --- /dev/null +++ b/model.layers.0.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f60f0b99c635540e979975831899c5ea3119fbf3ba4f37c6a45664952ac85f58 +size 117442267 diff --git a/model.layers.0.mlp.gate_proj/FP8_Block.pth b/model.layers.0.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..b332d3754fab65276d5d4d81b7b6f9632c2ac65e --- /dev/null +++ b/model.layers.0.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d95f99af91d3bc222e8c45cdcf037e5b65f5c023aeb2bdb20f2b1fddbb3c8ef +size 117442359 diff --git a/model.layers.0.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.0.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b4c626bd6b4bf5a902ee28b5f01f2833c21e966b --- /dev/null +++ b/model.layers.0.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f94b79a766c65795496d41e927ec68c67baf4e1f4ece95faa464e26bbc65eae +size 117442373 diff --git a/model.layers.0.mlp.gate_proj/NVFP4.pth b/model.layers.0.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..652002f64318218ed1813dbfec554e35d5905e66 --- /dev/null +++ b/model.layers.0.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a429c738073d528249ca9eab09e1fb41841e2b61f0cc4de39e75e5a9e9f40de +size 117442267 diff --git a/model.layers.0.mlp.up_proj/FP8_Block.pth b/model.layers.0.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..8d5860fb108dc184440ac1ce45547fe4ef32a9c7 --- /dev/null +++ b/model.layers.0.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:974c4b0c5dd003fe125111164643d5a1fdd254a19d915157dea2b1cecb2d6edf +size 117442359 diff --git a/model.layers.0.mlp.up_proj/FP8_Dynamic.pth b/model.layers.0.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..e9feb88f1651028d7d6a17def61761ba21ffe1ef --- /dev/null +++ b/model.layers.0.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2085117fc6b0db4d3f29d49cbc56139e315d4aa0a4f662094cf32a67046eefb4 +size 117442373 diff --git a/model.layers.0.mlp.up_proj/NVFP4.pth b/model.layers.0.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..665dab7634d1e079417d4c5bfa5fdf64099c2895 --- /dev/null +++ b/model.layers.0.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e057693b6bfce3c6726e98a686932b13737118696dc56174c14c7e2246aaad7b +size 117442267 diff --git a/model.layers.0.self_attn.k_proj/FP8_Block.pth b/model.layers.0.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..2006e57d49b227cbb763909692aaeb23254da34b --- /dev/null +++ b/model.layers.0.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b5faf6367c3703c1593c8785ad143270d80914768436fe1424318ff55687ac +size 8390455 diff --git a/model.layers.0.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.0.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..3883c58db7c6c0b050d047c2c9c065cbf381d682 --- /dev/null +++ b/model.layers.0.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97bcdf10f857baf6ff5529cf2d1e5a27bbc678d97997b2900320c5de74742774 +size 8390469 diff --git a/model.layers.0.self_attn.k_proj/NVFP4.pth b/model.layers.0.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..4b9603becf773f22a292aa37b6097ecc107c1b48 --- /dev/null +++ b/model.layers.0.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f65698d124b7c1d181dca6162711c843ba4f5d490585c20d62c83b516b66794 +size 8390363 diff --git a/model.layers.0.self_attn.o_proj/FP8_Block.pth b/model.layers.0.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..57de429c5fdd1d5df72773b9d4f6513cc9e2123b --- /dev/null +++ b/model.layers.0.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:123f6080593d2441f5c0910bb97ce24cfa01404d46041fe6c3aeee75c5a8dbc4 +size 33556279 diff --git a/model.layers.0.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.0.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..07d00eb1412fa5828d1df827cf6a8067a45905d8 --- /dev/null +++ b/model.layers.0.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f04130a870297081a00731315c3d64410edfed3c8fb797ae48ed8a07fe53e5c9 +size 33556293 diff --git a/model.layers.0.self_attn.o_proj/NVFP4.pth b/model.layers.0.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..fe31309f0098f5bcaeec47f2c4d236441a7951c0 --- /dev/null +++ b/model.layers.0.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:060385094a6f336853a0aa25e26bed26bd1005b3690c02d13677719bcfcd3bae +size 33556187 diff --git a/model.layers.0.self_attn.q_proj/FP8_Block.pth b/model.layers.0.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..199f4a05ddd5ccdf37b132d77bde427465900328 --- /dev/null +++ b/model.layers.0.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c4d2e42ef16c881782ac43d174d99416d6b20265ecb3101cbfa12ccacf23b40 +size 33556279 diff --git a/model.layers.0.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.0.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..9a71a88595dc232ea81eb9969f60783faee1c057 --- /dev/null +++ b/model.layers.0.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d2b6b7c0cb0d3c16a86287bc68154fc27e0e318d60173223bef9c4ef03ead93 +size 33556293 diff --git a/model.layers.0.self_attn.q_proj/NVFP4.pth b/model.layers.0.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..3acc4f5b0426c5ebff6070ab0d8c3a3f8b76cfd1 --- /dev/null +++ b/model.layers.0.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74ac207a12365392d5b70ae762738c96cca92fe4c766975986d11115d0054914 +size 33556187 diff --git a/model.layers.0.self_attn.v_proj/FP8_Block.pth b/model.layers.0.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..6d2c1299456aa0a6660d0ae999b58b696d2c6217 --- /dev/null +++ b/model.layers.0.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa98789413d14912736ab2c1cc8d0400bc7d2d7f2341bb2fd2221a5500a9bd35 +size 8390455 diff --git a/model.layers.0.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.0.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..81e94b79d19321fafa136b5e92df70c96c665e95 --- /dev/null +++ b/model.layers.0.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d24a54c4e7d657f679d85fc4cbacf5fd0b47ccb316d1cc52b0787efba278b6e0 +size 8390469 diff --git a/model.layers.0.self_attn.v_proj/NVFP4.pth b/model.layers.0.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..44f9440e7d7fe949cfd652a9dbec4fb3ad8e15e9 --- /dev/null +++ b/model.layers.0.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d04a06a5605a533a12ee5f2096efe79b258af286e3da28bf6326a6ada797f5bb +size 8390363 diff --git a/model.layers.1.mlp.down_proj/FP8_Block.pth b/model.layers.1.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..528160b3edb0ea41dd87b3fe548b785330609ba9 --- /dev/null +++ b/model.layers.1.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97f4c3356c72d615bf69ae80261279c2d844a38c357fb42fd91ecfe2f0efc076 +size 117442359 diff --git a/model.layers.1.mlp.down_proj/FP8_Dynamic.pth b/model.layers.1.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..0de16136f3daf90367a8a109da5b741d00563780 --- /dev/null +++ b/model.layers.1.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d1dfbb1d48975bb896b031956c3862ac6dc00006bd91e1793f5c4aa1464d250 +size 117442373 diff --git a/model.layers.1.mlp.down_proj/NVFP4.pth b/model.layers.1.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..01faae512fa0fc4c41f3244ef2080f0c45a50ad8 --- /dev/null +++ b/model.layers.1.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76269fe3798f0aded6158eafbc67deff240ae696519e0de3292ca9916048523a +size 117442267 diff --git a/model.layers.1.mlp.gate_proj/FP8_Block.pth b/model.layers.1.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..ee9a1278bd6f2668f13524b88293aa7a46b16061 --- /dev/null +++ b/model.layers.1.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c124aa5b52a855ee5c76ec910df3124dfccbccb14a7ec39a11cc2d07a36bfc5 +size 117442359 diff --git a/model.layers.1.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.1.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b7b13ccee489572c6f13329a67c55a76d8b58b0a --- /dev/null +++ b/model.layers.1.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5ac3b7ca16de58b3ac5e8ef9712fd52687ab7d426a18266019f353a497ac1d3 +size 117442373 diff --git a/model.layers.1.mlp.gate_proj/NVFP4.pth b/model.layers.1.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..35c883b730c45f736f4fcaef7fb2c04e6b85266b --- /dev/null +++ b/model.layers.1.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391f675bf9012bcf4af252901e44afb426e599bb9793285312fff518b9409322 +size 117442267 diff --git a/model.layers.1.mlp.up_proj/FP8_Block.pth b/model.layers.1.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..247d137c1b6d1cc3adf92b2ca0ad2a7dcbfca9c7 --- /dev/null +++ b/model.layers.1.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b6e1ac61264e534ed42dfeaba6ecc9c0a7479b5a12a14cf203cd6ebeaff7edb +size 117442359 diff --git a/model.layers.1.mlp.up_proj/FP8_Dynamic.pth b/model.layers.1.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..d07118bf40d6a99c10d7105fb0799cda610c5920 --- /dev/null +++ b/model.layers.1.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2be56c2a9c86205c1decb940b79c025e355875327df3ca5dbf43ec94ee441a7 +size 117442373 diff --git a/model.layers.1.mlp.up_proj/NVFP4.pth b/model.layers.1.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..bcb978e5e8e40a5ba08508e4384a83875db6255a --- /dev/null +++ b/model.layers.1.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b07c43e6b9f63a9b047ecd107148952191bcf2191af7538c6cb4ee424fb6f49 +size 117442267 diff --git a/model.layers.1.self_attn.k_proj/FP8_Block.pth b/model.layers.1.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..50876b2fd21dc56e47f4a14577621ed62bb70615 --- /dev/null +++ b/model.layers.1.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c204a8373646eeb212ed55867290449328a2e609f8298a7a9324290e09bab690 +size 8390455 diff --git a/model.layers.1.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.1.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..1f7c86387fac5ee8252768536f88b966ff348910 --- /dev/null +++ b/model.layers.1.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c512b0b0acca91bd0f10f5dfc28678d8e728aaa7d768a855917d17a1d0df84f +size 8390469 diff --git a/model.layers.1.self_attn.k_proj/NVFP4.pth b/model.layers.1.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..ca0cef726692791b016a7bd735b44752857b15b7 --- /dev/null +++ b/model.layers.1.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0abbfc750d622b61806ed375c1da3138c09f86ef1e38af6b8ccf3c2e352ce903 +size 8390363 diff --git a/model.layers.1.self_attn.o_proj/FP8_Block.pth b/model.layers.1.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..7d87b21adb6b6b0e1317886f4a5a6c93f957ebb5 --- /dev/null +++ b/model.layers.1.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a22bcaed6353dbc68bb1d860de5215833f5f6fb4e58561c4b4dc91981afc046 +size 33556279 diff --git a/model.layers.1.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.1.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..c7821750b9a08bcc59bf23e4ec753c7d1eda494e --- /dev/null +++ b/model.layers.1.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f78a75238732ec84ed7cc6d35f3712b86a24559c85cf4d5dc539d2f5cb005be3 +size 33556293 diff --git a/model.layers.1.self_attn.o_proj/NVFP4.pth b/model.layers.1.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..6f7a0e7016f099a2b11a735487c821a2e2fea404 --- /dev/null +++ b/model.layers.1.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3ca3261ec1d6b02dde86ee497f7dfeea3f0bc63934f400eb674391b0f5c9da6 +size 33556187 diff --git a/model.layers.1.self_attn.q_proj/FP8_Block.pth b/model.layers.1.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..1e9c6606a861f33eb9f18c7588d05119949e835c --- /dev/null +++ b/model.layers.1.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5da85ebd784f19349018bd4bb883702d50637e056fd2b7d3f1f311a37c44b0e4 +size 33556279 diff --git a/model.layers.1.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.1.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..a385822e3037f167bced3554333207603cb71f98 --- /dev/null +++ b/model.layers.1.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69d6c090098660296c7e48577d44889f1232764bc035662e7322f526bdc7ed60 +size 33556293 diff --git a/model.layers.1.self_attn.q_proj/NVFP4.pth b/model.layers.1.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..b04be5ebb3dca66ec63e5b4eaff74b515ed7073c --- /dev/null +++ b/model.layers.1.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92bc1756877bef1ccc76df6306ad016d963678fbfc752d35a8b986ef49d31e77 +size 33556187 diff --git a/model.layers.1.self_attn.v_proj/FP8_Block.pth b/model.layers.1.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..905f9a55f15fcaf067bb2f6e34ef4ad6110b1e4f --- /dev/null +++ b/model.layers.1.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:073ede965bda0ca3bc10b1201b8c721d275cbeed6ec54b6754feb815a2171b47 +size 8390455 diff --git a/model.layers.1.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.1.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..34ccfa6d38dcd4a3ea1586165369f2d5ffe93979 --- /dev/null +++ b/model.layers.1.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d2d7b6efd362f1fb64c0d95d3a76ae61231d56bd0b65cc4523861781bd9357a +size 8390469 diff --git a/model.layers.1.self_attn.v_proj/NVFP4.pth b/model.layers.1.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..b8a37d47ac92938bb5eb7ce51f70b45e56596f2e --- /dev/null +++ b/model.layers.1.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c36dd7cf7552779e6a5ea331d9fb76ec342e0661e91b2b3a724fbb4483dbdfe +size 8390363 diff --git a/model.layers.10.mlp.down_proj/FP8_Block.pth b/model.layers.10.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..07799172ed88aa4ffb29c2b28ad690097ab8e853 --- /dev/null +++ b/model.layers.10.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ea3b2d9dfd3c89690ede2337ea42509821a8903056fe5bac9014cb3e41bf5f5 +size 117442359 diff --git a/model.layers.10.mlp.down_proj/FP8_Dynamic.pth b/model.layers.10.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..a6f4433916b4e01a5eb9ddaa42df09823e687de8 --- /dev/null +++ b/model.layers.10.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:416821f070b257ddf155a1ed6ec9fda0a98a14d21051c8c3178d49f48b176cc6 +size 117442373 diff --git a/model.layers.10.mlp.down_proj/NVFP4.pth b/model.layers.10.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..b21ef06b1b3c44cbcad94e346c6f6ae84bf76e30 --- /dev/null +++ b/model.layers.10.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a820fc0fa4abe50f3334ccc2b5c204fa149ef119013769896b9016e4e43da27e +size 117442267 diff --git a/model.layers.10.mlp.gate_proj/FP8_Block.pth b/model.layers.10.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..163b77bfe1c23abc8003d4c22c1c1e94658083b2 --- /dev/null +++ b/model.layers.10.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9b94673fef98d0b627ea4aa1e720f7cd6d5431f3e22a522c2494f120cf1e08e +size 117442359 diff --git a/model.layers.10.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.10.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..f1eef2b93d2fc8734dbfce776956d42cf257d223 --- /dev/null +++ b/model.layers.10.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56d7b4ded6d9efd100d9c265b65bcfa2dc2ef135a21bd706105e598f17131d71 +size 117442373 diff --git a/model.layers.10.mlp.gate_proj/NVFP4.pth b/model.layers.10.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..95b98e59c4236f06205689f545ea5c1038d8d8fc --- /dev/null +++ b/model.layers.10.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039514d63db0496aa1a8067fc5c66199cb28a0ba071be6fe06607bd4c9571a3a +size 117442267 diff --git a/model.layers.10.mlp.up_proj/FP8_Block.pth b/model.layers.10.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..5ad9b65d9d5fdc5d88610eed6e106d1a67febdb0 --- /dev/null +++ b/model.layers.10.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68ec769ec3e170d376cfffdc718475908477aa8115d0e559d3654e52aa1060fd +size 117442359 diff --git a/model.layers.10.mlp.up_proj/FP8_Dynamic.pth b/model.layers.10.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..1d405d9e74a7ff853875ad7ad293f2bba1ea2d83 --- /dev/null +++ b/model.layers.10.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97a6608bc0229c11f69f1eb26482a447f47d1b500b73d7e67d1f1d89245b6f97 +size 117442373 diff --git a/model.layers.10.mlp.up_proj/NVFP4.pth b/model.layers.10.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..6a08955c3c278ef22dbe76e144cc6e04bea9962a --- /dev/null +++ b/model.layers.10.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1439b617bb124c33bd963506d76540d96c4ac9f69fc96521225ce0e96b37f58 +size 117442267 diff --git a/model.layers.10.self_attn.k_proj/FP8_Block.pth b/model.layers.10.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..ec04ea404b7df6d4fc47c0081a774cd32e38ace5 --- /dev/null +++ b/model.layers.10.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c39a4ddb556f1bac5322310f4e74eaf9ebf6044b2aec5b68c1a4bf62aa0cba4 +size 8390455 diff --git a/model.layers.10.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.10.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b1193b09b12a0360c12df6abda715f1800e97f8d --- /dev/null +++ b/model.layers.10.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad080f3f7d1f1682285320c645cd4ed59e9debe127762d3aa21e44530b0c4bc8 +size 8390469 diff --git a/model.layers.10.self_attn.k_proj/NVFP4.pth b/model.layers.10.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..2baed4137e9675ae2432ce189d55aafd9b0f0af8 --- /dev/null +++ b/model.layers.10.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5981533e46d2cb1a7f537eeffdda799e91acd69b673850dcccd76d44a0e6533 +size 8390363 diff --git a/model.layers.10.self_attn.o_proj/FP8_Block.pth b/model.layers.10.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..65667e43ada2068c764d4bcea1e7670c9ddb19fe --- /dev/null +++ b/model.layers.10.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11adab4fc343951d87f8456b7d5755a99f752a90cfa95f3af66bd5471015c12d +size 33556279 diff --git a/model.layers.10.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.10.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..c64ae64fa569b66acdbe0d202b392de8aaa79bc8 --- /dev/null +++ b/model.layers.10.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e51dfe40c52fe3f66b666fa9f6f56d03221471cbed22b13c0f334da1817034a8 +size 33556293 diff --git a/model.layers.10.self_attn.o_proj/NVFP4.pth b/model.layers.10.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..28a09ed4d322f81ed8ba7dec8559acf4e832a71a --- /dev/null +++ b/model.layers.10.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75e0c4963c206cba53c1b381bbf762268afe47a8eefa311753da79c146fa606c +size 33556187 diff --git a/model.layers.10.self_attn.q_proj/FP8_Block.pth b/model.layers.10.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..3ace5d34cc477e017cbfb26fae62126d00245b3e --- /dev/null +++ b/model.layers.10.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4288b8945e8bc480b58f53c0ce080c6f99b6b849f4fe9a4bb18f95fda21c636 +size 33556279 diff --git a/model.layers.10.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.10.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..c6f86d6fb4d9b5bc933c0f57aa885652e5c8e362 --- /dev/null +++ b/model.layers.10.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c34758ccde322fa5448acc099fe7ebb470eece6f3af889b818da76ab23bbd67 +size 33556293 diff --git a/model.layers.10.self_attn.q_proj/NVFP4.pth b/model.layers.10.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..f02123e2f459b9b79988cf048f053b181715fc27 --- /dev/null +++ b/model.layers.10.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01481867ea507cbd0761b0b1692c2b54abf9b735556bc598f88378b78d3a60c4 +size 33556187 diff --git a/model.layers.10.self_attn.v_proj/FP8_Block.pth b/model.layers.10.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..ee7b66fa94ddf54a9c1fe3dbf6affac426f8a31a --- /dev/null +++ b/model.layers.10.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7af54154a01f6d7b551a372d1d9c1e39a18a10d0936f076cfbbfc43275377bac +size 8390455 diff --git a/model.layers.10.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.10.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..7c8a607b8b42e875c414b0decea7807a7fa86b64 --- /dev/null +++ b/model.layers.10.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bf719f1c841b7628ea67c2acaed12d70b47fad3c2a7a2be734c92abc1873549 +size 8390469 diff --git a/model.layers.10.self_attn.v_proj/NVFP4.pth b/model.layers.10.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..a96bf02b9b7dfa313a4cb8b3cd5a71a96decc2a5 --- /dev/null +++ b/model.layers.10.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec7a9c7e03cc66240907333d5131e442acdd70f16879dba87896de54f7379ce9 +size 8390363 diff --git a/model.layers.11.mlp.down_proj/FP8_Block.pth b/model.layers.11.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..ebb63c56c13ac56b782e3bb8685cc39668e64189 --- /dev/null +++ b/model.layers.11.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da5ad0b7445949359149ef53283219bc8f0c9789659c7143228c30c463f88aa6 +size 117442359 diff --git a/model.layers.11.mlp.down_proj/FP8_Dynamic.pth b/model.layers.11.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..723626788a549d47a77747e34386d783f7291be7 --- /dev/null +++ b/model.layers.11.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:225a1598a0d772e8ac8197d86c9c44cd0e0528b24635558044c78e6673aca8a4 +size 117442373 diff --git a/model.layers.11.mlp.down_proj/NVFP4.pth b/model.layers.11.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..0e050634a81a31749a693449c7c493650b8b6e58 --- /dev/null +++ b/model.layers.11.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d4b37da4642c7b85946da52a13d06c94245e1534a98a813cdcad406c3414bc0 +size 117442267 diff --git a/model.layers.11.mlp.gate_proj/FP8_Block.pth b/model.layers.11.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..bc6404ef71561cc66ebb17fb2804cc46c8b65a0c --- /dev/null +++ b/model.layers.11.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e8c427ba9aaca6abdc614261608a08831ed118626caf1d28589721dfd616f75 +size 117442359 diff --git a/model.layers.11.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.11.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..54020cbbd5762d0ac0a8c37565fa8148f281dac2 --- /dev/null +++ b/model.layers.11.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:266e9d279be8fa40586cd9d6ca97a24bb09ec0f58220594565f12818aa706f59 +size 117442373 diff --git a/model.layers.11.mlp.gate_proj/NVFP4.pth b/model.layers.11.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..a65d8359a5291c175caafa1d39e75e57fb0dd942 --- /dev/null +++ b/model.layers.11.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b0f40af169aeaaf3584c3dcd401c0cac909ad385b6cc805dea061a02c1dc4e6 +size 117442267 diff --git a/model.layers.11.mlp.up_proj/FP8_Block.pth b/model.layers.11.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..2cdb07c228ea9b9ba452d44e185868fc331b520e --- /dev/null +++ b/model.layers.11.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8c827a04724f79b57b025b2511277f246c8bb495cb33bdd1cde8265bc95c7b9 +size 117442359 diff --git a/model.layers.11.mlp.up_proj/FP8_Dynamic.pth b/model.layers.11.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b6ea09260df15e600dba5d6cab29baf6d2996493 --- /dev/null +++ b/model.layers.11.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:610d49395805bae6483b2d4e64ba33d0dd5976f1902f2af9ded848a2c2bc7e7a +size 117442373 diff --git a/model.layers.11.mlp.up_proj/NVFP4.pth b/model.layers.11.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..88e0b4c1e0e938bf827cdce0404f5a10582406df --- /dev/null +++ b/model.layers.11.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b83afeb9f5ffb6cf0119143166f4bbc0253a97e2b154b419586dae6d85893eda +size 117442267 diff --git a/model.layers.11.self_attn.k_proj/FP8_Block.pth b/model.layers.11.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..76479684b25176c225a0f8ebd14b856dfbd59115 --- /dev/null +++ b/model.layers.11.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8bf530d13c9f37b662b24742a1e878afd33bc1472f5d4586c5d69695f3bcad5 +size 8390455 diff --git a/model.layers.11.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.11.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..ea3a18ca67dbcd0a9f7a6e94ac8ad8bc20f36ca3 --- /dev/null +++ b/model.layers.11.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3a26f6636124d68fb4d4cab45312ef69ff7443435bf7ea4e23729c0ff86bf23 +size 8390469 diff --git a/model.layers.11.self_attn.k_proj/NVFP4.pth b/model.layers.11.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..50050dcfc05721b94216f4d8452088c901e707c3 --- /dev/null +++ b/model.layers.11.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de0f855bddd3ff7576fb685e30b5176fd9f85f7175a8c5e03a0825d12aa1491a +size 8390363 diff --git a/model.layers.11.self_attn.o_proj/FP8_Block.pth b/model.layers.11.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..ec266bcb6c9070b472001114a7a1cb6e541626f9 --- /dev/null +++ b/model.layers.11.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa2ec2f1da52a546d6c013bea75b70b734e379115e74dcac0e4f6bd226246ca0 +size 33556279 diff --git a/model.layers.11.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.11.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..c4c3bcebe20eabba1fc48cb3c0ef9c1d7372f925 --- /dev/null +++ b/model.layers.11.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca0c793591704aae78b4529c8b42d83d89058aa65a3f1dc0b4a7658b0ee93ca8 +size 33556293 diff --git a/model.layers.11.self_attn.o_proj/NVFP4.pth b/model.layers.11.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..b255188f4335b3eec333dbde49601c37392398cb --- /dev/null +++ b/model.layers.11.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3faf0d6ac3f20f8446c9de81d44ab7c0e13d7cbad678feaadbbda89daab4b0d +size 33556187 diff --git a/model.layers.11.self_attn.q_proj/FP8_Block.pth b/model.layers.11.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..506d708850e587b294b3ad366f9d79640f1baabb --- /dev/null +++ b/model.layers.11.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0797915360f5a0d299596465d1e8af4b32043ea3ef114d14de7aaf687365cef1 +size 33556279 diff --git a/model.layers.11.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.11.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..6d91fcbed1f6c380a5dfaf4324b230a351002507 --- /dev/null +++ b/model.layers.11.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d23e1289e525041cfd67d7f86c6aec21aec34766801db7222962d89b40a7d126 +size 33556293 diff --git a/model.layers.11.self_attn.q_proj/NVFP4.pth b/model.layers.11.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..9d8fa07077780bf7390709d9bb72963ca749bc31 --- /dev/null +++ b/model.layers.11.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a936400dfea336530296672632db9e2dfff46173566723b42cc9ec14de30a8b +size 33556187 diff --git a/model.layers.11.self_attn.v_proj/FP8_Block.pth b/model.layers.11.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..db7d835950db608d3fd91f96e61923b2fc8b5844 --- /dev/null +++ b/model.layers.11.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d8b44603f1498219326793eb468c9141f02121f1e69b5811417b1d07d9f18d0 +size 8390455 diff --git a/model.layers.11.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.11.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..5e1cf5ae8ac7bb6038e6a69e3c1501d3011da6fe --- /dev/null +++ b/model.layers.11.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eea1b1c5f7b910791bafdffaf2dcaea4feeb39513ba4bdd63cf3d793aa05e9e0 +size 8390469 diff --git a/model.layers.11.self_attn.v_proj/NVFP4.pth b/model.layers.11.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..739e687f4896f0ed031bf9a0208c74ea7fd991e8 --- /dev/null +++ b/model.layers.11.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dca6a1496380736fe629bd457efa24b34336e8ac51bf66306d68cdb85c5dcdc1 +size 8390363 diff --git a/model.layers.12.mlp.down_proj/FP8_Block.pth b/model.layers.12.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..2470c13e19b5d314e2b64129b4580c704280211b --- /dev/null +++ b/model.layers.12.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df2f5638f231fe17c91049d0744ac8f39a70e41dbf22c6272b6a02aceece71fb +size 117442359 diff --git a/model.layers.12.mlp.down_proj/FP8_Dynamic.pth b/model.layers.12.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..d8aa747b34bfced4804a8f453cee8bd68de6b841 --- /dev/null +++ b/model.layers.12.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e469cf8891ecc719b69b7ecce44bb40f1383bc5cb26c024ac31b82ab5d5c381b +size 117442373 diff --git a/model.layers.12.mlp.down_proj/NVFP4.pth b/model.layers.12.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..e0ab6a360dac50ded1611b031992608ff10dc162 --- /dev/null +++ b/model.layers.12.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60e02d27c41be8513ae604e38ed440c648e521cf830062d31a961ba4e32891a8 +size 117442267 diff --git a/model.layers.12.mlp.gate_proj/FP8_Block.pth b/model.layers.12.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..b2739a0bb70d5636450906a2f89e276e3a92736d --- /dev/null +++ b/model.layers.12.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e775a5efc7e41662fadb9eb0cda900a62e40f25040b1fe50d4afc7b3091b84c +size 117442359 diff --git a/model.layers.12.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.12.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..3bdd242e6314c3f8950c8d86640d1cbf43cd33ea --- /dev/null +++ b/model.layers.12.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a722515c3ea3ea41ab7230b400c5d7140acf4373bcea4689d5fd3dba9bbe3fa +size 117442373 diff --git a/model.layers.12.mlp.gate_proj/NVFP4.pth b/model.layers.12.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..b81c2caab4af361ac551a0c11dc68ec4b0994edf --- /dev/null +++ b/model.layers.12.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13459ce231ad3425c4d330f41d63d01798fcedb142d220ccb9f34b8c3ac417e7 +size 117442267 diff --git a/model.layers.12.mlp.up_proj/FP8_Block.pth b/model.layers.12.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..3eb4b8e5f33010250e9da9a8c123a8ef116ec3c0 --- /dev/null +++ b/model.layers.12.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62a84195b77650460dc9157c834856458db2ab7c994bc3022b0a4e377224a953 +size 117442359 diff --git a/model.layers.12.mlp.up_proj/FP8_Dynamic.pth b/model.layers.12.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..caecbbca5186c3255d10a7f42a6e799e4e53f483 --- /dev/null +++ b/model.layers.12.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f32ef16da67289925b2c65bf8a79c400bfcf5f28154690c2d8f9ac057c168b1f +size 117442373 diff --git a/model.layers.12.mlp.up_proj/NVFP4.pth b/model.layers.12.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..16a58b0f206d424288e29fb236442429173957fa --- /dev/null +++ b/model.layers.12.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d771e639d9c26661a6e93b72ddaaba4997f58b956bd68d21c5de763377cdfa8b +size 117442267 diff --git a/model.layers.12.self_attn.k_proj/FP8_Block.pth b/model.layers.12.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..dbe5231b07f803e5580b5cf1f00e73f9300174b7 --- /dev/null +++ b/model.layers.12.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dda7633d86f4fc9ce9d32a89a0a818dcfe9168a45f00653679eeea3031ce5880 +size 8390455 diff --git a/model.layers.12.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.12.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..1c765b80296db1874749d3e9650ccf1f47931108 --- /dev/null +++ b/model.layers.12.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8795caef4223a83ba2626ba65f098c01e034a4d17c8f4d5b7dc931e583ee6603 +size 8390469 diff --git a/model.layers.12.self_attn.k_proj/NVFP4.pth b/model.layers.12.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..f16e69d7622c08ca24126ac0955f7cafa1cf4b4d --- /dev/null +++ b/model.layers.12.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8122a7ba0ce395444d8175c0a67da1318bc8df8eb1fd3401f73b926177c19ff +size 8390363 diff --git a/model.layers.12.self_attn.o_proj/FP8_Block.pth b/model.layers.12.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6aa60226d012c8da2d98318e148595a8684bf55 --- /dev/null +++ b/model.layers.12.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d352d2b7860dae2184dc63e4b9b252aa094bcc983f6ea6414fbf44348a53ec12 +size 33556279 diff --git a/model.layers.12.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.12.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..5eeae0a1cd767b6aabc4e2b452f7b85fd6d1b24e --- /dev/null +++ b/model.layers.12.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d540c984f6cc8d8a49f57cc54c82f0db98c85da4fe59c075aa1ba754f0a84d7a +size 33556293 diff --git a/model.layers.12.self_attn.o_proj/NVFP4.pth b/model.layers.12.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..1ce01796ff2b9e8e225387c766da51f636f8b1f1 --- /dev/null +++ b/model.layers.12.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f2de4c42ef9bca40293e7d5fd2742a1ee86246a68cd3abbdce1e4109652979a +size 33556187 diff --git a/model.layers.12.self_attn.q_proj/FP8_Block.pth b/model.layers.12.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..48620dbffde678e227332fa617591d23697a7003 --- /dev/null +++ b/model.layers.12.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b33f171904e090500d798d0ade00ceb62307d997491b8b04c803b803b0562584 +size 33556279 diff --git a/model.layers.12.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.12.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..d59eb7a22d59b14865a1fd6dc80cd3b401261c70 --- /dev/null +++ b/model.layers.12.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2de3cf65066738cea83a47d83e3c3126132747e657dc615390e871951a9145b2 +size 33556293 diff --git a/model.layers.12.self_attn.q_proj/NVFP4.pth b/model.layers.12.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..4e2a728abda8c930d339eb3d6fb4458b74ef061a --- /dev/null +++ b/model.layers.12.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbfad83976b0ee05009a55ba7d8f0105a65e2be9ada13fcec5138ce5fd3a7ceb +size 33556187 diff --git a/model.layers.12.self_attn.v_proj/FP8_Block.pth b/model.layers.12.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..960f822fec1f9c7422e2eec466c61ab54c4d96a6 --- /dev/null +++ b/model.layers.12.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:001ecba2e19187a57783c46cfb3b0c7cd537d41ffd9aad3879fd23bfc51095d6 +size 8390455 diff --git a/model.layers.12.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.12.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b9de6bc1bbb67797e7a0f29a22006c97234d6beb --- /dev/null +++ b/model.layers.12.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59a2c37c6913926f11ee0a4dcb4564d6c442c05337725950aa05e58ee6e2dda9 +size 8390469 diff --git a/model.layers.12.self_attn.v_proj/NVFP4.pth b/model.layers.12.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..2ffb09a23af30a333d7ba7da7963638eb127cfeb --- /dev/null +++ b/model.layers.12.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da181f856b8d302e5308b8f1ffc0d95380dd62c5ec73d2a955bb30260647a457 +size 8390363 diff --git a/model.layers.13.mlp.down_proj/FP8_Block.pth b/model.layers.13.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..d2136d9bf92dab2b5e8cb147613a6f00c1d1e97c --- /dev/null +++ b/model.layers.13.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:745b43f914ccf2091786aee124a86db107963b0cd142d7ea2a80e4d43522e152 +size 117442359 diff --git a/model.layers.13.mlp.down_proj/FP8_Dynamic.pth b/model.layers.13.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..d5ad76172160d38ec9b573c96f92fa0834253423 --- /dev/null +++ b/model.layers.13.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ecef5ca7c5c60bbcdf3e829a4fc7cee276f25db0aa9c3d8d0c7deb574a836aa +size 117442373 diff --git a/model.layers.13.mlp.down_proj/NVFP4.pth b/model.layers.13.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..c27a0df341789014279ff07c4c00331cea3d7982 --- /dev/null +++ b/model.layers.13.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2854d5fad30b5809af22988523488093a1ea01be70e365f5c1461ded544531f +size 117442267 diff --git a/model.layers.13.mlp.gate_proj/FP8_Block.pth b/model.layers.13.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..e274bf8e7b9b8e6491723249cfac3c687234275f --- /dev/null +++ b/model.layers.13.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f36a9eb0f67ddb7669d56d72c44fd788f644ecb58385a6ad71339c99e469d805 +size 117442359 diff --git a/model.layers.13.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.13.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..246fd3d58bfa8fc16ffae5c61ce8f205d9cceb4a --- /dev/null +++ b/model.layers.13.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e71abdcf266df3d2b8169690bd273a7fae0e4a69f9e5f0ae545e637472fb9295 +size 117442373 diff --git a/model.layers.13.mlp.gate_proj/NVFP4.pth b/model.layers.13.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..1850f4f5266bc391001f97bf15457e194549f927 --- /dev/null +++ b/model.layers.13.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4e72624a62f990e60b9a057c50c4986a2ee14bfbc23285816fe4eb2393f867c +size 117442267 diff --git a/model.layers.13.mlp.up_proj/FP8_Block.pth b/model.layers.13.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..d9e974473e451a26ef7048c888408e4f49c2c6e0 --- /dev/null +++ b/model.layers.13.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bfdeeca167bc8bfcfd970dfb529776129fb1b30600d05efa9ca90fe19b29129 +size 117442359 diff --git a/model.layers.13.mlp.up_proj/FP8_Dynamic.pth b/model.layers.13.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..595d8ad4ff64dbf98a59eb20707c6af0ba453072 --- /dev/null +++ b/model.layers.13.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a73c1873c347360e7902d4861ed92ef34c36d6e3ef6d2da9bc4897e64a3dd21 +size 117442373 diff --git a/model.layers.13.mlp.up_proj/NVFP4.pth b/model.layers.13.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..f571a5e9b7aced3c03adefa6dc5d914d45db4ab1 --- /dev/null +++ b/model.layers.13.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afdbb0e1729dba70f394a7be52226d62f001b21a6a2cd4fbde316d21d07af23c +size 117442267 diff --git a/model.layers.13.self_attn.k_proj/FP8_Block.pth b/model.layers.13.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..cb3e8986444cb343d86f2b17f2668421dc609f9f --- /dev/null +++ b/model.layers.13.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edc768faff501a0ac7a6990c0d7b4efc1d6a7354844b6f06b0aa0c46db306651 +size 8390455 diff --git a/model.layers.13.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.13.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..2ccc55e72d241c640b17001f81d9f52464086bc2 --- /dev/null +++ b/model.layers.13.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b8254f766592c902e0c27148f38ee7eb6a1a3122ad82001968ddecbbdb85b55 +size 8390469 diff --git a/model.layers.13.self_attn.k_proj/NVFP4.pth b/model.layers.13.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..d15007341e5d9752bf90e00bd68b124fa4da86af --- /dev/null +++ b/model.layers.13.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd24f73059a90e8678058628dd8c0d3ccc0b1ba3a3fec54e83835f27d9869b34 +size 8390363 diff --git a/model.layers.13.self_attn.o_proj/FP8_Block.pth b/model.layers.13.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..c13866c87127f1819071f1d168b10fb1528ebbeb --- /dev/null +++ b/model.layers.13.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a865abf0acc8cf9220be417074079753e71f16c92311f902a97c7de7c74266ed +size 33556279 diff --git a/model.layers.13.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.13.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..471b461f99b41c92147bd3d382128271b2c89fe3 --- /dev/null +++ b/model.layers.13.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2457ce5acc23fc46113ab06f8bac7848eacf27caabe689a0b712eed17c7cd446 +size 33556293 diff --git a/model.layers.13.self_attn.o_proj/NVFP4.pth b/model.layers.13.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..378eec2b2ea8dbbc20763ed7577e0e3b5fecdea9 --- /dev/null +++ b/model.layers.13.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c40ea73f726bbaa7053a7ca40d1031ba69f2fbb49e545a8384db62383b533c7 +size 33556187 diff --git a/model.layers.13.self_attn.q_proj/FP8_Block.pth b/model.layers.13.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..963b2132f253694f4f298b23d6c970a08d15db0a --- /dev/null +++ b/model.layers.13.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d4c12f8c883d95b5eac248d17c4e731c7d2e64e0dd5ed87d15b1dfdd1bc26ea +size 33556279 diff --git a/model.layers.13.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.13.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..fa30d837af731a651bfdfd0614de49bb57e3d903 --- /dev/null +++ b/model.layers.13.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38a892f23830d24f95b9c49b2736415ad4db36be68078dbb9378d18cdd4c88d6 +size 33556293 diff --git a/model.layers.13.self_attn.q_proj/NVFP4.pth b/model.layers.13.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..c4e72982b8117a1eb4870c47353dadb8c0998ee1 --- /dev/null +++ b/model.layers.13.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fc41edb776ffe519048c1e4bad4bdad3c827df74ab356c9dcc511fcc3927192 +size 33556187 diff --git a/model.layers.13.self_attn.v_proj/FP8_Block.pth b/model.layers.13.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..00f1af8491f6d69425e2837eb4e863b08f95860c --- /dev/null +++ b/model.layers.13.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fb810283c73e59c1f99cef5110695cc7e9014c61b3be7cc65a30278b5dbdd82 +size 8390455 diff --git a/model.layers.13.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.13.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..ddd58b2bd4c3d19e7866889c3d517d32ce306e44 --- /dev/null +++ b/model.layers.13.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bde6f2c6c6cb8701a3924a7476dd6ff638e682c9b49e95c72964c9b21cd8aa23 +size 8390469 diff --git a/model.layers.13.self_attn.v_proj/NVFP4.pth b/model.layers.13.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..650c517224f9ef2f9aa7960554bf4a1d0c5567b8 --- /dev/null +++ b/model.layers.13.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:001770743623233a048b58ca7cc13ddb0fbd18f3faab6d09fbc74681866e12c5 +size 8390363 diff --git a/model.layers.14.mlp.down_proj/FP8_Block.pth b/model.layers.14.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..83132022db1d9694b1b2ee595acdeaa2349fcb75 --- /dev/null +++ b/model.layers.14.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9b9612ad23e957c7ee994960146b4b34cd828c52a297893c606b8354dcb855d +size 117442359 diff --git a/model.layers.14.mlp.down_proj/FP8_Dynamic.pth b/model.layers.14.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..e3fb5b6e3064f2e247b858e30d9e8b73339c46b8 --- /dev/null +++ b/model.layers.14.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:189591f1d1a633b6b96487c5ea77c0c79765942794c8ed97b05c48e590ae8439 +size 117442373 diff --git a/model.layers.14.mlp.down_proj/NVFP4.pth b/model.layers.14.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..ec308268fca509028f14f639885e374ec12c2eef --- /dev/null +++ b/model.layers.14.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a380bca39815b45c96f74a0f060a793119b0824f06189e0abd0b2a867fa20afa +size 117442267 diff --git a/model.layers.14.mlp.gate_proj/FP8_Block.pth b/model.layers.14.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..a41dc6f2a717fe97f363de00a6bf09ad4d63d88f --- /dev/null +++ b/model.layers.14.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c7dd66d5786a00e4ce16c5cd37b10231f4d5a0cc4139cdb22c49e39a436fd78 +size 117442359 diff --git a/model.layers.14.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.14.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..9621c5efd64a9a4abe7dac77db76864e31e2a358 --- /dev/null +++ b/model.layers.14.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f9e36a94e13ed95aabbb1f9a523d206a70764830a0550037a5e9683fcfba9e +size 117442373 diff --git a/model.layers.14.mlp.gate_proj/NVFP4.pth b/model.layers.14.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..c7af705387ca21041154a69240f3750839610682 --- /dev/null +++ b/model.layers.14.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327b52b1f6d7828a525c00d36acd2b2397a13e2efc42949f38b9fc84f90c489e +size 117442267 diff --git a/model.layers.14.mlp.up_proj/FP8_Block.pth b/model.layers.14.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..43c25add8bf99761a203b6ca65b0afb138421a47 --- /dev/null +++ b/model.layers.14.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dd2db607d004dec3af9ea4c9fb3ca24594c29ab677a75c1bd900648283709d4 +size 117442359 diff --git a/model.layers.14.mlp.up_proj/FP8_Dynamic.pth b/model.layers.14.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..8263eb341b9e55098c7c5793e6c877d1e20166c2 --- /dev/null +++ b/model.layers.14.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a299de0f7f0f393087bd8c61e710f0cfecfc0f6d9f22650753952268557d4ac8 +size 117442373 diff --git a/model.layers.14.mlp.up_proj/NVFP4.pth b/model.layers.14.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..63a3d3e49600801fd2691657b6930a5f470353d9 --- /dev/null +++ b/model.layers.14.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:982490512968bb8ce00397c9a5bf10643492eab77e3ad438fe3d217d05512e3b +size 117442267 diff --git a/model.layers.14.self_attn.k_proj/FP8_Block.pth b/model.layers.14.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..1c93f9e9a2c0c6cffbfe81447e76bc626d7e94d8 --- /dev/null +++ b/model.layers.14.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8934c93dc7e3c78235baa73d0820c2eff425442833ffbd356aed2a1ac7a004a4 +size 8390455 diff --git a/model.layers.14.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.14.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..3b853c85a77414523e338dde2b16cb382f8d7768 --- /dev/null +++ b/model.layers.14.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b16311335fba8093dc97575196877d58155a5ce29ae4cac8979cdd3598fc0632 +size 8390469 diff --git a/model.layers.14.self_attn.k_proj/NVFP4.pth b/model.layers.14.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..4a0b53337202a9fc1ccd3d47f01e6c8fded1966f --- /dev/null +++ b/model.layers.14.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83a847338da3ccfaad6446c30be6c3c3cc659c829503cc30110c12b4f94420b2 +size 8390363 diff --git a/model.layers.14.self_attn.o_proj/FP8_Block.pth b/model.layers.14.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..6a8804c4b54271281f7d3b62fd9f793787392473 --- /dev/null +++ b/model.layers.14.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e98d3330443bcf9897bcbc56e44acc1343578a7d258985be5076f25cb9e94007 +size 33556279 diff --git a/model.layers.14.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.14.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..1766bce5e6a442d1673f69aa5afb804be7d32838 --- /dev/null +++ b/model.layers.14.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b039a3cfccf07cb1cb025acf0266c2d9ddfcc2053a653e6df9f808c39b25d364 +size 33556293 diff --git a/model.layers.14.self_attn.o_proj/NVFP4.pth b/model.layers.14.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..07dbcc2b5f132177a8dec58600aa0a0513619a45 --- /dev/null +++ b/model.layers.14.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:915f07d314b2727c683a23e7972057321243287a12ff59538fd0571ff40fc24e +size 33556187 diff --git a/model.layers.14.self_attn.q_proj/FP8_Block.pth b/model.layers.14.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..afd1728c58424eb2122f35a63f654a761cd3668a --- /dev/null +++ b/model.layers.14.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:467ab7b5b5717a546b15153a2e32c9f9a098ead4c2a627b4a320b0ff858db005 +size 33556279 diff --git a/model.layers.14.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.14.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..d51160f05bac943ed0f979cae2fe1b2805439436 --- /dev/null +++ b/model.layers.14.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1adcb1354e565446412c795e7dfc118b93fd61935b8048f1ad0ba7aae487b200 +size 33556293 diff --git a/model.layers.14.self_attn.q_proj/NVFP4.pth b/model.layers.14.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..e1cbe39913c7d655d0d55d616d253c4712fafb3b --- /dev/null +++ b/model.layers.14.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffe8121ad374228a6f477c080a11c0b59b1df0a41cc774d6aa3743f4e3b8ad98 +size 33556187 diff --git a/model.layers.14.self_attn.v_proj/FP8_Block.pth b/model.layers.14.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..099f9ec9e25239dccf5155acd4ff6f7553b84ccd --- /dev/null +++ b/model.layers.14.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f54b153c2c55276d9e32fce8a5fb49c36446b3f75f68c5a3be9ea955cc08fa84 +size 8390455 diff --git a/model.layers.14.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.14.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..33cc7e360d78ec650e276554ecdf2653ced47f7e --- /dev/null +++ b/model.layers.14.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a319afada5245f633b9987d3d95a7524f1779cfecec1c495c4c8de12a12cde6a +size 8390469 diff --git a/model.layers.14.self_attn.v_proj/NVFP4.pth b/model.layers.14.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..d2114e79a3dcc3dfbab3e7eabf3f9d4dabf1b906 --- /dev/null +++ b/model.layers.14.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d748f38063e8d927daeb1787769a46d2ab95743a90ff348a5e4fdc799599596 +size 8390363 diff --git a/model.layers.15.mlp.down_proj/FP8_Block.pth b/model.layers.15.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..e73cca2b03fa55498c906bbf613625f8a5974f28 --- /dev/null +++ b/model.layers.15.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a03e420698cbba1c13262aa756bddaf58a6679d2cc322e1f2b5fddc9060d128c +size 117442359 diff --git a/model.layers.15.mlp.down_proj/FP8_Dynamic.pth b/model.layers.15.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..25c332a09faf7e5ec06e582c1120524bf51e6017 --- /dev/null +++ b/model.layers.15.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e905486ec5db95933dba6dfe300b2ad3754827634345d7cce562a9ae71af238 +size 117442373 diff --git a/model.layers.15.mlp.down_proj/NVFP4.pth b/model.layers.15.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..069700f689ca9381a7346e78e37ab1d6fd365563 --- /dev/null +++ b/model.layers.15.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e77107b2e604ace0fdeb4207635d75615c7ddc52c2faf0f7b20f48c5e469f7f7 +size 117442267 diff --git a/model.layers.15.mlp.gate_proj/FP8_Block.pth b/model.layers.15.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..d84662d1cfbde2d56b65972b5af8fd754fcbe50c --- /dev/null +++ b/model.layers.15.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46f103c761f3104547f59f5609c359ed025692dd8e56e8d47d0f08492d0629e0 +size 117442359 diff --git a/model.layers.15.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.15.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..ac4ab88d93213af0dd14a2cedd8b0965a94ac4ae --- /dev/null +++ b/model.layers.15.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0812f11c311490e89b1476c213dacd576ea99f5ffc8e03983bd19f01ecfd672 +size 117442373 diff --git a/model.layers.15.mlp.gate_proj/NVFP4.pth b/model.layers.15.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..d6df063985fde339159bfa1ed8409900b84991bf --- /dev/null +++ b/model.layers.15.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92552a7835101c4618a7ca6a1b82d7c48d430f95d6c584c338ceb3b1c6597a8e +size 117442267 diff --git a/model.layers.15.mlp.up_proj/FP8_Block.pth b/model.layers.15.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..88e0e4c59eae0a0734c881ec90d16911e700a7fd --- /dev/null +++ b/model.layers.15.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e76e58feb417970e170ceb6cbe61353b0407620568ea50c78f243df245679a5 +size 117442359 diff --git a/model.layers.15.mlp.up_proj/FP8_Dynamic.pth b/model.layers.15.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..c32bbf6e518e51356523d6accb9f96a6d4bffa00 --- /dev/null +++ b/model.layers.15.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efd6d0f62a07eeab3873108ad5dcde950fba2a3806903b530be9d4414793e11e +size 117442373 diff --git a/model.layers.15.mlp.up_proj/NVFP4.pth b/model.layers.15.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..06f5cf2a8d823591859096713bc62514f0000a5f --- /dev/null +++ b/model.layers.15.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff640a2b511d43ea03607950f6bf5c1510abb92fb6c74591aeb1169f753c71ce +size 117442267 diff --git a/model.layers.15.self_attn.k_proj/FP8_Block.pth b/model.layers.15.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..3575ed41420ab4bbc47e56daf945f2162e2dd7cd --- /dev/null +++ b/model.layers.15.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a84742725de88dbaea6bc08fb9c09cdc822cecc505476285123295a339fba01 +size 8390455 diff --git a/model.layers.15.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.15.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..fcd6fb71ea11815d8ccad4019b76cafb2a8d8ec7 --- /dev/null +++ b/model.layers.15.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:569733363c6fbb08c458432648406693f3cc5f25e950a759953e36521be4c240 +size 8390469 diff --git a/model.layers.15.self_attn.k_proj/NVFP4.pth b/model.layers.15.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..1bfb158e4c3244dad65b9741ee97ac6eeea19f14 --- /dev/null +++ b/model.layers.15.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1c5ee4299704555e4f0bd9ca43e14f7af756ae9ec25fceb39a15e7e93fa51e2 +size 8390363 diff --git a/model.layers.15.self_attn.o_proj/FP8_Block.pth b/model.layers.15.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..5bca3aa7ee9479164afce20f00ac4bcafcb87999 --- /dev/null +++ b/model.layers.15.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7845153c8a7cc7dd55f280dafc7c9c4c0e7f9f92a8a34c2425819fc287040181 +size 33556279 diff --git a/model.layers.15.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.15.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..4a5122c7afa557f92c9b308f481304dc28f391a1 --- /dev/null +++ b/model.layers.15.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ce9c57ebb6ec3aba97bd60e96f68c83e46cadb727844fce5e0e9475e738667c +size 33556293 diff --git a/model.layers.15.self_attn.o_proj/NVFP4.pth b/model.layers.15.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..9a95c1ca1a73137212909fd6b7d923c3bf16294a --- /dev/null +++ b/model.layers.15.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fb03bb09815f625339c9fee4273ad8aaab510c74dbe963ff82aeea5f7446046 +size 33556187 diff --git a/model.layers.15.self_attn.q_proj/FP8_Block.pth b/model.layers.15.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..74c3f69516ca32f3f720d5fab4e54559523f9011 --- /dev/null +++ b/model.layers.15.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1387d1e6fab0eb843fe995b6a3c0bcc1f36e8a3ec4db5996d6154e2fe70ad54d +size 33556279 diff --git a/model.layers.15.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.15.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..ba814d31e8c0ca9d063a8f8c3ce8443c11392da8 --- /dev/null +++ b/model.layers.15.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44a0398ad4c02bd132860126287a3e55b89491dc89666e7ca58f926d8eefc6e8 +size 33556293 diff --git a/model.layers.15.self_attn.q_proj/NVFP4.pth b/model.layers.15.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..458d8da390edb51a91c2bcb7192ea0bcd38b619a --- /dev/null +++ b/model.layers.15.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545472a584ef4b84b265d89ee9fc64a0c6d5c1ae66152b9cb0026c15360ff73d +size 33556187 diff --git a/model.layers.15.self_attn.v_proj/FP8_Block.pth b/model.layers.15.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..7c887552171c6b5f2bd0afef4d94e7fbbb056955 --- /dev/null +++ b/model.layers.15.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95597c5ab58e165cc59d2a9d79becde1c6283a05a5a4475ef5c08c3bf0230596 +size 8390455 diff --git a/model.layers.15.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.15.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..bf3d36639aaab96957caa47a5339656a0dc77d25 --- /dev/null +++ b/model.layers.15.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4764590d58b498c4f989a8e23300635fb1923ec12d5f86e10abde8a988593dd +size 8390469 diff --git a/model.layers.15.self_attn.v_proj/NVFP4.pth b/model.layers.15.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..f7308f1865af34111f1eaba59abc294dad6f51b9 --- /dev/null +++ b/model.layers.15.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efabd788426efe4d3d2ad9550412bcf0dfe74e94a3e084cbb89ec9a687e08448 +size 8390363 diff --git a/model.layers.16.mlp.down_proj/FP8_Block.pth b/model.layers.16.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..78ba9382dde0e61d6263eaea08ee61412fc2a76a --- /dev/null +++ b/model.layers.16.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca20d39f66d3233409c4eb27a7d5db9b83958f43d4e43d7e7f37bc5b0e77a3b +size 117442359 diff --git a/model.layers.16.mlp.down_proj/FP8_Dynamic.pth b/model.layers.16.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b1c34f3dad2e01ff690266592fed6efbd04d67fe --- /dev/null +++ b/model.layers.16.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe4946badc6d9dfa6f1dcc1217107b3580efc6b88d7d2627cf733b1484452069 +size 117442373 diff --git a/model.layers.16.mlp.down_proj/NVFP4.pth b/model.layers.16.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..9a779ff4436c613901f20c1761c742e9b47f87dd --- /dev/null +++ b/model.layers.16.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a043a217e1a1661da04d1731b4847fb02c438e19ee33f22f4b4dff8965bc26a +size 117442267 diff --git a/model.layers.16.mlp.gate_proj/FP8_Block.pth b/model.layers.16.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..00529df7cb5b650484469a1366a8ecbe2f1f0b3f --- /dev/null +++ b/model.layers.16.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baa393bd534223f9ba5d49aa702934499cb3b74f0a88c4ab1151a1ad8794855e +size 117442359 diff --git a/model.layers.16.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.16.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..16f1e59ecc628e60906aa374234a99b944778ed8 --- /dev/null +++ b/model.layers.16.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3be8fff4da8db96ee59a274970132f6ee23a54c0ad1bca06688e369401a5e9d +size 117442373 diff --git a/model.layers.16.mlp.gate_proj/NVFP4.pth b/model.layers.16.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..2439da07efa6b91979fe6a98c3e1e776969cd470 --- /dev/null +++ b/model.layers.16.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7139bc5064a166c1f62c174274bbaaaf68d719c743a04f5ad518f3c8b461e6d +size 117442267 diff --git a/model.layers.16.mlp.up_proj/FP8_Block.pth b/model.layers.16.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..23a771c775fb514db5509a671d54e8b13d7a5af8 --- /dev/null +++ b/model.layers.16.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee0442bd2dae27da01d0ad46e36756f030ff56fa0ed1b0cd569e0064852e0d3d +size 117442359 diff --git a/model.layers.16.mlp.up_proj/FP8_Dynamic.pth b/model.layers.16.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..eb9e1497e4478c608525ff18a7f2300c77dd078e --- /dev/null +++ b/model.layers.16.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52a68be55facc567cf7f43ac21169d2abf27e6c46b8474f3218078c28bf5a6e4 +size 117442373 diff --git a/model.layers.16.mlp.up_proj/NVFP4.pth b/model.layers.16.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..f4a0c4cf66e35422694e8660b5725da65611db9f --- /dev/null +++ b/model.layers.16.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6da1688b3a280048ec21f93ef02690754be31cfbe672f0f9db4981fe383ce81c +size 117442267 diff --git a/model.layers.16.self_attn.k_proj/FP8_Block.pth b/model.layers.16.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..d006709c92d8fb7426b996d2c8345dc3087083b3 --- /dev/null +++ b/model.layers.16.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5b28b6fc4d946c2566161736e14952ca5fa9be1b47372e7b0b948ff445e1d3c +size 8390455 diff --git a/model.layers.16.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.16.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..3d36a14268f5b910c1a1e762049c50707093c538 --- /dev/null +++ b/model.layers.16.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebe50fff4dc9f4bf37e4d9e5adf172ea41f1ae11b47754cef310e85fb12fca28 +size 8390469 diff --git a/model.layers.16.self_attn.k_proj/NVFP4.pth b/model.layers.16.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..4ffda840d330c305d61f0c9f03fba58b4ce5ce57 --- /dev/null +++ b/model.layers.16.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0893cb471addf5a3e8afda44ee5860ff2ccf0f8f4a0e220994c9ce821f87399f +size 8390363 diff --git a/model.layers.16.self_attn.o_proj/FP8_Block.pth b/model.layers.16.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..a5998e0cf63c17c0ffeb1bf7388378bd1a9cff75 --- /dev/null +++ b/model.layers.16.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dbc75ad6307327f44d1ce851b8a6600f8999650d80cd6a674c6c10c1ee05c4b +size 33556279 diff --git a/model.layers.16.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.16.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..ef0b2e09bd4eab6b5d64a86697069f45decd0631 --- /dev/null +++ b/model.layers.16.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:164aa360a5952f57b5d6a7d54b2d6708f3624129ebc7bb18feb7399e8617598d +size 33556293 diff --git a/model.layers.16.self_attn.o_proj/NVFP4.pth b/model.layers.16.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..a60eb1c04fcc86f602cc8aa8d70a28cfe0b874ac --- /dev/null +++ b/model.layers.16.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1947624985344206789a5c03d4cdc0c24ecf3504d6c6d14005ce3283ae1f77ef +size 33556187 diff --git a/model.layers.16.self_attn.q_proj/FP8_Block.pth b/model.layers.16.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..c039c3b167ccbb54fd574a38694e7d64d0f6fd49 --- /dev/null +++ b/model.layers.16.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d78a3ba90695002add989caf18197d3079c27896651135ae877f5a579840ea03 +size 33556279 diff --git a/model.layers.16.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.16.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..8b778c96bd0f1a969ddd62e800f0b41e3df1aa6a --- /dev/null +++ b/model.layers.16.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8448a12f56287db35cc565f65b5789f16d01e4bd9f8b3a8a448cf8bf11aca8b7 +size 33556293 diff --git a/model.layers.16.self_attn.q_proj/NVFP4.pth b/model.layers.16.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..78ae0104f2b9cc64f6af52f3afbe6f1bb99e0a7b --- /dev/null +++ b/model.layers.16.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:007ec0bb867f87c9386a0fc66d0dfe974767df9c268dea57cd07c9525be02538 +size 33556187 diff --git a/model.layers.16.self_attn.v_proj/FP8_Block.pth b/model.layers.16.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..06dad3f0899abd8160cef32e90c3b6d89cfd3a2e --- /dev/null +++ b/model.layers.16.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:929dd0f55454b3166ececb8664bb8903f5c4e5d0e3596d3866a4de68c4268b55 +size 8390455 diff --git a/model.layers.16.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.16.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..2d413983cec67b29dc6622e35fb205788dd700c0 --- /dev/null +++ b/model.layers.16.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36514ad70ea6b9f30785c70417565188c2bb2c217ba6a272c0f16529d6260d27 +size 8390469 diff --git a/model.layers.16.self_attn.v_proj/NVFP4.pth b/model.layers.16.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..62d0023a48ce39d0cdb069277eb542a477e3e0a6 --- /dev/null +++ b/model.layers.16.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b99aafe70e0b2123398121b5a12500ed4ac9dec86ec4a222e6c67ada2972cd0 +size 8390363 diff --git a/model.layers.17.mlp.down_proj/FP8_Block.pth b/model.layers.17.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..089999ff89fe9943903821dd065aea092314ffda --- /dev/null +++ b/model.layers.17.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b08e64bf07d12eb3a90d25c24875a44bb460cff02bdc21add57014e3d7503da +size 117442359 diff --git a/model.layers.17.mlp.down_proj/FP8_Dynamic.pth b/model.layers.17.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..c0053e6177704180f8c36c122dbf1e02d069b4e0 --- /dev/null +++ b/model.layers.17.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d3b3c317df74ae273364e161a2137097a678f99d702f784d41fac34b51923a0 +size 117442373 diff --git a/model.layers.17.mlp.down_proj/NVFP4.pth b/model.layers.17.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..3fa8aa20dbc3497b8f7a02521028adf19bc897c8 --- /dev/null +++ b/model.layers.17.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56e8d40a1f3952180f2773153ca94afcacbe5857b868e51c22cd9d3dd0a364c +size 117442267 diff --git a/model.layers.17.mlp.gate_proj/FP8_Block.pth b/model.layers.17.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..dade0ce0b018fc4454f0c07107894f653d0b1a32 --- /dev/null +++ b/model.layers.17.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4f57fc986cc0623daedbc250d7ce521ddcdb739938e36cc240783a4c10d31a4 +size 117442359 diff --git a/model.layers.17.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.17.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..111e2bca4570bdbd9a759253efc55ab2041c1546 --- /dev/null +++ b/model.layers.17.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d65e22154e807cb98c6f0dced3b9843b970bd1efc3440bd478878a1fae26cfc +size 117442373 diff --git a/model.layers.17.mlp.gate_proj/NVFP4.pth b/model.layers.17.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..c50a4ab0fcb74e1a5ff5c8e56a8c8b614e3e8e92 --- /dev/null +++ b/model.layers.17.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43e265d52dd708e6fea06461c58f76d1a88e1847b674e0e02918a6e1eb67e71c +size 117442267 diff --git a/model.layers.17.mlp.up_proj/FP8_Block.pth b/model.layers.17.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..3e8d4e42925ea37cd045847b57420af624196ad0 --- /dev/null +++ b/model.layers.17.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e13821646cfc42306d9691785cd1263e25e9f6b95fc17a5b61c32abf2bc39c0 +size 117442359 diff --git a/model.layers.17.mlp.up_proj/FP8_Dynamic.pth b/model.layers.17.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..7c1489756e003296948ae67afea118e8223f3bbc --- /dev/null +++ b/model.layers.17.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72b95f9481ce9e68ee49c06906bbcf70cfd184cbbf6f332b35af1422c942b44b +size 117442373 diff --git a/model.layers.17.mlp.up_proj/NVFP4.pth b/model.layers.17.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..0fb7586d52a293b40e1c1aa359bafab0ff5c9830 --- /dev/null +++ b/model.layers.17.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27c02acf53d22820e734e198240067e3786011e0950ca0440433f97a0abf45ad +size 117442267 diff --git a/model.layers.17.self_attn.k_proj/FP8_Block.pth b/model.layers.17.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..72ca7800c51c5f6644f9149f25e9f092febb11e8 --- /dev/null +++ b/model.layers.17.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fca1433739dc83114a18dbc2c432d3b32a68e1c83a158d2c485f8bafc8ff790 +size 8390455 diff --git a/model.layers.17.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.17.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..8feeea4fa1bc5ac4fa718375bdcc0dab2a446a81 --- /dev/null +++ b/model.layers.17.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c540ccd39ad60a639c67067e15fa71c8f9370dde6505b3fa5118aa6fd7e7c878 +size 8390469 diff --git a/model.layers.17.self_attn.k_proj/NVFP4.pth b/model.layers.17.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..37177a93483ca95f4e4418005686d5df21a3dbd0 --- /dev/null +++ b/model.layers.17.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1f7a638af11b43ffd691f585ae927a4ac2cb8d5bce893794a9eee5be4a3e3ea +size 8390363 diff --git a/model.layers.17.self_attn.o_proj/FP8_Block.pth b/model.layers.17.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..50bc6de39d5b2ff006e8a4fa9e2047c60c664765 --- /dev/null +++ b/model.layers.17.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdde88c953f937edf8cc8dbc00140e0717c31d77c8d999c2e8de7c2ba481f45e +size 33556279 diff --git a/model.layers.17.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.17.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..e08193fc7298edd38b9273808dd8c1352a1665f9 --- /dev/null +++ b/model.layers.17.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f8ed9a83e342255f96e226935a1554b3d6fbd5b7f1e30e92ab61317f65483f7 +size 33556293 diff --git a/model.layers.17.self_attn.o_proj/NVFP4.pth b/model.layers.17.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..8963dbb3030434db44c6aa992ec24d2ca6f4e345 --- /dev/null +++ b/model.layers.17.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68f0dcc5ac85cf11b988c4bdb9a057934a4b0b03efc2815185c5784b6b39d64e +size 33556187 diff --git a/model.layers.17.self_attn.q_proj/FP8_Block.pth b/model.layers.17.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..a3575542c8e1f2b9d9f1b6c926655cd8897c3846 --- /dev/null +++ b/model.layers.17.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15fac251a9c296eee5682784a6219c0dba654226161ffc5a54061c716b0e5c57 +size 33556279 diff --git a/model.layers.17.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.17.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b7132644e9113ede2b710159b32fcc3acc3f0e55 --- /dev/null +++ b/model.layers.17.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfbb63717cb011016018c49b9c99ce833547e00bfbaedd24d534ec5727c53a9b +size 33556293 diff --git a/model.layers.17.self_attn.q_proj/NVFP4.pth b/model.layers.17.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..bdf54c041917ec6c3164e1f17b0236ccb497d1c1 --- /dev/null +++ b/model.layers.17.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df75f17c7fef9d87cd1e212b7c460da4593b63f99ac79a0e76b4954ab326455c +size 33556187 diff --git a/model.layers.17.self_attn.v_proj/FP8_Block.pth b/model.layers.17.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..a90254788ccb6cdc10eec1f44b454315aabcd6cc --- /dev/null +++ b/model.layers.17.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03c73ea842f0e9ad8c6116cf10d5ea6895f23e86fade00aaabc6982a5828ca14 +size 8390455 diff --git a/model.layers.17.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.17.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..1ecd9ec6cd29a7450c9861a4445afaf197623ddc --- /dev/null +++ b/model.layers.17.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89f3717b565fe0bd316232ed7516a813ff896ce1694ee76b4a448bec2f8133ee +size 8390469 diff --git a/model.layers.17.self_attn.v_proj/NVFP4.pth b/model.layers.17.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..522891ff14fa5d5ec111b73a8947d382391bc296 --- /dev/null +++ b/model.layers.17.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba2a4a2ad3f13e31cf3bdd3935fa9f995beebe92aead60bff8f4d0a5c335b9a9 +size 8390363 diff --git a/model.layers.18.mlp.down_proj/FP8_Block.pth b/model.layers.18.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..a119f71ec68be732d82aa8f8888c661b374dd5a2 --- /dev/null +++ b/model.layers.18.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbd7b38b791a9093c30bc07a6002490303868ea9849042e58b1787ba2cd8a6f0 +size 117442359 diff --git a/model.layers.18.mlp.down_proj/FP8_Dynamic.pth b/model.layers.18.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..1c6cab13969b62b0a4f64f4b80719ae30e4b9aad --- /dev/null +++ b/model.layers.18.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:311cf6ba9a2c66bebdffc8aed02a6c5067cd2f7bb85ff4a174bcb8ba29ee7207 +size 117442373 diff --git a/model.layers.18.mlp.down_proj/NVFP4.pth b/model.layers.18.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..f015e49cfd75b1e330a52c8b87ae2ba61d58ab57 --- /dev/null +++ b/model.layers.18.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efc3ce524ee8733854c27e43dec2ba5031a87844fb885d4c1ea994d99fa890f5 +size 117442267 diff --git a/model.layers.18.mlp.gate_proj/FP8_Block.pth b/model.layers.18.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..1c207c021a1a2821e2e7d480758c3bb8a9862b34 --- /dev/null +++ b/model.layers.18.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:217e460eba1904d4c48c634f1d4eda633a99652b38f94adc5ba8f65cbc7a45fa +size 117442359 diff --git a/model.layers.18.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.18.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..13299aba14b3ee4d1d72340a7cff916cdc531eb8 --- /dev/null +++ b/model.layers.18.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f11473e70e08dfafbd35d66f79c49de4aff570ffb2318cafd2b6da693e7e67db +size 117442373 diff --git a/model.layers.18.mlp.gate_proj/NVFP4.pth b/model.layers.18.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..e876b17fef24d9a6c7c8e67a7cdbe68a27164ac9 --- /dev/null +++ b/model.layers.18.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a218dc4a93c3a86e8ab080dbcf4bab55bfe2ae026641bde4379ee9ae645179fe +size 117442267 diff --git a/model.layers.18.mlp.up_proj/FP8_Block.pth b/model.layers.18.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..51530abd655b6f198d118a424d956db7d4f6acd2 --- /dev/null +++ b/model.layers.18.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e90f3372d6c8ba8ff7b51cee05857dd3e81f476d718f7d7e0586b836b8cc9bb2 +size 117442359 diff --git a/model.layers.18.mlp.up_proj/FP8_Dynamic.pth b/model.layers.18.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..dda7f308d1a527bdff195d92b15be28a8eb955bc --- /dev/null +++ b/model.layers.18.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f2fae28d9c5b11c8204aab739afa28ea2946d1118a24f72e17bc2e3c67bb467 +size 117442373 diff --git a/model.layers.18.mlp.up_proj/NVFP4.pth b/model.layers.18.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..bbb3cf68c7bf1c760c3826035373a31fafc5fa12 --- /dev/null +++ b/model.layers.18.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:903d7c1a7bc8cc75e199d68a7d1eeb0ff8b1b7c325e201aa6748e2729bbc0a3e +size 117442267 diff --git a/model.layers.18.self_attn.k_proj/FP8_Block.pth b/model.layers.18.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..6713e7300de22cad179da28c8ddd07bf59cad8ca --- /dev/null +++ b/model.layers.18.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a6abad8edc5097b87ebed03c7c9eb5ada427440244182f94e6c6389696347e +size 8390455 diff --git a/model.layers.18.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.18.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..c5f540134ab49bc38ded8d601e06c3d5bbb3070b --- /dev/null +++ b/model.layers.18.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d39c8ca222143ec5ca3921335e77e722467a59d3a6266ce121a60c10957d8e4c +size 8390469 diff --git a/model.layers.18.self_attn.k_proj/NVFP4.pth b/model.layers.18.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..04c7d53d7a45faac7f732f181e04886847ed0b32 --- /dev/null +++ b/model.layers.18.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4063f97f7bfbe3296bcbeafa8e8ede4ab7c27da85367c84b9e7007dac33dfe3e +size 8390363 diff --git a/model.layers.18.self_attn.o_proj/FP8_Block.pth b/model.layers.18.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..1a8c6692eeba92121be8dec33e84a83462bb7cd7 --- /dev/null +++ b/model.layers.18.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdca356b3ff431b62e57816231bf8a97308a1f1396808ce884ca780c6a10b9c2 +size 33556279 diff --git a/model.layers.18.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.18.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..e8682c14a57dd6050f27ae18d5d72114d2b123f7 --- /dev/null +++ b/model.layers.18.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:791a88c524c5d1f04b990efbc402f03e38d123248d3dab88998c7c5bae6909d3 +size 33556293 diff --git a/model.layers.18.self_attn.o_proj/NVFP4.pth b/model.layers.18.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..5f3200845ab93cf19b341444c9eb721ed7a89eaa --- /dev/null +++ b/model.layers.18.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6477be884d4fccd7859f9746796ecf07783e5cf9527fd403decc38d68198149 +size 33556187 diff --git a/model.layers.18.self_attn.q_proj/FP8_Block.pth b/model.layers.18.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..016e7aa2f99a9b24e85a0e6b96753e1c6011d7d1 --- /dev/null +++ b/model.layers.18.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:207014de33912ffeebbf50740d3c54779c269b3a5c7081fd297354994b12590e +size 33556279 diff --git a/model.layers.18.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.18.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..134c77af5e8ee33e06d4bcff83e80b2191db629a --- /dev/null +++ b/model.layers.18.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:775d59161d8896c1576a63d82660fc6cef2a89a4edb880e7f7f28f34dff681b4 +size 33556293 diff --git a/model.layers.18.self_attn.q_proj/NVFP4.pth b/model.layers.18.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..407c44c93e61a5ceac2db209b15aa4193e6b11be --- /dev/null +++ b/model.layers.18.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9a32dfa25145bd35a93e446379a3026aedf96806c2219f7fcd06eca27c01d85 +size 33556187 diff --git a/model.layers.18.self_attn.v_proj/FP8_Block.pth b/model.layers.18.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..7d56581184f115ca31a50c348d8de4b374851810 --- /dev/null +++ b/model.layers.18.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60c0471f7b16496a6b9afd9ea99ccd01230fac0b00aaa61c835074d5a31dfd88 +size 8390455 diff --git a/model.layers.18.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.18.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..de05ec14a397ed7c258c6ee8c057a894d6662f71 --- /dev/null +++ b/model.layers.18.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f0e48ce2bd065ce5414fca543ebc56f775bb8c8a0bbc2124641c6f370038bd +size 8390469 diff --git a/model.layers.18.self_attn.v_proj/NVFP4.pth b/model.layers.18.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..4a688d55acfc6c388781c94f432562bc30acb814 --- /dev/null +++ b/model.layers.18.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24104275282e8e5e968d8db036d1f3f7d22610bb6df7630b8f2360a3447acc32 +size 8390363 diff --git a/model.layers.19.mlp.down_proj/FP8_Block.pth b/model.layers.19.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..4f8101f9995c78466babce3c229490d56975a6f9 --- /dev/null +++ b/model.layers.19.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11522df4e9d0ea1a382a8d721c28d593a44ae86afccbb3b37c60ea5be3247e0a +size 117442359 diff --git a/model.layers.19.mlp.down_proj/FP8_Dynamic.pth b/model.layers.19.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..ca5840f6d2042bc148522fa78c75918b9e3b404a --- /dev/null +++ b/model.layers.19.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aad7234c773f6a871788059666dd3a9d271adbd55233010d56ae5503f4cf674 +size 117442373 diff --git a/model.layers.19.mlp.down_proj/NVFP4.pth b/model.layers.19.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..da1c380f9f6a4a519eeeaf27c237fdb71ba0998e --- /dev/null +++ b/model.layers.19.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9564c75208d8b77e9a90a750f978c38c34f4b60b5b72b24c6aedc691a59bf7b +size 117442267 diff --git a/model.layers.19.mlp.gate_proj/FP8_Block.pth b/model.layers.19.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..a6ffbaad21b58e92e28a9234714f8b942b32f7d9 --- /dev/null +++ b/model.layers.19.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3220009dffbae2c5e04e47ab8a91c636262bbbf8f81735dc3f98ad8c10bc7589 +size 117442359 diff --git a/model.layers.19.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.19.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..a535c7ec41375f9d46ad739d2ce48372c3e9825f --- /dev/null +++ b/model.layers.19.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c95f2374de5ece85c0bb561d05027ad1f80abd8d9376efeb59c782b7ee56f49 +size 117442373 diff --git a/model.layers.19.mlp.gate_proj/NVFP4.pth b/model.layers.19.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..aaa65121410aabd91564952f82543c8ac315b6dc --- /dev/null +++ b/model.layers.19.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a34a90e5bf8f5002f199fd77b00c036da21a5fc93bbb215fa36055aa737ff89a +size 117442267 diff --git a/model.layers.19.mlp.up_proj/FP8_Block.pth b/model.layers.19.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..3c4816405837fe84936d0c128ae81e872b45297c --- /dev/null +++ b/model.layers.19.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca33f6aaca546e5191ec07eed39999eaa12760e2394e00356936c0f7d2b2cd5a +size 117442359 diff --git a/model.layers.19.mlp.up_proj/FP8_Dynamic.pth b/model.layers.19.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..d7e59a49ab656d81b02dbadf037035c960b1cb55 --- /dev/null +++ b/model.layers.19.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93fc8beea2d00466f3bc62b880125b8bdb6a2eeb018e8beb67bd8e930243b414 +size 117442373 diff --git a/model.layers.19.mlp.up_proj/NVFP4.pth b/model.layers.19.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..4c7450687a4d70484aee6500e18210c2a7c40b04 --- /dev/null +++ b/model.layers.19.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbddbfc4e72c9fb76e7fb65c3fa7f6479351399ab8de8bd7d9d739cad4dc253c +size 117442267 diff --git a/model.layers.19.self_attn.k_proj/FP8_Block.pth b/model.layers.19.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..dbfcb85763af11fedbc6b4bbacabfe1ef37da56f --- /dev/null +++ b/model.layers.19.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b96827abcf0dfa2ad054e17150593ac89c4ed1398b5120cf7618681c992b1f93 +size 8390455 diff --git a/model.layers.19.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.19.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..c4b6a24cdac3c61407c0a48a012e8c70e59c38e0 --- /dev/null +++ b/model.layers.19.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0afa4f7aae9386bc8ce1b0ecc79fdaf30d64fcd63e538f59bff272a5fff8c16 +size 8390469 diff --git a/model.layers.19.self_attn.k_proj/NVFP4.pth b/model.layers.19.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..76e4cab5cc24300048fc0bcc2201570aa64bfe8c --- /dev/null +++ b/model.layers.19.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7eb4225e4fc5141e1422615755aec536a47c04772cf978c87debc14260f751bf +size 8390363 diff --git a/model.layers.19.self_attn.o_proj/FP8_Block.pth b/model.layers.19.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..0374545590f3dbcda74c6e90060f8a4a2e7ccf39 --- /dev/null +++ b/model.layers.19.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:369ac4181566058941a69d05c221915ff9004ccdbe7da67ecfc28dfb4a522bec +size 33556279 diff --git a/model.layers.19.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.19.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..98cf3a28330aa85c2555928a47e270094dc085c5 --- /dev/null +++ b/model.layers.19.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:967be3477b20c5a74742f6a8f751344c02b7e8aab821e9f95cd0e6fd072c0f5d +size 33556293 diff --git a/model.layers.19.self_attn.o_proj/NVFP4.pth b/model.layers.19.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..c87fbc247bfefa9f6e3738287421f513aacdec9f --- /dev/null +++ b/model.layers.19.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d40575c0102c3327a4f933dddc78aa31cdd9b0b26aa8ad8029c97d767bc9362f +size 33556187 diff --git a/model.layers.19.self_attn.q_proj/FP8_Block.pth b/model.layers.19.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..b428f65b201342dbd00047291b1956000ca4f92a --- /dev/null +++ b/model.layers.19.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f14ebd9ef51bc935c747d421ffe20d1546387b8d46be9c2789338709ebcc851 +size 33556279 diff --git a/model.layers.19.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.19.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..74ae1ef517ba57b060ea31e84fafde73cc33ca6d --- /dev/null +++ b/model.layers.19.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0456382b0d32b26261c3d8228404fc11c7a3bd8c525992a9946e98227358161d +size 33556293 diff --git a/model.layers.19.self_attn.q_proj/NVFP4.pth b/model.layers.19.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..a2df6218e78c4eecbd34b13d7c3717bbd76d3859 --- /dev/null +++ b/model.layers.19.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f46890e672500a0f5d58e75102b102106ef810887dd0ffa6d7533cf472b812 +size 33556187 diff --git a/model.layers.19.self_attn.v_proj/FP8_Block.pth b/model.layers.19.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..d8a571b0a67a97b96ebfe96fe784a7133745543d --- /dev/null +++ b/model.layers.19.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9857faf1bb256d844d8cb26ad4e563e3c5236571ae2f5d17d634da0fddaab2d1 +size 8390455 diff --git a/model.layers.19.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.19.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..503d9f4176f53c3823b32eca1a14125801f27516 --- /dev/null +++ b/model.layers.19.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7f77ee7a8b930a66020b420265f1635a6f023f6eba26d9135f80a6757d315ad +size 8390469 diff --git a/model.layers.19.self_attn.v_proj/NVFP4.pth b/model.layers.19.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..ef1edc6d2f321ee1d4aa6afcfa03ed84ba524fed --- /dev/null +++ b/model.layers.19.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39435754a193101b731f0728c49d621d8d98548117544ea8e17b0e75589d75ed +size 8390363 diff --git a/model.layers.2.mlp.down_proj/FP8_Block.pth b/model.layers.2.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..25bf39ff564574492664636d02b0e8271bc80714 --- /dev/null +++ b/model.layers.2.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd24649aa149c20cbd4541b47fa2d7c029aeb4bf18ac14ee6aa4c1b84717d6a2 +size 117442359 diff --git a/model.layers.2.mlp.down_proj/FP8_Dynamic.pth b/model.layers.2.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..827bd3088a75b7e50b47f41b071100d0a70829b9 --- /dev/null +++ b/model.layers.2.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:127b5057aa825e5e69dc4131436ac5994020e3769e3c476d0bbb94d67357d0c0 +size 117442373 diff --git a/model.layers.2.mlp.down_proj/NVFP4.pth b/model.layers.2.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..2f0d20e938ac33b7c2fce88f4e12cbbe23a44ce9 --- /dev/null +++ b/model.layers.2.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ff40949de9d6c496a5dccdbab87c1027d99e2d29606e8500dbbaf8018f474cd +size 117442267 diff --git a/model.layers.2.mlp.gate_proj/FP8_Block.pth b/model.layers.2.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..81bbeebd1cff9539557fe7670fd40a2282f0737d --- /dev/null +++ b/model.layers.2.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7350dcf15434687d99c67fdef2b1e237d20e046d7d40db461373ebdc7f0c444 +size 117442359 diff --git a/model.layers.2.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.2.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..357970f2d3739109ca6ebfc406eca66264d4c37f --- /dev/null +++ b/model.layers.2.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6cad2867f2390894f2a65108a280dad2ea63b71bcdaf339f61b3b956345c071 +size 117442373 diff --git a/model.layers.2.mlp.gate_proj/NVFP4.pth b/model.layers.2.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..4b564c079b9e031071ed7a8ac5e4223fdee11d7d --- /dev/null +++ b/model.layers.2.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7103e95dc698d3780b527509e7bbe1bd92eaca5bdae682a9c0dfdf96215032c +size 117442267 diff --git a/model.layers.2.mlp.up_proj/FP8_Block.pth b/model.layers.2.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..669ea49aeaa0b25792e977c08fe6973cffbd1056 --- /dev/null +++ b/model.layers.2.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e95311c9ae617524f6735e21498294c90cf9b3f0d2af121deb1e5149b16eba3a +size 117442359 diff --git a/model.layers.2.mlp.up_proj/FP8_Dynamic.pth b/model.layers.2.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..96dba24620b6947190bf891d7f8fafe3072c7469 --- /dev/null +++ b/model.layers.2.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17459e968a46a4fce897e57831f15b435507125f64f60fb2898eb7b62992afb0 +size 117442373 diff --git a/model.layers.2.mlp.up_proj/NVFP4.pth b/model.layers.2.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..e5fa99fad1d9509007428052dcfcd86a197c828e --- /dev/null +++ b/model.layers.2.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:777c7eda51803c7a0f038fb6c3a51c8afb3b993bfbc2bea8dc0c3a219e819b59 +size 117442267 diff --git a/model.layers.2.self_attn.k_proj/FP8_Block.pth b/model.layers.2.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..c594c4ee3e9ecc008cc6124f0efb9296f7fa3219 --- /dev/null +++ b/model.layers.2.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0fdf01810edb1502c05683a2a68d7af1b709e0d7a26443c04d0499d6ddde915 +size 8390455 diff --git a/model.layers.2.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.2.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..4c71f8f416e5651958151928c51745d559bf29a0 --- /dev/null +++ b/model.layers.2.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6a039d7cc6f38519a37fc347b8e7f7d267f082eb83743c20a881f1b7ff74851 +size 8390469 diff --git a/model.layers.2.self_attn.k_proj/NVFP4.pth b/model.layers.2.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..ad391c9168c74e4492e29b676817ba832721b5a0 --- /dev/null +++ b/model.layers.2.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f910e9072b1a99db8a9c36b77e76d52609758dd690dfe5f3d776e095d847a5c +size 8390363 diff --git a/model.layers.2.self_attn.o_proj/FP8_Block.pth b/model.layers.2.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..12889f34f9c90b2822aa34a1cb752917d517d004 --- /dev/null +++ b/model.layers.2.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:810d3062846cb47e62a70c457118c0c4ddef1c4bf77f8bce40abd48b759db2de +size 33556279 diff --git a/model.layers.2.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.2.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..4ae5fc1f475a124818f955280a9c6b327c704f1e --- /dev/null +++ b/model.layers.2.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e7d090336663166732da0bbd1e0ff39deb7ed3539dad184ea66893aaa49de4d +size 33556293 diff --git a/model.layers.2.self_attn.o_proj/NVFP4.pth b/model.layers.2.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..276831f85bdb2053469544465d77ab2b25e6fa8c --- /dev/null +++ b/model.layers.2.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25bc47d5a95ea1727f2a7e5c5633b696a72b164555abe5786d608a9e602fdc7f +size 33556187 diff --git a/model.layers.2.self_attn.q_proj/FP8_Block.pth b/model.layers.2.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..c530dcc85fde4d4be138e635447919c24006c9af --- /dev/null +++ b/model.layers.2.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bad457bef83b8e7e2e5cc17de7ad7bbd6702f6beca8b0b655fbe8db3903c8bb1 +size 33556279 diff --git a/model.layers.2.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.2.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..a871204c0f3171d994f1847a8a505fc46b77adb0 --- /dev/null +++ b/model.layers.2.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45712bb64074b66d13edcd4ff2da9cddc0c1ff224d13923b9918ac33c1462de4 +size 33556293 diff --git a/model.layers.2.self_attn.q_proj/NVFP4.pth b/model.layers.2.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..ad0c0fadadfa70acf8c9768ef8882a99b784c918 --- /dev/null +++ b/model.layers.2.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cf8ddbca214f683497cbaebd34ee7d3fd85e914ed5cc42883d81c370043c8f7 +size 33556187 diff --git a/model.layers.2.self_attn.v_proj/FP8_Block.pth b/model.layers.2.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..e170d055b94fd5142501534bc3508bd68c7eafac --- /dev/null +++ b/model.layers.2.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5761c9537e41ccb45163af0daa0e36f96948b08cad027aa6d3c747f6fe8f2e1b +size 8390455 diff --git a/model.layers.2.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.2.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..41db0d8d7386dd9c369b2a80a85378ab8b6ad68b --- /dev/null +++ b/model.layers.2.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07c8246b6a6a3bcb7ade06451be4b1efe5a6440b08081676b0671a3c777726d8 +size 8390469 diff --git a/model.layers.2.self_attn.v_proj/NVFP4.pth b/model.layers.2.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..af289bf7b4860c9a3d7c20654c2009ad19aee5ea --- /dev/null +++ b/model.layers.2.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebe86ab699ac6563b4fcaade6c623b609d0af0ea4bf4adc4fdd06cae0373ebec +size 8390363 diff --git a/model.layers.20.mlp.down_proj/FP8_Block.pth b/model.layers.20.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..2dbca01f179260cf1d08131c2f730640d72a6e2e --- /dev/null +++ b/model.layers.20.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e537f6c49bc184a32d0a55909ac5a6174f64fcd7db09f7f5ebf46d05db016ae +size 117442359 diff --git a/model.layers.20.mlp.down_proj/FP8_Dynamic.pth b/model.layers.20.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..f3de32d27f41c052c2f3716fd862c5ef3d76e3b7 --- /dev/null +++ b/model.layers.20.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:687ea3cbc0fa21b7d58d04b7f385ea5b3b5bb073274cb4fdb0eb3b5427f5ed1a +size 117442373 diff --git a/model.layers.20.mlp.down_proj/NVFP4.pth b/model.layers.20.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..7c4194425ab69e58b046345aaf31456f0106dd80 --- /dev/null +++ b/model.layers.20.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf044adf8abe4b1dccde6276cd98356f8ef10cb2ad5dcfc1191bb7a1c3b5960d +size 117442267 diff --git a/model.layers.20.mlp.gate_proj/FP8_Block.pth b/model.layers.20.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..bc91b0ec5ea27b0f646b5152d7456f6d5c62c991 --- /dev/null +++ b/model.layers.20.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56064089964be976db12fd7bc75ef8000122c5060ed3cb373bf0ccc60faa3cc9 +size 117442359 diff --git a/model.layers.20.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.20.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..d00efab9201abd79184742fe52f1a386f7f6c88e --- /dev/null +++ b/model.layers.20.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d0f4fd32ed471bba826a7b989d7bfdaa6f96fc96e3174c284c86e0f272e5d62 +size 117442373 diff --git a/model.layers.20.mlp.gate_proj/NVFP4.pth b/model.layers.20.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..67a3faf26f0604def9f6da8d3201e852192f2c44 --- /dev/null +++ b/model.layers.20.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa6e007a0e6dd71632692b3beb19797be08d6e4dd07a680f49965bf2169903fa +size 117442267 diff --git a/model.layers.20.mlp.up_proj/FP8_Block.pth b/model.layers.20.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..48633a20dcb6466314b2473f97fb629a43681833 --- /dev/null +++ b/model.layers.20.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98c7b9835853b57bc50d5f18fa56065f51be8394e3c241bf882112cfb01b620e +size 117442359 diff --git a/model.layers.20.mlp.up_proj/FP8_Dynamic.pth b/model.layers.20.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..28287986eb19769c562d71ecc496f9b6ef1411be --- /dev/null +++ b/model.layers.20.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:648c1fc5ebb6a512a638b6e8644ee44959d0ce5290892e1c0a7011ff50eae7af +size 117442373 diff --git a/model.layers.20.mlp.up_proj/NVFP4.pth b/model.layers.20.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..98dd42f49dd82bd119af1fb7f81654e98fc73588 --- /dev/null +++ b/model.layers.20.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62e615788addfb17f7b78539e0dbabd7bb33fc80da70e4f4dbb9bf87167558ab +size 117442267 diff --git a/model.layers.20.self_attn.k_proj/FP8_Block.pth b/model.layers.20.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..c5cdc04f6affa07464b19fc3638222b2779e48b3 --- /dev/null +++ b/model.layers.20.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a50e2532bc049381e73261ef70058441392fe8acacd74a38423161337545322b +size 8390455 diff --git a/model.layers.20.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.20.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..3dc370ea4a759d35bd9092ddb7d88c6de3c2462f --- /dev/null +++ b/model.layers.20.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7c5ba25899cd7aaa28880a753ffd7cc95970aed9a26429bd3d5c4709a7338f2 +size 8390469 diff --git a/model.layers.20.self_attn.k_proj/NVFP4.pth b/model.layers.20.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..f1182f8bf84aa8db3a890df2b4ece368f3f4577c --- /dev/null +++ b/model.layers.20.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed73c34f0b0414a8f06784c88057746b5d6f9bc9206878cf8265bcfad74cd8b0 +size 8390363 diff --git a/model.layers.20.self_attn.o_proj/FP8_Block.pth b/model.layers.20.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..09f7c7bf9c2a4a276cf4fd132d631d35d5be542f --- /dev/null +++ b/model.layers.20.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aacf910d02c4da2c0653dffe7cf14f125e6f145cce6f5f9d0b30befca73e81ef +size 33556279 diff --git a/model.layers.20.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.20.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..58789e58af3a107194b89508ed71e028b23fa655 --- /dev/null +++ b/model.layers.20.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72048d6168461dfd4c720de92aec9e3856a661a970cea4f16f49b8f59b3720d1 +size 33556293 diff --git a/model.layers.20.self_attn.o_proj/NVFP4.pth b/model.layers.20.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..1198a367725fcb9f880feb0241840a50284b3ca6 --- /dev/null +++ b/model.layers.20.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54e045e23b7a872476a95f59723c9eec2e94e3444b6832985ee0fa8d756910cb +size 33556187 diff --git a/model.layers.20.self_attn.q_proj/FP8_Block.pth b/model.layers.20.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..909a167ce1ba19760e52cedf2efcf6265cf9806d --- /dev/null +++ b/model.layers.20.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c7c2f7a3af579ce8213aff4ba40cefa028cc61cde88582e22aa0d0b5f158ea3 +size 33556279 diff --git a/model.layers.20.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.20.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..89cc3e5ea23627b7d5b634ac2118c3bdb34206aa --- /dev/null +++ b/model.layers.20.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ed1b1d55a2b4b1139bb5b764e2f802d833a59840a0c6f184fbe9b50bd1e8453 +size 33556293 diff --git a/model.layers.20.self_attn.q_proj/NVFP4.pth b/model.layers.20.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..fc670684e11d3b5118fcbd468468971126411141 --- /dev/null +++ b/model.layers.20.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:434b5fc68d6e9a9e393ac4915f978550e9be8237dd75f6df06faef85c144272b +size 33556187 diff --git a/model.layers.20.self_attn.v_proj/FP8_Block.pth b/model.layers.20.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..b5119a622a06fed1a415c0134345f84148aa4676 --- /dev/null +++ b/model.layers.20.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96856da261a080f284fb01235fd99fd501c9998f456a936a52b2f04ff6b6112e +size 8390455 diff --git a/model.layers.20.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.20.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..5b777c3352ea3c728cd739df6180deacc5fb7288 --- /dev/null +++ b/model.layers.20.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e24a6469664ec801cc14393edbd11038f31e63b5e8f376bad185e59a9e4312 +size 8390469 diff --git a/model.layers.20.self_attn.v_proj/NVFP4.pth b/model.layers.20.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..1e0ff31a8fb67cbb003aa024bfae3df82626d77d --- /dev/null +++ b/model.layers.20.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a8343f1444731325b80cf30586095679dc34bbee9a6b2cf0161610fc7614377 +size 8390363 diff --git a/model.layers.21.mlp.down_proj/FP8_Block.pth b/model.layers.21.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..ae55eef7574faf59083f50aae041f5b3f173a98f --- /dev/null +++ b/model.layers.21.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be929cbbf892ed963150d95d42b9ed6fc39feba8c0949bb2011fa053c5ac1451 +size 117442359 diff --git a/model.layers.21.mlp.down_proj/FP8_Dynamic.pth b/model.layers.21.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..7db2e1757315e2874f3d3851a4609d4e0997420c --- /dev/null +++ b/model.layers.21.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49852c810bf0b70ae2d6380fe5cc09867a4343a7c34d7800f7c2e3657e06539c +size 117442373 diff --git a/model.layers.21.mlp.down_proj/NVFP4.pth b/model.layers.21.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..26d260651ae412c857b321ffd15940d0a90a87da --- /dev/null +++ b/model.layers.21.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86465482fa42d397e73049f1cee5c45024c551a9fabec4df2c1fee0cd891fa41 +size 117442267 diff --git a/model.layers.21.mlp.gate_proj/FP8_Block.pth b/model.layers.21.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..02ab6572907c3ba1329ced1a3b3d160ffe6918e4 --- /dev/null +++ b/model.layers.21.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b72204690cc1c4b81c86bb245313363dd181e714c89f450952e45709fbe44a40 +size 117442359 diff --git a/model.layers.21.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.21.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..4bf4aa0c240245a803f86d0c7bb4b6f128fb3185 --- /dev/null +++ b/model.layers.21.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7874b93f2c534fe46331bc8677dcd03c8b762f1b654c198a698d43dd4716a9e +size 117442373 diff --git a/model.layers.21.mlp.gate_proj/NVFP4.pth b/model.layers.21.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..cd32cf5c1de4a27d7c1589aaffdf3b9789eeba7e --- /dev/null +++ b/model.layers.21.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c603509dddde673e92a9763e37412a303e23688b43c1260fccb18d06c94e0a7b +size 117442267 diff --git a/model.layers.21.mlp.up_proj/FP8_Block.pth b/model.layers.21.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..0074e052b740c66b3ce64296db58e6b1b55d4d05 --- /dev/null +++ b/model.layers.21.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf822c8c93baf594b9864b4e1e9058e5a35d2b9bda272e47ab90a6f73bad9e86 +size 117442359 diff --git a/model.layers.21.mlp.up_proj/FP8_Dynamic.pth b/model.layers.21.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..3bd64f7845914bf069be41a6bf8abd3e5cfc23fe --- /dev/null +++ b/model.layers.21.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31c344baf2e7cae29bb8ddae2ce25336fc84ad1f62e6caa717a14ba31775e615 +size 117442373 diff --git a/model.layers.21.mlp.up_proj/NVFP4.pth b/model.layers.21.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..b955a685b8cb047dd33f4d22cba189d34580f67e --- /dev/null +++ b/model.layers.21.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:444a33bb06560b84a6217e6f4c15fea08a242d65a2d42ac0a17056cf99d9a0cd +size 117442267 diff --git a/model.layers.21.self_attn.k_proj/FP8_Block.pth b/model.layers.21.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..12125dbf0106a5373d2a8ca98c2dbf559318f7c6 --- /dev/null +++ b/model.layers.21.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fb66a2b478e7aaf9c47a686a1b9f7bbdc92986f8b94d0a1d62086ccd118e41a +size 8390455 diff --git a/model.layers.21.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.21.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..ddbb4e4531b1e6090d71b552bced066930571d01 --- /dev/null +++ b/model.layers.21.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46fb8ba52d787f6d071839a490950d56b551f0e843ebaebac2ee7b2a44f4c26f +size 8390469 diff --git a/model.layers.21.self_attn.k_proj/NVFP4.pth b/model.layers.21.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..d64605522d647d0d34dba7cad1af642e272aee8f --- /dev/null +++ b/model.layers.21.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2250001af63c24516764f19a473548a776065fad75ae5bf7336acfd89755d56 +size 8390363 diff --git a/model.layers.21.self_attn.o_proj/FP8_Block.pth b/model.layers.21.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..756143ec3a30d34e0a1fd236641ee7ed172e041c --- /dev/null +++ b/model.layers.21.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1198f8d94d64cf14440afe926535389e3eb02d964fb39ddb134b822e32997f56 +size 33556279 diff --git a/model.layers.21.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.21.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..490d0f37ad0ef49df568def6a20703b54115e162 --- /dev/null +++ b/model.layers.21.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09df2ab5147ce8fe0200d65faeff05c764cabe79b10c920d3839e4ac4359c099 +size 33556293 diff --git a/model.layers.21.self_attn.o_proj/NVFP4.pth b/model.layers.21.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..a7b3aeed0a814f65d0a3b05371e0d790c4c95a62 --- /dev/null +++ b/model.layers.21.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e49d3c2477ffd00ba78073d8ce313da61817c92f7882bb48b72bb4cb7e1af6e +size 33556187 diff --git a/model.layers.21.self_attn.q_proj/FP8_Block.pth b/model.layers.21.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..be37e5c543901cf90de3763397b0e50b918f1fc9 --- /dev/null +++ b/model.layers.21.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f45b3eb0a1e55a048aef4d9865051e9b454579aff71f5d9716f7f948c300390 +size 33556279 diff --git a/model.layers.21.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.21.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..568d39b4d7fefe44501c2f54152f50c2f4e9bcb3 --- /dev/null +++ b/model.layers.21.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c4bc672c3a78e739f7cefb54a7e48f92423ab9e2e1ef2fb34576fdf4c371d79 +size 33556293 diff --git a/model.layers.21.self_attn.q_proj/NVFP4.pth b/model.layers.21.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..64502ec2ed1ec8c2d0ff8aa5d9d0bce1ec2de452 --- /dev/null +++ b/model.layers.21.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38e17eb551d0899b96f62f847dd04c1b5cd9b199b3b349e9ca64cf00c5b742fe +size 33556187 diff --git a/model.layers.21.self_attn.v_proj/FP8_Block.pth b/model.layers.21.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..85ed84b46db8bdb160fdc804e06ca61451463b10 --- /dev/null +++ b/model.layers.21.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:157c2afd949982331935b1f6ac3b79ce54cd85f7e295ec8117aae9d49d713eeb +size 8390455 diff --git a/model.layers.21.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.21.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..207acf13f3dbbd60ac854daef197ae4e7a68c7d3 --- /dev/null +++ b/model.layers.21.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75f812f202fc2df975db4434894793155068859376c77f54e165403f1dcba8cb +size 8390469 diff --git a/model.layers.21.self_attn.v_proj/NVFP4.pth b/model.layers.21.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..ea87338a09dc98d7fb9224cb86cc83ef5be27602 --- /dev/null +++ b/model.layers.21.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64c63cbe39008332f2d118036a20a49573a72aebb46a527af1b690d16169d232 +size 8390363 diff --git a/model.layers.22.mlp.down_proj/FP8_Block.pth b/model.layers.22.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..c9a5e4b5582ac9786271c44edc21c206b3fd9fbd --- /dev/null +++ b/model.layers.22.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fee6d758f02ea6d07a5f0111859180d99167cac500c55cc1cfe85ff4d15a9abf +size 117442359 diff --git a/model.layers.22.mlp.down_proj/FP8_Dynamic.pth b/model.layers.22.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..390e2abdc593f2c027e7745a326aae36094bbf44 --- /dev/null +++ b/model.layers.22.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fb7a36a48eaeb6a9dc5b2530a334420f91a0eb2c95429c142be0d4155e19708 +size 117442373 diff --git a/model.layers.22.mlp.down_proj/NVFP4.pth b/model.layers.22.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..89b0cd533ffd6bba941029f48ef5dd070020f8b0 --- /dev/null +++ b/model.layers.22.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34826ee7bb6e39ff56610a7064c2db910f56226afdc7cd7ffe798cbb6874deb8 +size 117442267 diff --git a/model.layers.22.mlp.gate_proj/FP8_Block.pth b/model.layers.22.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..ac1a1d3a404170c4208813f7b49830f565336ce1 --- /dev/null +++ b/model.layers.22.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e99d0bc99837f6d7f2e07a3081cbc778218410ab8b038dc5fba9cad66b65400c +size 117442359 diff --git a/model.layers.22.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.22.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..5eed69879624f1eaba1abd1b3d1248f4576913a3 --- /dev/null +++ b/model.layers.22.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da50612e501f56b35809406cb4a5f729149a8e782500d63e717cf551ce6392e2 +size 117442373 diff --git a/model.layers.22.mlp.gate_proj/NVFP4.pth b/model.layers.22.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..ff222252ca3b54be1bc48cf206176c280a4e597b --- /dev/null +++ b/model.layers.22.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9675444effbccb1e304f1e8ce5ddcc769cb893a9ea0e935f99b873a578036cac +size 117442267 diff --git a/model.layers.22.mlp.up_proj/FP8_Block.pth b/model.layers.22.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f91bb5888f06a2b08c2fc808776c82db3ee24e1 --- /dev/null +++ b/model.layers.22.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9950a08762c9740245e809dd2acec71622e47a108fb464b0b7ec11c8b5929a93 +size 117442359 diff --git a/model.layers.22.mlp.up_proj/FP8_Dynamic.pth b/model.layers.22.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..2355576556c6fe9fa016d6decda8024e206f2f11 --- /dev/null +++ b/model.layers.22.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98aad2de58d0c60881d3e1fefea2b3b480378259ae33b7780824554c46938ada +size 117442373 diff --git a/model.layers.22.mlp.up_proj/NVFP4.pth b/model.layers.22.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..cb392e22cbf7b49df5ac4f165043c0ae13f3f9c9 --- /dev/null +++ b/model.layers.22.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e16f7ea99a4dbb7725fe0cfcada5b6231c9e91586bbfc621c0fe97547f76f30 +size 117442267 diff --git a/model.layers.22.self_attn.k_proj/FP8_Block.pth b/model.layers.22.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..96b5d274df4cb0fba1ea58f30fbc703f2eee6f63 --- /dev/null +++ b/model.layers.22.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce5dd7fa69d01bc42b5583280badd7082afad82a3332bb26c54f10b90c3dcf87 +size 8390455 diff --git a/model.layers.22.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.22.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..8006ee914870d64ebdffb7d036ddaa38a7f3ceaf --- /dev/null +++ b/model.layers.22.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e37d738e76408f2a53aabe532093e0faafb8b36f63d288d703abff750539b8b1 +size 8390469 diff --git a/model.layers.22.self_attn.k_proj/NVFP4.pth b/model.layers.22.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..a750e111d7158d9df5c943d7cde87d434a5a6f4b --- /dev/null +++ b/model.layers.22.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83b9f930275c72f269976a7334d6b998a8613e6d4781a940dfa0aa65375c99e4 +size 8390363 diff --git a/model.layers.22.self_attn.o_proj/FP8_Block.pth b/model.layers.22.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..d689c5a50a24a79acbe4eeab60baa2d5583f783a --- /dev/null +++ b/model.layers.22.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a381519ac6effbb299a3af21966248b080b4d6c08d142d0fb883cb0c9962a993 +size 33556279 diff --git a/model.layers.22.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.22.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b183a7cb18cd7707fd49d557bef6d02e58b39855 --- /dev/null +++ b/model.layers.22.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cc08994bbd923099b54b06ebc4c09f37d9e1914e06ae77ce1690a68a67b54ee +size 33556293 diff --git a/model.layers.22.self_attn.o_proj/NVFP4.pth b/model.layers.22.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..e24020841b4bc846cbecd41e330008570855da3e --- /dev/null +++ b/model.layers.22.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2d4a207b95c0d5e619ae1c37a680bdd2b1e3406aebd20855358f3c5515ea3dd +size 33556187 diff --git a/model.layers.22.self_attn.q_proj/FP8_Block.pth b/model.layers.22.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..63f42446412ad0c6fbffbbc3b5bdbf44b195490b --- /dev/null +++ b/model.layers.22.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbce900c3fa94c008212bd882b77d61cfb26a1ff8cd347ce87c4a1209ae13dfa +size 33556279 diff --git a/model.layers.22.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.22.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..989219d9b744c930c88a25cde4154008ec6d511d --- /dev/null +++ b/model.layers.22.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21429223285ecf00974ed15d54c1e49293eed01697def532d8634622b729baa5 +size 33556293 diff --git a/model.layers.22.self_attn.q_proj/NVFP4.pth b/model.layers.22.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..be2cb2c27954513b76c5741252bb55b0c7b49999 --- /dev/null +++ b/model.layers.22.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7039621db70a4eb370ebe47d12b536ab92938316166abc9d592e0694edc79f73 +size 33556187 diff --git a/model.layers.22.self_attn.v_proj/FP8_Block.pth b/model.layers.22.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..2171861641b14f87652ffc994c8dc3ee66e3faf2 --- /dev/null +++ b/model.layers.22.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3670a006ee8a76f20b55b82a674091d6bfae084130f4a33110001ebd9197fc48 +size 8390455 diff --git a/model.layers.22.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.22.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..56dce71f1a534344fc042bfabfe67e63a8b1eab3 --- /dev/null +++ b/model.layers.22.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6b0677cb6086150f430255658f87419a6839a52450c302c3be498e4ca9719ed +size 8390469 diff --git a/model.layers.22.self_attn.v_proj/NVFP4.pth b/model.layers.22.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..3121a4731281ac5555b331f651fd0a6c9b5d3861 --- /dev/null +++ b/model.layers.22.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6210c6670d028b83af11f5276b7298b6953072e0d4929d26d107b77af8101af5 +size 8390363 diff --git a/model.layers.23.mlp.down_proj/FP8_Block.pth b/model.layers.23.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..ed0eafe61dc4ab20fd32cbedc69991f9d4407ce2 --- /dev/null +++ b/model.layers.23.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63c58d3929b27725d7e2a0bbeb96db5a5b312ab67344814e56a8c4afc86b31f2 +size 117442359 diff --git a/model.layers.23.mlp.down_proj/FP8_Dynamic.pth b/model.layers.23.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..97f9db4ded809556f1a7920b545dba0f87861595 --- /dev/null +++ b/model.layers.23.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c7a6836f77522f174295716136d980747de1cd1213577200af76e1fd90736f +size 117442373 diff --git a/model.layers.23.mlp.down_proj/NVFP4.pth b/model.layers.23.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..a03d43afbdaa46af9709fc1b4f5b4c766281f5fe --- /dev/null +++ b/model.layers.23.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81d39ce37a497a5fa51c9f4811186ceee89cbe29bf97ed83c86fcc6cb5cef008 +size 117442267 diff --git a/model.layers.23.mlp.gate_proj/FP8_Block.pth b/model.layers.23.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..b7ea7c97f48a12483c27d3826242216c84006b45 --- /dev/null +++ b/model.layers.23.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fede0886b576c81549904aabeed61f9f11e2ec702a7b9d33a7b71b4d23a8f72 +size 117442359 diff --git a/model.layers.23.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.23.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b3b96b84a21a2985f0b223593879b128b2c59c0a --- /dev/null +++ b/model.layers.23.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:369ff7721ddced53d0d5e724c07c770346884341ff0fc1eacdeb697298ac3d83 +size 117442373 diff --git a/model.layers.23.mlp.gate_proj/NVFP4.pth b/model.layers.23.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..829b9d500c46ba5fede5c1501f93596a74e39d2e --- /dev/null +++ b/model.layers.23.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eb1f43c456e6cd183f21e032400c9b719ef7faf67d834d2aaa1804239d83013 +size 117442267 diff --git a/model.layers.23.mlp.up_proj/FP8_Block.pth b/model.layers.23.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..fb15422713d4498e49c6270587b18a5970f02347 --- /dev/null +++ b/model.layers.23.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e770d4f65314e9ea7538e221ef3825f7cdf9d3203f249fee4b917fe80077f6 +size 117442359 diff --git a/model.layers.23.mlp.up_proj/FP8_Dynamic.pth b/model.layers.23.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..19a27ea6f194adbdb71e20887d915e72fae0ade8 --- /dev/null +++ b/model.layers.23.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91a75e4fdc67c80969a9cf9c67d2ee1d88a973c8c6bccc7662981bd7b8a8bdfd +size 117442373 diff --git a/model.layers.23.mlp.up_proj/NVFP4.pth b/model.layers.23.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..b033694c45fa4e3349974737ec115426d09eec5a --- /dev/null +++ b/model.layers.23.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:021c1edf77673941183d07a17cbae396671b3ccbfaf2d03d9c82582639d92144 +size 117442267 diff --git a/model.layers.23.self_attn.k_proj/FP8_Block.pth b/model.layers.23.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..763156930c0c1f4a3c875507d46a207b380e3de9 --- /dev/null +++ b/model.layers.23.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d6b24ed6426daec0031e48941746e3bf974c5ea8daa978a018fdfc456b591f1 +size 8390455 diff --git a/model.layers.23.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.23.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..00dbffffbd5d483af8f775af3a37daa46ae8248d --- /dev/null +++ b/model.layers.23.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a47c58871377214e8d4558c9ef3f13eb31a3b5f4bda5befce9c4ee708dc0c3ed +size 8390469 diff --git a/model.layers.23.self_attn.k_proj/NVFP4.pth b/model.layers.23.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..dfbbe300fc4792d364e4a2db1897644a1d89b17d --- /dev/null +++ b/model.layers.23.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad39a1f8b4cc0685008f6d6dedc4ca1a2d6bc04fe9d4d539d891f849141af50f +size 8390363 diff --git a/model.layers.23.self_attn.o_proj/FP8_Block.pth b/model.layers.23.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..805f6e85d25e11f7bff61915ea0b8717e83c641b --- /dev/null +++ b/model.layers.23.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a86dbbb5738bbecd816ad8e41ab995cbea2d929675d6c27cc0b3554e6cdb9a7c +size 33556279 diff --git a/model.layers.23.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.23.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..e7f3b36225c6478e967f8ab6ff076ee85630c59b --- /dev/null +++ b/model.layers.23.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d82e537e80bd3acc214e5666acd0f4f163d34d77c9ab5c98945464640139071 +size 33556293 diff --git a/model.layers.23.self_attn.o_proj/NVFP4.pth b/model.layers.23.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..fd417b19f6220f4f1c91b256278bb10678efcdef --- /dev/null +++ b/model.layers.23.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4600fc53811480bc5d765cd8ae2fa4cfd4d4efe588eeb39f25f70a2c1a8f2bfa +size 33556187 diff --git a/model.layers.23.self_attn.q_proj/FP8_Block.pth b/model.layers.23.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..cf5cee9816bc86b14f7bfee6d17fb7f9a537dfe8 --- /dev/null +++ b/model.layers.23.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e6f3b9119ca6cbe321bb85d01591bf5c818aa3bd12cf6545ea992f19cb5d178 +size 33556279 diff --git a/model.layers.23.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.23.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..796f544dee8fa8c199404764494a047f8d90b4ec --- /dev/null +++ b/model.layers.23.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b228bb67410717e544a2e89d1a1e35547e87a6c15e00cf484160daeeb6dc4f0 +size 33556293 diff --git a/model.layers.23.self_attn.q_proj/NVFP4.pth b/model.layers.23.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..7871eea800db5ab3e741cdbc21ce9b40fa6f9011 --- /dev/null +++ b/model.layers.23.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2126a676efb4eb179ad1d698d903dc8b201c1e8a63d78d5b186998dc559fbcb7 +size 33556187 diff --git a/model.layers.23.self_attn.v_proj/FP8_Block.pth b/model.layers.23.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..a99a498a85aebbb8003b5b8f248918d307dac638 --- /dev/null +++ b/model.layers.23.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:222e58b901908bf9523b71ac53871c08151f4a112f7b314a4e235b4641b3db90 +size 8390455 diff --git a/model.layers.23.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.23.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b51b19d1bb8aacb505827ed4a6cf48e8563b5b08 --- /dev/null +++ b/model.layers.23.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bdf5545cbba6226a9fd692aa8f46e67dce877f5217b6dc00e99539b1be29ec1 +size 8390469 diff --git a/model.layers.23.self_attn.v_proj/NVFP4.pth b/model.layers.23.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..7fbf1345a6197f0ba5736d10f9dd043a84da29bc --- /dev/null +++ b/model.layers.23.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd94d3b8e6946fb62c8e919c7fb5536a27691fc01b6c8153a9e3cfb3ce5bade8 +size 8390363 diff --git a/model.layers.24.mlp.down_proj/FP8_Block.pth b/model.layers.24.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..1176bf1c1a7091e7ea53d1da45403f63185c9339 --- /dev/null +++ b/model.layers.24.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b2d91f831474a08956c525fb26c98c63fda8bf18c285d079ad459033e4cfb82 +size 117442359 diff --git a/model.layers.24.mlp.down_proj/FP8_Dynamic.pth b/model.layers.24.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..442cba032203fa42984fce9ab48a8ee29cbd03e7 --- /dev/null +++ b/model.layers.24.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e71d43fc513cbd7619ce0ef2e00b4f3f9348f1f790c577ef8f9ba4fc98035044 +size 117442373 diff --git a/model.layers.24.mlp.down_proj/NVFP4.pth b/model.layers.24.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..950be8ba6b2987ada1850c2fe85d285ad0de9164 --- /dev/null +++ b/model.layers.24.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06193c16879bb04a0210f8a93ef0b59f59ed9af48c947b37674ba8f3d863c9e9 +size 117442267 diff --git a/model.layers.24.mlp.gate_proj/FP8_Block.pth b/model.layers.24.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..298192314f236fe022b80b741aadb38a18b36cba --- /dev/null +++ b/model.layers.24.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f51a8f343e387c7c50423628a8373e80824c409642c973ccb30a6c5b96dbd2a +size 117442359 diff --git a/model.layers.24.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.24.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b7ec23fc1acb96b8886a964dc6fb61ff1329d591 --- /dev/null +++ b/model.layers.24.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a78bbaf66601a7f4b25d4e80c9ee3ed17f70f37c0c07cb9fb5c19e5e8fef0651 +size 117442373 diff --git a/model.layers.24.mlp.gate_proj/NVFP4.pth b/model.layers.24.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..73e97a1a88e4fc05c3dcdc151a9531fa90212995 --- /dev/null +++ b/model.layers.24.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd19d276b64f281f1da44761d03cafee598a715d588019ba28ed6e2961823708 +size 117442267 diff --git a/model.layers.24.mlp.up_proj/FP8_Block.pth b/model.layers.24.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..9f82ad3de27fac2a22248a478104241b319c3a01 --- /dev/null +++ b/model.layers.24.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2068994e5576e51a8d6daedc48cbe9ba0cdf09d77b1dfdefec8d5ca25707ae62 +size 117442359 diff --git a/model.layers.24.mlp.up_proj/FP8_Dynamic.pth b/model.layers.24.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..d81f78729f84bf950fdf03e5806b754500974e33 --- /dev/null +++ b/model.layers.24.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:611364a5efd5f3a5f2f1dd7ee40ee763af829bfed04da1e9f19c147b6a8b3363 +size 117442373 diff --git a/model.layers.24.mlp.up_proj/NVFP4.pth b/model.layers.24.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..9a1f07bc96edfa3d401a16d4c78dd96663846724 --- /dev/null +++ b/model.layers.24.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3dab73f823b15bb2859af2ad0d495c6ee4e489c0693596aec3b2719cb659d82 +size 117442267 diff --git a/model.layers.24.self_attn.k_proj/FP8_Block.pth b/model.layers.24.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..3985c01bb56f0b91ab5efd709cdd9e72edaf3dfe --- /dev/null +++ b/model.layers.24.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87b7c931fc46fa557df32f11c05e1541ef297b673a7711f7fd4ae1aa8c2886a9 +size 8390455 diff --git a/model.layers.24.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.24.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..83ac3a20c2a715c7f7bae932f431fc0ba575ea53 --- /dev/null +++ b/model.layers.24.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:533a2a49de1ab3fd040b8767f9068e30b78a5cae4dd966f7861afa65eabde5d5 +size 8390469 diff --git a/model.layers.24.self_attn.k_proj/NVFP4.pth b/model.layers.24.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..2bf4cd0bc7b79ae077f535ad5aedbb87ac1500c0 --- /dev/null +++ b/model.layers.24.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8af489b5386407c2cd688e159dcd856c4ab59d0c7a612c30a3720dbd2674f8f2 +size 8390363 diff --git a/model.layers.24.self_attn.o_proj/FP8_Block.pth b/model.layers.24.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..5370f780c29f6dea0d2760787616c505452ea9fc --- /dev/null +++ b/model.layers.24.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b00196b400c2f682d3d68b7311084db2ab35a91c4fdb080198188f50c320d004 +size 33556279 diff --git a/model.layers.24.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.24.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..2d8df40da7ee2b94b56e6b4816bf3b2de6141a41 --- /dev/null +++ b/model.layers.24.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb53d6ccbb983120393d2adf0333debb68dea97b975d237c77b0afe84d18c750 +size 33556293 diff --git a/model.layers.24.self_attn.o_proj/NVFP4.pth b/model.layers.24.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..455b6b139f0ac7049f9061e2ccfbe2d47a70d394 --- /dev/null +++ b/model.layers.24.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ca1e188a4297180c2ab1b4207ced936c58f6abb64c1592fcb33b42828021221 +size 33556187 diff --git a/model.layers.24.self_attn.q_proj/FP8_Block.pth b/model.layers.24.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..fb9bf02d5db4c07e93672682566d437d4b4774dd --- /dev/null +++ b/model.layers.24.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:215d6c8171924b1d03a89ab8432b9a94c7da3fe80ee4c10755ce220a073f8c77 +size 33556279 diff --git a/model.layers.24.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.24.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b9ce3aac0bf3d64eb24a8c577f64fe425eb3e266 --- /dev/null +++ b/model.layers.24.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa5345d9bea75fceb6ed7a4d4fa57481d460d8b3d1599b16f83e2f4daf846f6d +size 33556293 diff --git a/model.layers.24.self_attn.q_proj/NVFP4.pth b/model.layers.24.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..bf31160fde9a72956f2b28bdd5e62728d54257fe --- /dev/null +++ b/model.layers.24.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e900012ddd909e7e7815932af492fd7226a69249248b9234989af7d78146e9c1 +size 33556187 diff --git a/model.layers.24.self_attn.v_proj/FP8_Block.pth b/model.layers.24.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..7327707890cb72f80a948c1dec67f26a47d37342 --- /dev/null +++ b/model.layers.24.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b35caf35b243cca757987afedce551ceb034e90c3e872d840e4f498c6733d4a3 +size 8390455 diff --git a/model.layers.24.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.24.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..00c4683585347c23ba6e8de2db0dbe74cee985cf --- /dev/null +++ b/model.layers.24.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edef38b56ea43a3b376d8d5c440fd4d4c7bfb462debd95ab50031a3658fa7c7d +size 8390469 diff --git a/model.layers.24.self_attn.v_proj/NVFP4.pth b/model.layers.24.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..add6033b24a65845dd8f0c425d9754096b940c4f --- /dev/null +++ b/model.layers.24.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3f6ab41c7a83ae9696c283688d31afe96db7b4dff6b257b5d9c84514c320ee7 +size 8390363 diff --git a/model.layers.25.mlp.down_proj/FP8_Block.pth b/model.layers.25.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..6219f4fad65d6012ec5aab1a620249cec655a627 --- /dev/null +++ b/model.layers.25.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf55bb55d81f530e41ec0aaaa79422d070db19ffa4fcfec117b4cdad991e2152 +size 117442359 diff --git a/model.layers.25.mlp.down_proj/FP8_Dynamic.pth b/model.layers.25.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..f811512fbffe1f48d6b0830f6a5961d89f3d2bf0 --- /dev/null +++ b/model.layers.25.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3607b67a9da64f81cf40d45205d94669e2594c730f959460014527267873abb1 +size 117442373 diff --git a/model.layers.25.mlp.down_proj/NVFP4.pth b/model.layers.25.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..1141094ff71b9fdcf4a27b62e95358c82891ad24 --- /dev/null +++ b/model.layers.25.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec2a0f68dd0dbd4f8ed9cf894bc58d36dadf1a17173dd87809e76e1c5043f2c1 +size 117442267 diff --git a/model.layers.25.mlp.gate_proj/FP8_Block.pth b/model.layers.25.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..35c09b6b22ba5b10b4230a8187ac455b38f09fd6 --- /dev/null +++ b/model.layers.25.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e288d553e72144da79441cb6ba49c8536ac4e72c0660ea333bacc44b247bec75 +size 117442359 diff --git a/model.layers.25.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.25.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..588cb2f0de183b41ffa74888d181ea5f6a4aee6f --- /dev/null +++ b/model.layers.25.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b3bab33eedba7ca1643fb23a0fce5d31aac6430f4185486d6b847db56f86c9a +size 117442373 diff --git a/model.layers.25.mlp.gate_proj/NVFP4.pth b/model.layers.25.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..7920d929a690f322d99722104ca89a2147ee8ca5 --- /dev/null +++ b/model.layers.25.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:225c9bb0945e9ccb99ca8a7ef8687df4ae24c0f5bc4e5e0fb052ab9fb092cb43 +size 117442267 diff --git a/model.layers.25.mlp.up_proj/FP8_Block.pth b/model.layers.25.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..695b85f3459674c1181b5603b777a9f5bb6a8d48 --- /dev/null +++ b/model.layers.25.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccdecceb9136e75cc25a9365e85cc0e5666995f1b16858cd56b1de42966a228f +size 117442359 diff --git a/model.layers.25.mlp.up_proj/FP8_Dynamic.pth b/model.layers.25.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..7fbc2399ef33fa88770b532922c48f57331470d5 --- /dev/null +++ b/model.layers.25.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff0fba543b2d6808a9185b40ac15ce636cd9cc1a7f997440d06c463827e8a5f0 +size 117442373 diff --git a/model.layers.25.mlp.up_proj/NVFP4.pth b/model.layers.25.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..f6ef4286479d7fb9172a8537dad05543033d5712 --- /dev/null +++ b/model.layers.25.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86e84ea6fd53e25ec3a0cac3fb2a53620eb9beb9d05c3027799bb8dc9e4aa26a +size 117442267 diff --git a/model.layers.25.self_attn.k_proj/FP8_Block.pth b/model.layers.25.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..b1aa10d8df1c01a3b83884787133b85104221573 --- /dev/null +++ b/model.layers.25.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:638c109d65012819a5766a348076ce9e3a19dc0ea4cc5604af3341e5317f0c45 +size 8390455 diff --git a/model.layers.25.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.25.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..ac5b124588a4988cb0b5979ab0221be400195689 --- /dev/null +++ b/model.layers.25.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80b91dd3c46ea84301d9cf852188c60d25640f8595aca29b8a1b48a6f83a08fd +size 8390469 diff --git a/model.layers.25.self_attn.k_proj/NVFP4.pth b/model.layers.25.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..6340aae6f1ddab5e818c5e5bca9461e6eff42c06 --- /dev/null +++ b/model.layers.25.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ebd9a45fa7ce15315ceac9e3f05bb422bb7b037bf197f46eff93405f450768 +size 8390363 diff --git a/model.layers.25.self_attn.o_proj/FP8_Block.pth b/model.layers.25.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..f53e8cba693090b9254fa6447863e2157d3f165f --- /dev/null +++ b/model.layers.25.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2008d48622348975bd1c8293bb7366b83c8d00be97b706c0382387b727cc220b +size 33556279 diff --git a/model.layers.25.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.25.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..2cdb89120d15b8604149730607dd943cb5535d13 --- /dev/null +++ b/model.layers.25.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eaa601b19aa8a74df7efc414d029b50087260810cd9214c2c1a24dfa7ef9f22 +size 33556293 diff --git a/model.layers.25.self_attn.o_proj/NVFP4.pth b/model.layers.25.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..e80e7e5b8f96399fbd71e5644b344044c19e8dc5 --- /dev/null +++ b/model.layers.25.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a13081c94284373df8afdc05957695d4c02808d6019d9dad78be651680215b8 +size 33556187 diff --git a/model.layers.25.self_attn.q_proj/FP8_Block.pth b/model.layers.25.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..ef12ac5b3d46efc897b9f679b8d715156d4817df --- /dev/null +++ b/model.layers.25.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54893f9a9801d7af2741a858dde0952d635252dd676b950f86619bb8e3642f0b +size 33556279 diff --git a/model.layers.25.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.25.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..3ed1da1d37339ab16fb139920be4874326f2ea5d --- /dev/null +++ b/model.layers.25.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e97c2241dbe019530e1d9218ccbc3d9f1f48250e4db1a1d4c87f937a0f68fc3a +size 33556293 diff --git a/model.layers.25.self_attn.q_proj/NVFP4.pth b/model.layers.25.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..8ddbb1150bc0215044a374cfbd7f2b9a60a72801 --- /dev/null +++ b/model.layers.25.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c836b276612809b442bdad549efe536afadf22bb94d930357166217ccbdc2a8d +size 33556187 diff --git a/model.layers.25.self_attn.v_proj/FP8_Block.pth b/model.layers.25.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..c470bdabde3d7f8ed3b0c9de6306f99e2c09a07c --- /dev/null +++ b/model.layers.25.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:232287127feb9297aeef60473f6d7dc1666bbf1aa78fde47f41fc791ef9f3ce6 +size 8390455 diff --git a/model.layers.25.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.25.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..c0f0ba4b62d03ea66674363fa379d73be33c7118 --- /dev/null +++ b/model.layers.25.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c33d838a89ae40bd548e5048c6484aea9f8c970739d74f8893707a1533c4bf2 +size 8390469 diff --git a/model.layers.25.self_attn.v_proj/NVFP4.pth b/model.layers.25.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..e0be5b61421730fbf0a0634408439f91992e4beb --- /dev/null +++ b/model.layers.25.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d5cce3784802157d6036f8d17ac9f4f156757a73cd44187213f3f8a8beaabce +size 8390363 diff --git a/model.layers.26.mlp.down_proj/FP8_Block.pth b/model.layers.26.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..175e23e7efdfece7659d1e0d16b9fe1892869d20 --- /dev/null +++ b/model.layers.26.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:395200c25c9ca8ace709996e915b60cc4eae3dd994e853f2b9d305becc84d21e +size 117442359 diff --git a/model.layers.26.mlp.down_proj/FP8_Dynamic.pth b/model.layers.26.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..5d109266989f31fb81553a7dbecbecbc6aff6457 --- /dev/null +++ b/model.layers.26.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36b77fd6696c767a23817bc921a418143dae591ad4908af8ccb91979293879cc +size 117442373 diff --git a/model.layers.26.mlp.down_proj/NVFP4.pth b/model.layers.26.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..adfec59f483a7423db440db957e57709efdb213b --- /dev/null +++ b/model.layers.26.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8eb1cdc46fd297c38a4d3d821b4f9a960b4d2ef85f95aef4ba772bd7d006666 +size 117442267 diff --git a/model.layers.26.mlp.gate_proj/FP8_Block.pth b/model.layers.26.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..f36132fa091dc67618be09774f9d747685f713b7 --- /dev/null +++ b/model.layers.26.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb174c3901c6d083e86fd670f3f9136af51b19bd0ec83158f5264aefb4ba8a2e +size 117442359 diff --git a/model.layers.26.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.26.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..bb020ed0d470d86624ba3525c8cedebe40aea5de --- /dev/null +++ b/model.layers.26.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d28a91091f21190d5223ac82e80b99e3931a1107f41bcbe1fc759150ccb8dda +size 117442373 diff --git a/model.layers.26.mlp.gate_proj/NVFP4.pth b/model.layers.26.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..ad749f59b591c196b0cc2c11f36eccd3fd3bf349 --- /dev/null +++ b/model.layers.26.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f887ab531ef81fa8fa5c29ef3a701a245adf9b61173b3a400a139e06d30e1cd5 +size 117442267 diff --git a/model.layers.26.mlp.up_proj/FP8_Block.pth b/model.layers.26.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..644f20350e845b4376035de987ba8af7c86a011b --- /dev/null +++ b/model.layers.26.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f7380fc16d32d7460911051865e4e85cd01add44dc98031ed7cb31576bee11 +size 117442359 diff --git a/model.layers.26.mlp.up_proj/FP8_Dynamic.pth b/model.layers.26.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..f990b020c8ff1dc38980a7ab9e958a891a53e1b4 --- /dev/null +++ b/model.layers.26.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d689e7369384a3d9c0c84fc09731ea78d20dae4704503e9dd292a808b458d581 +size 117442373 diff --git a/model.layers.26.mlp.up_proj/NVFP4.pth b/model.layers.26.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..689647fdca661fc35f4e674a5ae33861c139dace --- /dev/null +++ b/model.layers.26.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93aec62ed4855b5c3fdd700e00310c548cc9612b59d39746e0f15d711bd50e6c +size 117442267 diff --git a/model.layers.26.self_attn.k_proj/FP8_Block.pth b/model.layers.26.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..fe61c5fa67e38eaf32cea6a9ac6e8dff203118db --- /dev/null +++ b/model.layers.26.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31b057b5766b2d67f01b5adaf95f1f6f8a0cde65ffc0eae777ee6a9fc693b18d +size 8390455 diff --git a/model.layers.26.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.26.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..d2260de687d0c0ce6491081ba678999dd08bbc1a --- /dev/null +++ b/model.layers.26.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f93637594c63195f7add2ac47e4e9097e236276f0d53b733ec1b6f8804641249 +size 8390469 diff --git a/model.layers.26.self_attn.k_proj/NVFP4.pth b/model.layers.26.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..afb11f3a06ee5335f64375f8f26f351b907d2901 --- /dev/null +++ b/model.layers.26.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eed0e77e3188e9c38e4a934b7fd5de7fd765d4de6dc5e7f20c9c6cc0990228e2 +size 8390363 diff --git a/model.layers.26.self_attn.o_proj/FP8_Block.pth b/model.layers.26.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..9730f55c49aad2967a782cb4f5c6e9f461113538 --- /dev/null +++ b/model.layers.26.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:365b4223d152583710fc5d347cb4a101009a5b2d346b5192ff7b1b76eff450aa +size 33556279 diff --git a/model.layers.26.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.26.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..cc7fda51f1495942cc43afe3440082fc93d2c7cb --- /dev/null +++ b/model.layers.26.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5026fe049cb086c4802db11e42d535f5760a194ab735d2030ff0ca4caddf4551 +size 33556293 diff --git a/model.layers.26.self_attn.o_proj/NVFP4.pth b/model.layers.26.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..f309866b62f2e8cc773c77e6b369639629173b2e --- /dev/null +++ b/model.layers.26.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:192a443ae461bb560a945e2db745ca60636937c6f67041844c0f7620ceab7a73 +size 33556187 diff --git a/model.layers.26.self_attn.q_proj/FP8_Block.pth b/model.layers.26.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..7d147daa7c5674030920f11ee603d906109d347f --- /dev/null +++ b/model.layers.26.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:953673df161f6fdd6b0a10d8affbd9997871fe299f5d241bd511f7727a47a409 +size 33556279 diff --git a/model.layers.26.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.26.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..f486072cf25080b1d7c3a271d71a8278c45e0652 --- /dev/null +++ b/model.layers.26.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b69eb9b0fa92444daf66afc1b3f2976998b12a6b0f5f4e6cfb8443eb6e0868a3 +size 33556293 diff --git a/model.layers.26.self_attn.q_proj/NVFP4.pth b/model.layers.26.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..3b120b34924212cf5d0c9601837902900cf887b8 --- /dev/null +++ b/model.layers.26.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a3b0efe516ba3cf70b544565ceeced07df4e7aecec00a66d949ca648b7ca7b1 +size 33556187 diff --git a/model.layers.26.self_attn.v_proj/FP8_Block.pth b/model.layers.26.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..4d4137d7032dd1ea8d404d884866307ea6d29ce3 --- /dev/null +++ b/model.layers.26.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40dca7817b334f4837f5e9d65c7a1dd3da2f284c5e812c96c57b620e992709a8 +size 8390455 diff --git a/model.layers.26.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.26.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..ec89499101301ea7dff6c86d63a1808f87be4a90 --- /dev/null +++ b/model.layers.26.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:999300eb2b29cbd6a58e2225a45ef377cf7d9929521508028ab67b23d14b41d2 +size 8390469 diff --git a/model.layers.26.self_attn.v_proj/NVFP4.pth b/model.layers.26.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..6d7cc46fc17db98d439899fe1758ca23cb4bc4a9 --- /dev/null +++ b/model.layers.26.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a6eb3344ab2cf8b817b5ec338b526a5fe39c6d81bc02201500d0f9a0b9fd913 +size 8390363 diff --git a/model.layers.27.mlp.down_proj/FP8_Block.pth b/model.layers.27.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..1a612ae3a5e3e5dc9882107c0472ca7cae5ec55b --- /dev/null +++ b/model.layers.27.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3070187b6754e13f1b3156c202329e2b0d159cd834d82dba7d21c148df5b057b +size 117442359 diff --git a/model.layers.27.mlp.down_proj/FP8_Dynamic.pth b/model.layers.27.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..4d9f4ff6c8a1fe9575b39cfdeee9146e9ac738e3 --- /dev/null +++ b/model.layers.27.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a656a6faa7b880380e326ff846510bb4f5238087a2cfbe0753647871a49cda50 +size 117442373 diff --git a/model.layers.27.mlp.down_proj/NVFP4.pth b/model.layers.27.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..963cbadd7c58be93d77f3bf6673f6e0130b62be3 --- /dev/null +++ b/model.layers.27.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e45f0172b8b01bafc13a3653a12949a6b9f010ac6248358389c0d0cf522cc393 +size 117442267 diff --git a/model.layers.27.mlp.gate_proj/FP8_Block.pth b/model.layers.27.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..03aa2e7e80910f02cbaf4d90621d093f6c9cd77c --- /dev/null +++ b/model.layers.27.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:856914927b8b7fb4db9f47e56fa3346f2d33b6359862b4e520d3ffe47f0d6655 +size 117442359 diff --git a/model.layers.27.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.27.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..104be5906de53b0c0fe3735882cd4f69df00ba02 --- /dev/null +++ b/model.layers.27.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e746e63413353d620edd126c966425fac0c931f1ce90ef9e71af9ebf68cc5707 +size 117442373 diff --git a/model.layers.27.mlp.gate_proj/NVFP4.pth b/model.layers.27.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f3d7a0021f6719affe9a4af174cf3922083f7fc --- /dev/null +++ b/model.layers.27.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79ecd7114dff199d78ee352ee52bdb799ac147bf8ea64fab5af5b63f79b04fa4 +size 117442267 diff --git a/model.layers.27.mlp.up_proj/FP8_Block.pth b/model.layers.27.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..61584af5d75c745687cbb287054786f5ee191423 --- /dev/null +++ b/model.layers.27.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91177ec511dd729902361634e3667ec634162f94d0b4111c6ddc04f186fa856e +size 117442359 diff --git a/model.layers.27.mlp.up_proj/FP8_Dynamic.pth b/model.layers.27.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..e13e79ccedcfdb0f46522e003295c23a977a7165 --- /dev/null +++ b/model.layers.27.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:241d68bba140da6cf93f78ea7b6c35aefc35a08a9f2e7eb57d3183d0abac97e1 +size 117442373 diff --git a/model.layers.27.mlp.up_proj/NVFP4.pth b/model.layers.27.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..a6044087c00cfe0c490040dfff9ab2145d1072f8 --- /dev/null +++ b/model.layers.27.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6f77b3c138db2932f348346d39ab761c32f43e087d619480769d479c5992ff4 +size 117442267 diff --git a/model.layers.27.self_attn.k_proj/FP8_Block.pth b/model.layers.27.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..232f5071d2df6701a5d86b69766aa96a5de0d7f6 --- /dev/null +++ b/model.layers.27.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3884a736df9bec213e912bd30cf1ed7ccc642172b070b274ffa42d5d212cc344 +size 8390455 diff --git a/model.layers.27.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.27.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..5fc474780af35f58cccf99857b31ace5ec53a6e8 --- /dev/null +++ b/model.layers.27.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3e8426e2f3acaadeceb74fd831dd2eee8d6b0dca72c5aff6a3d4703cf7508dd +size 8390469 diff --git a/model.layers.27.self_attn.k_proj/NVFP4.pth b/model.layers.27.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..0b959768e69d309b00e8611d2d10802f5a3dda68 --- /dev/null +++ b/model.layers.27.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3ec54ba557912df2d93de568ed2d1708faba6d1a1b21a6feccee9061bbc1d6d +size 8390363 diff --git a/model.layers.27.self_attn.o_proj/FP8_Block.pth b/model.layers.27.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..707903fa59c26efb620987ba5298afd35efbe6c2 --- /dev/null +++ b/model.layers.27.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:754a22d74da146ed132cefdd6e4a8baf45e18170c9c4556b8cc29d15fb6c4044 +size 33556279 diff --git a/model.layers.27.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.27.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..e44d3d0464e0bc83cccaf52653bde6101b89ed19 --- /dev/null +++ b/model.layers.27.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d61d93b0b9f33cc18623928c59853d858a8e348125a255cde65282bb75522b6 +size 33556293 diff --git a/model.layers.27.self_attn.o_proj/NVFP4.pth b/model.layers.27.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..31c1db3ba36ac50b53e07cc79ea71f475119ac43 --- /dev/null +++ b/model.layers.27.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9460a7bfcf679b273810c7115832ce84f891086140af5391ffd68ab82bcfb348 +size 33556187 diff --git a/model.layers.27.self_attn.q_proj/FP8_Block.pth b/model.layers.27.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..768dabecdda1463efb0a89f1455a0725ac81d820 --- /dev/null +++ b/model.layers.27.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c74ab82343bd8843a4230fe6492e949a5138a6cdd562d4d8f2075b4ec3502034 +size 33556279 diff --git a/model.layers.27.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.27.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..98537a912ce83339f6740cc8d8d932d55d50a26b --- /dev/null +++ b/model.layers.27.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80c2b3411f4eccae3b0975d9201ceb535223b87a9c6bcdd58e910f16c64c728c +size 33556293 diff --git a/model.layers.27.self_attn.q_proj/NVFP4.pth b/model.layers.27.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..0635a4fa7ad18ed46fa4a997a9216fb65e6611ae --- /dev/null +++ b/model.layers.27.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d856b2a063dbd142e65b21a0ff7739d456046638d9d53813da4428dfbb0157e1 +size 33556187 diff --git a/model.layers.27.self_attn.v_proj/FP8_Block.pth b/model.layers.27.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..73ef79054df281eef72d2e4a4f25168bef0778d4 --- /dev/null +++ b/model.layers.27.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2aaec8f1a2bbe9b72b7b6cd4c85d4666f6cacbbd4751c97e899a630489e57c8 +size 8390455 diff --git a/model.layers.27.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.27.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..e51e06c670e31abca712aae6a8c6a3280d329358 --- /dev/null +++ b/model.layers.27.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:957ce016c6b6d795bdcf3df5c39c9469348840bad34f9e5aa3b4c2e5939f69ab +size 8390469 diff --git a/model.layers.27.self_attn.v_proj/NVFP4.pth b/model.layers.27.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..aeb20e27cb0a98a55198be3797d148f067fc5dc7 --- /dev/null +++ b/model.layers.27.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bba5290f7ed95f78cf0f7b0214bc924f97a3f30181552b30f7fda93aea1a891a +size 8390363 diff --git a/model.layers.28.mlp.down_proj/FP8_Block.pth b/model.layers.28.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..7ffacc222efe702ccf3d2573764733f73d73c3a1 --- /dev/null +++ b/model.layers.28.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a04a16252d5d998e836b9312a5979bbb34f4ac411077ae473defdaabda0efb6d +size 117442359 diff --git a/model.layers.28.mlp.down_proj/FP8_Dynamic.pth b/model.layers.28.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..8da927ff3e3fded34d8f8f22fbc00ce2b6060009 --- /dev/null +++ b/model.layers.28.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7552046838c02f31c88c9f365ddd89ffdf01f11a7aff91d95766e37df6a96ec0 +size 117442373 diff --git a/model.layers.28.mlp.down_proj/NVFP4.pth b/model.layers.28.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..f7553fce579c1a666fa7b9a0fbb491e610b7a0b9 --- /dev/null +++ b/model.layers.28.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:331f3af74eaa8aeb94f393aeb13ab8bd25aeb40d458f08d1be586297a28b1659 +size 117442267 diff --git a/model.layers.28.mlp.gate_proj/FP8_Block.pth b/model.layers.28.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..f0b042cf773d02f3b10ae43b9c1f27d34c136f1f --- /dev/null +++ b/model.layers.28.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53ee1b025185e84d74b3e58e56afcd6b89cb014f56e4e5e900b89c418628eeed +size 117442359 diff --git a/model.layers.28.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.28.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..9cfc4ea83e4d35bfabd532ec69418129704768f5 --- /dev/null +++ b/model.layers.28.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41ad4e314d14afa97103f79f622ac463068500a7f6dec924acf8e6865b49461d +size 117442373 diff --git a/model.layers.28.mlp.gate_proj/NVFP4.pth b/model.layers.28.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..646586ea4ebba48a8da64d7847a84aa491443457 --- /dev/null +++ b/model.layers.28.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5d466d0f74dabb0872340f8c823a36733d91d3f20dccf6959c39651e6f3b7ef +size 117442267 diff --git a/model.layers.28.mlp.up_proj/FP8_Block.pth b/model.layers.28.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..abb70aac6de818c9fc3f1893c6f2c2246188c7e2 --- /dev/null +++ b/model.layers.28.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1308168dd9ef2832121764064986fbbb64240b23d1f75c7dbc056436be9f9f1 +size 117442359 diff --git a/model.layers.28.mlp.up_proj/FP8_Dynamic.pth b/model.layers.28.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..4a5e7e0f5dc517992fdf4e95438736926d7c007f --- /dev/null +++ b/model.layers.28.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcb5f3898a3ce02e9b1a63ac10466b214b69deb1cc4bb803623da44e48ed49fa +size 117442373 diff --git a/model.layers.28.mlp.up_proj/NVFP4.pth b/model.layers.28.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..ef0be84f2526c63d97280eebd12bf30ecdd3adeb --- /dev/null +++ b/model.layers.28.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc92fe981c7ed673e2c6ba51362802efae5a09ec5a4371b2dc453178304410ba +size 117442267 diff --git a/model.layers.28.self_attn.k_proj/FP8_Block.pth b/model.layers.28.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..cf521e418f67d7870bc50185b0a1da4f0d55e7b6 --- /dev/null +++ b/model.layers.28.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0084e55119c9121d92dce0eba9af4be2c945e3c6f58e737d62009c378179ac27 +size 8390455 diff --git a/model.layers.28.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.28.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..4b69cbf9b377057db314cc5d5ed8b8cadac4230f --- /dev/null +++ b/model.layers.28.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a829aad77809d2291fc3e0cde543ce08284110ef1491879a7912809dfdc0f387 +size 8390469 diff --git a/model.layers.28.self_attn.k_proj/NVFP4.pth b/model.layers.28.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..c4474625d7c991c66856223255d5a51e5e0d6e25 --- /dev/null +++ b/model.layers.28.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a31de9eac151a62d16fdd976621894de9694dcffc485982b5b1ec42328a0e88 +size 8390363 diff --git a/model.layers.28.self_attn.o_proj/FP8_Block.pth b/model.layers.28.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..13b378c888534d3514c76454c93b4dd37ff5cdca --- /dev/null +++ b/model.layers.28.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea3923099628b0d90f9ccfe71185699e061a968d96711c0eedf8c56f2e529f36 +size 33556279 diff --git a/model.layers.28.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.28.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..e7f9f89e83a9703ac527025e854940bad87c09d9 --- /dev/null +++ b/model.layers.28.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ca38c5fd5687e70806e4da8cb3352550310194d4070f80e4d50476bafadf943 +size 33556293 diff --git a/model.layers.28.self_attn.o_proj/NVFP4.pth b/model.layers.28.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..54cd75463403c954db5ec8888883231a2d34a0f5 --- /dev/null +++ b/model.layers.28.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3502889ee8b01830ede29fa717db178db80ab952dd37f9f95625bd4dbe54baa6 +size 33556187 diff --git a/model.layers.28.self_attn.q_proj/FP8_Block.pth b/model.layers.28.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..02930c87956010cd0fd23c6677841ee592e137bd --- /dev/null +++ b/model.layers.28.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6e669243dd58a6fab82d4950ec56455bbb97e7ae0c2cb62e5ad89697046826e +size 33556279 diff --git a/model.layers.28.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.28.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..eb9796c218f9d760a4c0b62f78620b4f71e258a4 --- /dev/null +++ b/model.layers.28.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e95867b1a2f94adae907b73801a9c11e5743919e8285c6acb910314d8df58622 +size 33556293 diff --git a/model.layers.28.self_attn.q_proj/NVFP4.pth b/model.layers.28.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..fcc30a5995c9d803a6986acf8b70095e528560fe --- /dev/null +++ b/model.layers.28.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40ced6269f6bcb245c166a6a0897b20cf2474d58abf76424c76596bcf7da11c9 +size 33556187 diff --git a/model.layers.28.self_attn.v_proj/FP8_Block.pth b/model.layers.28.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..75c09bb4e7d94355ff11fb22f515115bd697943b --- /dev/null +++ b/model.layers.28.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20219044e35806bb66041ed220ee05b70331c4515b47b6ff4ef124b424feadfa +size 8390455 diff --git a/model.layers.28.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.28.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..ecde7b935b628e8b8822374217d8f76f8234bd5c --- /dev/null +++ b/model.layers.28.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3d3f386766c007e79cc82b004ea1d42d0bc8f7ae62bfa360990a2bd10333c14 +size 8390469 diff --git a/model.layers.28.self_attn.v_proj/NVFP4.pth b/model.layers.28.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..0cab93ca599bb889598440a5d59c86aebe0037d1 --- /dev/null +++ b/model.layers.28.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd98cd0667063335390b174a948e596cd1c7066c6326aa89715690ce62720f2f +size 8390363 diff --git a/model.layers.29.mlp.down_proj/FP8_Block.pth b/model.layers.29.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..9d7be4a796bfaf98df1863a67d4ad571d42a5d6b --- /dev/null +++ b/model.layers.29.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0b6906968102b465f8d07220046e7074c21826bb3f5189e0cf84170b2d86a0c +size 117442359 diff --git a/model.layers.29.mlp.down_proj/FP8_Dynamic.pth b/model.layers.29.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..ffc0b13c83d5d13678d721d90763db9e1ad5dbba --- /dev/null +++ b/model.layers.29.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a58938d34d56bcbbe135700ab829ed9900e43e571de8c9805981be6eab1e6c1 +size 117442373 diff --git a/model.layers.29.mlp.down_proj/NVFP4.pth b/model.layers.29.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..a047d189fea7841a70d16e9074727bd4cab0445e --- /dev/null +++ b/model.layers.29.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23b0ece1a838f8598944a5a277b7638c1601444ab9a3d268ed6e709fdbe91f81 +size 117442267 diff --git a/model.layers.29.mlp.gate_proj/FP8_Block.pth b/model.layers.29.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..a6a6dd47657302a72ece958dd0c18474daf104ab --- /dev/null +++ b/model.layers.29.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a1bf982d8a78b3c943491e33f1c2c5966ab1ea41b0971628e3754488d083ecf +size 117442359 diff --git a/model.layers.29.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.29.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..8f44582c68f977aa07d174f589393024dcb9ed71 --- /dev/null +++ b/model.layers.29.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab1fbccd20545dad741575d3600cd447877626298e18f5b1c8a63375152cf287 +size 117442373 diff --git a/model.layers.29.mlp.gate_proj/NVFP4.pth b/model.layers.29.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..6a2352de58eabacddcfd9e88cbf3cbfce31595a4 --- /dev/null +++ b/model.layers.29.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e572d0426e419973f9157b0bebfcf07cd468e2694e465aa54b7ed54fae5f856 +size 117442267 diff --git a/model.layers.29.mlp.up_proj/FP8_Block.pth b/model.layers.29.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..b886751cea1cee723496603f0d2f7acf5063e592 --- /dev/null +++ b/model.layers.29.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed671383ec56ab2d46718239d76e7377ccec157a57cddb7cd334edc0f459a105 +size 117442359 diff --git a/model.layers.29.mlp.up_proj/FP8_Dynamic.pth b/model.layers.29.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..6a085a0cd0a7e4bc209c7a8a278f047016dbf622 --- /dev/null +++ b/model.layers.29.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c250ef8f1265759446d6e479703bc86ab858827148a13d129773533d13db071 +size 117442373 diff --git a/model.layers.29.mlp.up_proj/NVFP4.pth b/model.layers.29.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..d85cd9d96ad10d60412a2f14fba7740033d2f534 --- /dev/null +++ b/model.layers.29.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dae6e956b14a6da4d41e84e7ce0036f0a371f15136f6656591ba621ddf05daa7 +size 117442267 diff --git a/model.layers.29.self_attn.k_proj/FP8_Block.pth b/model.layers.29.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..fd00725d2e96bbdbba31bb391840f32d02c99579 --- /dev/null +++ b/model.layers.29.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7af262ac61340a7823e4b9affc13535984a6bb934921040fcf56e19e8d739f5f +size 8390455 diff --git a/model.layers.29.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.29.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..f225c363ca70c186252781b60bbce86a84686544 --- /dev/null +++ b/model.layers.29.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5be0eaddd8244c8920e62cfadb2640a2499508986ef2e8afce878c38a50f5154 +size 8390469 diff --git a/model.layers.29.self_attn.k_proj/NVFP4.pth b/model.layers.29.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..b8d8d45891a22c868d64086f163b050b1037709c --- /dev/null +++ b/model.layers.29.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4a31e590a80efc43e2c535e0c492f4a58b8f4b8bc3a05aac8a649006c7d5189 +size 8390363 diff --git a/model.layers.29.self_attn.o_proj/FP8_Block.pth b/model.layers.29.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..a47360bd66d0de18319b9c332de44d3b85b4c970 --- /dev/null +++ b/model.layers.29.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:509da1b476185034eb150ebc08d355fa386ee34c828b7794baef719a00725176 +size 33556279 diff --git a/model.layers.29.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.29.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..0e6c8f7a35c4c1c7ab089599d81be02a8f874814 --- /dev/null +++ b/model.layers.29.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de2bbb78b4fa5854c9814c9436be83cea235691da7568ac7bd48c42ab04e6d80 +size 33556293 diff --git a/model.layers.29.self_attn.o_proj/NVFP4.pth b/model.layers.29.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..83180ee763104a48322bf8ad93524f83715b2fe4 --- /dev/null +++ b/model.layers.29.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6906650bb8f56259fbf95e324d5de4d594265f98cf2232f157e574b5d4e8e9e2 +size 33556187 diff --git a/model.layers.29.self_attn.q_proj/FP8_Block.pth b/model.layers.29.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..4917cca6679f6c092be06093ff74e3282a72a196 --- /dev/null +++ b/model.layers.29.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fbce1b56af80f7fb595eece189ed508c6af0f906ba33ecfb93d52348f36fa88 +size 33556279 diff --git a/model.layers.29.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.29.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..41fe09dcbefb00c561cfd996f0214c71f406642c --- /dev/null +++ b/model.layers.29.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccab8afc7194b6022bd506efd824cdfb13c0587cefd37b0a23c2356362d38dfa +size 33556293 diff --git a/model.layers.29.self_attn.q_proj/NVFP4.pth b/model.layers.29.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..91138a17e4de68b01238818b66d0ec0de8c3683b --- /dev/null +++ b/model.layers.29.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef240fb6fe5ad85a8113efa5d08e8e46e36a7827b3caa40306c943ed3d8a171b +size 33556187 diff --git a/model.layers.29.self_attn.v_proj/FP8_Block.pth b/model.layers.29.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..86df28a0e50d271bac09ef3642b1cce71e91aae3 --- /dev/null +++ b/model.layers.29.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16c53ee66d1199bbbe1c28539898d2d9ce725c6a8b4cc3200cad2e18a7b36a1d +size 8390455 diff --git a/model.layers.29.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.29.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..58b3ad7b5152b6c5e580945d6e116a47648cf6c0 --- /dev/null +++ b/model.layers.29.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99f4da6352f2f700146e23b381942230205e95916c09a7c14212ad4d615c635f +size 8390469 diff --git a/model.layers.29.self_attn.v_proj/NVFP4.pth b/model.layers.29.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..9afa545372fb0da279650fc5e9bed0b10000ec81 --- /dev/null +++ b/model.layers.29.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd87539be8fc3516cbdb51c373830fc6b2fb5972dd3bbccba8c4c61085925ba +size 8390363 diff --git a/model.layers.3.mlp.down_proj/FP8_Block.pth b/model.layers.3.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..c0f1ac1c567f01062d0e2b5e6b7e1d50a28ffc64 --- /dev/null +++ b/model.layers.3.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c09a2ee51088748a8fbc86de8621e227ac2906447a36d78a642b80e3dad5989 +size 117442359 diff --git a/model.layers.3.mlp.down_proj/FP8_Dynamic.pth b/model.layers.3.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..7c7e685b26a871505a58692c3109f608ba74afa5 --- /dev/null +++ b/model.layers.3.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e60508860ac5113f56d8d6f5129378bb4217b6a0e0a760c19ac51cc4e0c8ab20 +size 117442373 diff --git a/model.layers.3.mlp.down_proj/NVFP4.pth b/model.layers.3.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..2511169c7024a68a9f06a9d8478923a95d70a18e --- /dev/null +++ b/model.layers.3.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1f3f60024f9d8e559139f641866c1019df76c99554dfa7db087e6e24664f3ad +size 117442267 diff --git a/model.layers.3.mlp.gate_proj/FP8_Block.pth b/model.layers.3.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..b1bdaffaeb96bb13cf43daed5bffaa6365af4512 --- /dev/null +++ b/model.layers.3.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f670e4b0ca7dfc22ec19c0b9ff1c20621976e43601292ea331388b2de2821644 +size 117442359 diff --git a/model.layers.3.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.3.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..9f9aef758848ab1d0f53c1d32bcdee6a1fdd9243 --- /dev/null +++ b/model.layers.3.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdcb8757dec0b0115d2281eccdb15be9bd76ac8d2c656630ea616259f2064705 +size 117442373 diff --git a/model.layers.3.mlp.gate_proj/NVFP4.pth b/model.layers.3.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..0769e4929f7c82a1f68c7ef12a6b29638767d27d --- /dev/null +++ b/model.layers.3.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2126e14f4fb8f2efb1377a9e4b269c814e7ad265ff04de223315c4742674360a +size 117442267 diff --git a/model.layers.3.mlp.up_proj/FP8_Block.pth b/model.layers.3.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..a00325b45709a29b83543101199cdf341ff96e98 --- /dev/null +++ b/model.layers.3.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe4b19a0c607ea8c053b2b3e6099056a150c53671188b896e56a282999431e61 +size 117442359 diff --git a/model.layers.3.mlp.up_proj/FP8_Dynamic.pth b/model.layers.3.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..daf81e30ce21c040d51ae3526fe0caa03fc296d4 --- /dev/null +++ b/model.layers.3.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f50525f9608cc431ed5d9187595226101a04ae490b25ea24fc774400f597f6f0 +size 117442373 diff --git a/model.layers.3.mlp.up_proj/NVFP4.pth b/model.layers.3.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..22ab335bef3083db40018bec52acd1e47696f8d5 --- /dev/null +++ b/model.layers.3.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eeb8cf660d7e42d4ab58ce8a4b91597fd8bdff4e4519642a48f77686efb9f93 +size 117442267 diff --git a/model.layers.3.self_attn.k_proj/FP8_Block.pth b/model.layers.3.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..8e396f68e25ba180fc3c14d8b1cc570fdd28dce3 --- /dev/null +++ b/model.layers.3.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3012f1147cd77ad58b41c5879f9885fe5f7494f2b1c05f253c02b01bf5b1b7b9 +size 8390455 diff --git a/model.layers.3.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.3.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..a3ea91e4f6a7eda8c9fd2932ad20a9444a7ce44a --- /dev/null +++ b/model.layers.3.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14caf39f947a9b7403284681ac70149338d43e8914e1d10ea6ba3e3739949bef +size 8390469 diff --git a/model.layers.3.self_attn.k_proj/NVFP4.pth b/model.layers.3.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..97742b356bf2bb9d19d5dbc54bc418b172d3d0b7 --- /dev/null +++ b/model.layers.3.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33d6ccf03ddaf69ed026b5d2aa7ebc9fc6f6d34ea18d556c2ededdb153d8e2f3 +size 8390363 diff --git a/model.layers.3.self_attn.o_proj/FP8_Block.pth b/model.layers.3.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..3f0dd3b538c5624e1a8082d5d9921e28eab4e429 --- /dev/null +++ b/model.layers.3.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec9bc0737e0b95a4c77ecbba62b9acae7a5e2b22c1721961fd402a607b379a78 +size 33556279 diff --git a/model.layers.3.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.3.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..2fda13db3ff79243edaff74d4f47bc68128dddfe --- /dev/null +++ b/model.layers.3.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cefc04f876666b195d1afa47cc704bcc176b7c1ca15f3ea107e0333f9d855d20 +size 33556293 diff --git a/model.layers.3.self_attn.o_proj/NVFP4.pth b/model.layers.3.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..bbce41dbd73c6b4bef2a1d27cca5320531857b25 --- /dev/null +++ b/model.layers.3.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1254be5b997eec818c13764bf1deb7ff807df59686365f2fa87b53791198a21e +size 33556187 diff --git a/model.layers.3.self_attn.q_proj/FP8_Block.pth b/model.layers.3.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..1146d852312043b8f20f6f2507d34fd341e5a73b --- /dev/null +++ b/model.layers.3.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e057aa111bc8340ac1e4f882fa9fc9af0ef72a3c1532a15426678759f7452c9c +size 33556279 diff --git a/model.layers.3.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.3.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..c46d0252884d1fa2bcf6165f8b5a9c74ecdca221 --- /dev/null +++ b/model.layers.3.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aab580b0c4245868197740bfc1b3ffb363cb30d89f146e7e9c704ccbe73bd495 +size 33556293 diff --git a/model.layers.3.self_attn.q_proj/NVFP4.pth b/model.layers.3.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..1784c14919088d129ac53290566a6afd53c397ce --- /dev/null +++ b/model.layers.3.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b97524bd5aeb31357a5b009b77c6eb6144fa91c216199b92fcefef8ef2c06434 +size 33556187 diff --git a/model.layers.3.self_attn.v_proj/FP8_Block.pth b/model.layers.3.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..fac1eaa1e187a42b34a8624101cddac29bf7e2a9 --- /dev/null +++ b/model.layers.3.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a96a0653752a9c363487cf2c8d6d3e6753cc42d08dfbce77e05da0aea90291d2 +size 8390455 diff --git a/model.layers.3.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.3.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..a66fcf5acb5623dc8d78f6df38e30762a470d898 --- /dev/null +++ b/model.layers.3.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8db2e18d5991c513b7ad9b7f89de5be58bab0a2f6a5bef658637dfc8936aa450 +size 8390469 diff --git a/model.layers.3.self_attn.v_proj/NVFP4.pth b/model.layers.3.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..50d351d0fbfd91cd852b653c03f64b030c5890d0 --- /dev/null +++ b/model.layers.3.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a2d78b93c15255ae53266d60cf0c62227faf061f3d75fd4232f972499dbfb25 +size 8390363 diff --git a/model.layers.30.mlp.down_proj/FP8_Block.pth b/model.layers.30.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..375842907cdb1e2760683ae30fbce5b2a1feb134 --- /dev/null +++ b/model.layers.30.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:708291267d337ad86bc5d4161b026feb99f39ef1e2b1bf92eb9d9b90c5eeca03 +size 117442359 diff --git a/model.layers.30.mlp.down_proj/FP8_Dynamic.pth b/model.layers.30.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..53fe6afe4d336f06bf9d6e2605b44280732e069d --- /dev/null +++ b/model.layers.30.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7fd25aca7c2d28156951b7a4a28bfdb398de746b68f74fd56137b8867e05305 +size 117442373 diff --git a/model.layers.30.mlp.down_proj/NVFP4.pth b/model.layers.30.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..4a354746d802648d3865e94e60f6bcbcdd91d55f --- /dev/null +++ b/model.layers.30.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75472e4783ebc1ad70544e35317836aeef1d0a7f4c433bd81c3cdea79a487307 +size 117442267 diff --git a/model.layers.30.mlp.gate_proj/FP8_Block.pth b/model.layers.30.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..bf0ea7d3e590521fa20bbeebb11e1f6b087a76e9 --- /dev/null +++ b/model.layers.30.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9dc2d4f2d3b375537fa41d9e4de32a4e215f947572c9729cc260de85a6f12a0 +size 117442359 diff --git a/model.layers.30.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.30.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..ac42e4a10e967ce1b4bac2e37471a63edc789e87 --- /dev/null +++ b/model.layers.30.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae6dd9b3dc47aac6ebc44c14fa87b53cdfcc94b18b3954115511f196b4eb743e +size 117442373 diff --git a/model.layers.30.mlp.gate_proj/NVFP4.pth b/model.layers.30.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..78819e46fdc81b0864feef975a84aa6b49f07302 --- /dev/null +++ b/model.layers.30.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c99d55cd1f622652f2eebdf7dbc347ade5d2a6bcfed6618543761d93b9280351 +size 117442267 diff --git a/model.layers.30.mlp.up_proj/FP8_Block.pth b/model.layers.30.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..2b52c686a12d3c08ab3856e4457138dd41a807bc --- /dev/null +++ b/model.layers.30.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91ed73741d1d0b892314796a42f42311096894d23d8c4f5d594e616818dd0ca5 +size 117442359 diff --git a/model.layers.30.mlp.up_proj/FP8_Dynamic.pth b/model.layers.30.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..f0a07d2cbcfce5bc765e95cd8c0121ba05263c13 --- /dev/null +++ b/model.layers.30.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1ead8e59ea1f3f649cb636d4dbec046cef90f2a9abec64bb54429166e31138c +size 117442373 diff --git a/model.layers.30.mlp.up_proj/NVFP4.pth b/model.layers.30.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..ca3e7d99a00ab0786211588930fb544e75578443 --- /dev/null +++ b/model.layers.30.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bd20ceddcdb50e60fef2bbc53fa1a68f0ea88abf473c5464734b7be8bd2f234 +size 117442267 diff --git a/model.layers.30.self_attn.k_proj/FP8_Block.pth b/model.layers.30.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..4ddbdd812106d97f51860af66e84450aa3b79cc2 --- /dev/null +++ b/model.layers.30.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:258712523145022e6c868a6c5151966dc2a4cf12364450935657c7b1791b21a7 +size 8390455 diff --git a/model.layers.30.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.30.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..eccbf7d594a34f2f0d4e290584a70ea36f720f7b --- /dev/null +++ b/model.layers.30.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4eca75fac17d3a1767957adcda061268d391f10fa98e2d6403d93b886d41c524 +size 8390469 diff --git a/model.layers.30.self_attn.k_proj/NVFP4.pth b/model.layers.30.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..3bcccd77956e92a73a5b979ddff91fa10adc0a87 --- /dev/null +++ b/model.layers.30.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1a67d0b4e0a3b57e8c42d3a28af74eb20361eddbbdb7770edf270326f5dabb9 +size 8390363 diff --git a/model.layers.30.self_attn.o_proj/FP8_Block.pth b/model.layers.30.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..555bc01f7af16bab8a4ed34f731ce6f51391c495 --- /dev/null +++ b/model.layers.30.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a79e0d1970a245c3299dcea8d8d211e6e00983dd51b211e1db51d3489f2149a +size 33556279 diff --git a/model.layers.30.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.30.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..1c34eb88f365adeee984e0bf9a7aa562b8d6ccae --- /dev/null +++ b/model.layers.30.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90d69748c322f66b999199d9baa44c3db3c362965950c50a11ef8bf50ccc840f +size 33556293 diff --git a/model.layers.30.self_attn.o_proj/NVFP4.pth b/model.layers.30.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..f3a7d68ee7475aee52261f40f37b3a94f3d59f4d --- /dev/null +++ b/model.layers.30.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6107863921f0e337b3712598ab2333139e069d9f9686b2fb2d2548dc1b38b695 +size 33556187 diff --git a/model.layers.30.self_attn.q_proj/FP8_Block.pth b/model.layers.30.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..d156711dd83ba7905ba6aa25dc4c9d0abcd777be --- /dev/null +++ b/model.layers.30.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84bba7a1a289f5b6d4cd1f2bc288702479c8e11e276cf50d0d7297ed048199dd +size 33556279 diff --git a/model.layers.30.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.30.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b25d8e682c849a8766a310db68e92d5dd263d715 --- /dev/null +++ b/model.layers.30.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a475cf9389ea228f8b943dcc6c1e1c0a51104eb235ddd610f93435bf38f5d78f +size 33556293 diff --git a/model.layers.30.self_attn.q_proj/NVFP4.pth b/model.layers.30.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..6489e21952f851f1580384109b12d7fd9ba12897 --- /dev/null +++ b/model.layers.30.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a69ca1604caef5c8762ddb1db484e3349ed68affa4e536066bf693d09496e804 +size 33556187 diff --git a/model.layers.30.self_attn.v_proj/FP8_Block.pth b/model.layers.30.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..e5fddad740c267b4ee552c562fe2f5e1ab27fcb0 --- /dev/null +++ b/model.layers.30.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b59f93b0ebe0c49f5296e42b355c487f115f1472e6da5a53a5284342a00a2be +size 8390455 diff --git a/model.layers.30.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.30.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..23659a28c2cf30cd7493e79c5d87485883b4da8d --- /dev/null +++ b/model.layers.30.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c7581e0e39c0712d00688b31dbf5c6afd998a8c069fd6428472edbca2a37f2a +size 8390469 diff --git a/model.layers.30.self_attn.v_proj/NVFP4.pth b/model.layers.30.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..2a93ba816dd37dc569d4eb26418fdf74aced2c1b --- /dev/null +++ b/model.layers.30.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:964a9ab9aa2e656ac53c1b1e5022d7f38206907e3d5588960bed2eb3c46a2612 +size 8390363 diff --git a/model.layers.31.mlp.down_proj/FP8_Block.pth b/model.layers.31.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..6b68a8dd0a28c9c35daf6547c986c204675b413f --- /dev/null +++ b/model.layers.31.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce2757125e01f454af9d704fdbe72bf954471fec4fb9a39b1f274b40cecbeaae +size 117442359 diff --git a/model.layers.31.mlp.down_proj/FP8_Dynamic.pth b/model.layers.31.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..1df78809feeb2b22b1e226a4934e2d5b0cf29e2e --- /dev/null +++ b/model.layers.31.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6083cec8f21886bb99163bfc96bbb69c5aa7eacf04ec2711a9b55fb1af9e219e +size 117442373 diff --git a/model.layers.31.mlp.down_proj/NVFP4.pth b/model.layers.31.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..e800b8e186b2b4e5eaa1a3d13c82d9a5a321fc57 --- /dev/null +++ b/model.layers.31.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf7589414cfa9845ae108646b3e7fa1d2079ddca7bca921accfd80bf8bace52b +size 117442267 diff --git a/model.layers.31.mlp.gate_proj/FP8_Block.pth b/model.layers.31.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..1b27140d56c299a8150aef2e0535160b14520d68 --- /dev/null +++ b/model.layers.31.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0accd000bcc06be2311b8d1b8a503865c22c13006e3dac3b483414f570205b81 +size 117442359 diff --git a/model.layers.31.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.31.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..42dbc02af59ef904fd687f0c847123632d051fb9 --- /dev/null +++ b/model.layers.31.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fc327544bbca93b86491a4801319475cdb68bd497939163428536bb85780f55 +size 117442373 diff --git a/model.layers.31.mlp.gate_proj/NVFP4.pth b/model.layers.31.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..ff730f791e57e9ab1885fa8dda107051438b1ade --- /dev/null +++ b/model.layers.31.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:260521be14bab071e6a5184d7c9d8cc7935a81900eb57e8b950bc50cb356b85b +size 117442267 diff --git a/model.layers.31.mlp.up_proj/FP8_Block.pth b/model.layers.31.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..a29011f3490540c2285a7ecd6c4a0d796e07ed6f --- /dev/null +++ b/model.layers.31.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e4aa5a0a175299038456704c6d7b3f2f463a54fb4887cc6a91bd5dddd1b32df +size 117442359 diff --git a/model.layers.31.mlp.up_proj/FP8_Dynamic.pth b/model.layers.31.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..1e16debc5abc966bc170b180b2af14c362d84ef9 --- /dev/null +++ b/model.layers.31.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a93ff81ba0445dffe8c9a0e37fb45db71703558b27f798e21c425fafa2dc7f7f +size 117442373 diff --git a/model.layers.31.mlp.up_proj/NVFP4.pth b/model.layers.31.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..f0c6c1d5ba2b1b7d1074c38f4ab64fc5e1c5e3fa --- /dev/null +++ b/model.layers.31.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39c8ccecef140c2c5a3b0e7148b65e6fa61a01b821cc70ca127c9533e193f326 +size 117442267 diff --git a/model.layers.31.self_attn.k_proj/FP8_Block.pth b/model.layers.31.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..f85afbf1b3c10448503308c519cedb462c5ac685 --- /dev/null +++ b/model.layers.31.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0840f5329090477c69447bd6565c9425ed806872d8489900d48474a04d32b7da +size 8390455 diff --git a/model.layers.31.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.31.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..c5c3342cc4d86630cdb6e3af0a608616bd74d92c --- /dev/null +++ b/model.layers.31.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14c4b79c112d152033a6ff67dcd850562ce170e7666abd14e9ff94665f21ad10 +size 8390469 diff --git a/model.layers.31.self_attn.k_proj/NVFP4.pth b/model.layers.31.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..89ea7c664c62471aeaf5d27c519d1083bb985302 --- /dev/null +++ b/model.layers.31.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f7a273bce80b6e9a78b98e6d8ba99cbb02cf9051fcc11bdc2b8ca50dd8acdca +size 8390363 diff --git a/model.layers.31.self_attn.o_proj/FP8_Block.pth b/model.layers.31.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..4cf878deefc2e33c5d4a05d354fc66467a39cf73 --- /dev/null +++ b/model.layers.31.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d4400ccf84a289477ada7b851ba1ca7b668a26bc01998393cbad5a29700d32 +size 33556279 diff --git a/model.layers.31.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.31.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..4d1d50bebadac38feb19bfec9bf2b9e3fe5e9cf8 --- /dev/null +++ b/model.layers.31.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f8ae2c72bbf69b047402663ce501b34beeea0bb2ee624781b654685b92bb4ed +size 33556293 diff --git a/model.layers.31.self_attn.o_proj/NVFP4.pth b/model.layers.31.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..85a6d5977afba5fab6a1eaead96f0e8b7efd0b9d --- /dev/null +++ b/model.layers.31.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:921b20f80693b58b243c15b542855bf86321900f56fa734e78fa8da1c547cb94 +size 33556187 diff --git a/model.layers.31.self_attn.q_proj/FP8_Block.pth b/model.layers.31.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..115d7cbd3401ba16333a5a2ed7eaa23278065a31 --- /dev/null +++ b/model.layers.31.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:568e62b30e50392c0080de2f97a557d71ad5bc104fa3d53366b5f147e834ad52 +size 33556279 diff --git a/model.layers.31.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.31.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..ae1cb294ac50034433c4e1af9962e3b62c996508 --- /dev/null +++ b/model.layers.31.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fe2ee43701e1ed4a8c625cce254f7399b42679d01c044317c626137c1b70067 +size 33556293 diff --git a/model.layers.31.self_attn.q_proj/NVFP4.pth b/model.layers.31.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..2e99b419ca1891f0cc200eba514e4dc2c183dee1 --- /dev/null +++ b/model.layers.31.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4332cdbf597f697d8e801dd8903582289ae7c26c66385f39f81cb4732b10f57e +size 33556187 diff --git a/model.layers.31.self_attn.v_proj/FP8_Block.pth b/model.layers.31.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..4a1211f9ec11b29eca925ae0bc03203039cedcea --- /dev/null +++ b/model.layers.31.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cf0271208519dffdada635ff6e7171ec9189c1b1d68763076a11084c804a4e8 +size 8390455 diff --git a/model.layers.31.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.31.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..e25ed68e363028598e25dfc38b81d29ab428c023 --- /dev/null +++ b/model.layers.31.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8cfc29b57aba48bec2e825ed6bd159c02f16cf097a3d9bd7a46ed6609941f80 +size 8390469 diff --git a/model.layers.31.self_attn.v_proj/NVFP4.pth b/model.layers.31.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..a06f1cd76c81c01a4c95fcbb27f7728b647eea27 --- /dev/null +++ b/model.layers.31.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa695c466117b52467ec4b65f1b21de53ad1f3b89881ffe872a6ff0bb05bad37 +size 8390363 diff --git a/model.layers.4.mlp.down_proj/FP8_Block.pth b/model.layers.4.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..85f220b987e095313a09d1d1375ac4eb25ff3b7e --- /dev/null +++ b/model.layers.4.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e069d39a105efcd7454c3bc22921ca1e12ed133e18387ccc85e7f20bc81152f +size 117442359 diff --git a/model.layers.4.mlp.down_proj/FP8_Dynamic.pth b/model.layers.4.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..776ae7e300fa8ace2a9adc0cd66004f68db0b411 --- /dev/null +++ b/model.layers.4.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30eeaa1d7fc464e3bc95f792fe4d601f5aab0cfe2ef3cbdfddb05a9a4007e45b +size 117442373 diff --git a/model.layers.4.mlp.down_proj/NVFP4.pth b/model.layers.4.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..6f499a70b30d5851b62918e923213e45e1469bcc --- /dev/null +++ b/model.layers.4.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40f838c8153a19be70090a53d27d147a7fab95eea2008691fd84c61152e73a4b +size 117442267 diff --git a/model.layers.4.mlp.gate_proj/FP8_Block.pth b/model.layers.4.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..71f9d4fb9f5c94889a29eae159922d46fb0d3a98 --- /dev/null +++ b/model.layers.4.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c18af88b148c53fcb91f4405fddfd99e56dee4b4333a118ccc3e8bebd8f3666b +size 117442359 diff --git a/model.layers.4.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.4.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..8bd92b677466dde04abeff089123b28f3a8b656e --- /dev/null +++ b/model.layers.4.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8f48d888208cab775aad297686d1d2832b90279c14fd5a94b0e392a99f7a52e +size 117442373 diff --git a/model.layers.4.mlp.gate_proj/NVFP4.pth b/model.layers.4.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..050ab783ec26cdbed1e4ffcf9e5ce0983704e88f --- /dev/null +++ b/model.layers.4.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf1ae16500302cdfe8e83d9007f156b3f152d254da8d33299630be603b774905 +size 117442267 diff --git a/model.layers.4.mlp.up_proj/FP8_Block.pth b/model.layers.4.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..1356aa81a1196033dbbe3e04402bea047105d618 --- /dev/null +++ b/model.layers.4.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dd8156c544dfa7e21b6306de4a5c4db361982bdceaf0a324a438e3d80f2b5b3 +size 117442359 diff --git a/model.layers.4.mlp.up_proj/FP8_Dynamic.pth b/model.layers.4.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..1acb0a0afb5fb67b00e49727346b934c9ec705df --- /dev/null +++ b/model.layers.4.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e9af75e182bd96d3c25c85c25994e429ae86d8af385e496b5825c6f3ad8927d +size 117442373 diff --git a/model.layers.4.mlp.up_proj/NVFP4.pth b/model.layers.4.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..a3f5951f9f753d36ab66279db919885053a16cb8 --- /dev/null +++ b/model.layers.4.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c1b92ed69aacc3cc74be0c6ebacbd100b5cab5a7364c2b1ad2ce2d78eee0280 +size 117442267 diff --git a/model.layers.4.self_attn.k_proj/FP8_Block.pth b/model.layers.4.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..1c909e08c8c6d4384925e7924192e5a04483a030 --- /dev/null +++ b/model.layers.4.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9041d1c234a28d4c3e88ec8ec9ff7dd47ef6b0995f1a6b0c7c80343c98f808da +size 8390455 diff --git a/model.layers.4.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.4.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..dc83d73e1fba5cce92de2ca857599dee09601988 --- /dev/null +++ b/model.layers.4.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06f293ad5e40694f77423ae5c7054cb9c8462a5be3b09cebd72a50348c4355c3 +size 8390469 diff --git a/model.layers.4.self_attn.k_proj/NVFP4.pth b/model.layers.4.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..68482aade743de9064f5c776edc95e3f020e334d --- /dev/null +++ b/model.layers.4.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8529c03f34b1a58413ff58ff3a24afb6b92e7928c92fbe4436c7f8a940a14c5 +size 8390363 diff --git a/model.layers.4.self_attn.o_proj/FP8_Block.pth b/model.layers.4.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..6a1d68eaa3cfd8f203da4a29218d3bb7f18e2ea7 --- /dev/null +++ b/model.layers.4.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc27df8449e0b27e12b8619ed6ac0d504d72a40d9b1006f0b9fc04a1ed99b8ca +size 33556279 diff --git a/model.layers.4.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.4.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..db98f02e9c4fde9e6e8c9a39332c0c37beeda880 --- /dev/null +++ b/model.layers.4.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:456e7122c349854d730933d8eff9c136f1b3005dba74a0e236e46a77caa8c5bd +size 33556293 diff --git a/model.layers.4.self_attn.o_proj/NVFP4.pth b/model.layers.4.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..4db85643a64568bdc1605f1730397bc7d870da0f --- /dev/null +++ b/model.layers.4.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55d8b563efc2c30e70f7da43a9b8c4e21ca9c25f0bf8e38558aef2406060e381 +size 33556187 diff --git a/model.layers.4.self_attn.q_proj/FP8_Block.pth b/model.layers.4.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..a9f4f9e72025645fe6e9bada7b116e3908341ce0 --- /dev/null +++ b/model.layers.4.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:939ad6b69a988fc04591f64a64060705be688d8d3f53d3746bd59077ef560242 +size 33556279 diff --git a/model.layers.4.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.4.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..9ab659cc6ded275e7362c94abdd41973a861fa6d --- /dev/null +++ b/model.layers.4.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8005938dd0073b60d87f5a3e56534b66af2c27b6f2d63b64415dd126331e6d87 +size 33556293 diff --git a/model.layers.4.self_attn.q_proj/NVFP4.pth b/model.layers.4.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..7c97abf8e1493eb2a5f2e40f9b79a7d9bf8efadf --- /dev/null +++ b/model.layers.4.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca5d821fb03f8a1ac232ab442da4fbe21c4bf83c42534944a63d51a441d0a620 +size 33556187 diff --git a/model.layers.4.self_attn.v_proj/FP8_Block.pth b/model.layers.4.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..d7b0b9fb02cfb4a1e35ee33e282630adb19ee4ec --- /dev/null +++ b/model.layers.4.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e26333f8fe68a3fb48d631557c54c2dbaf81afb0552b17bccff18a454040eed9 +size 8390455 diff --git a/model.layers.4.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.4.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..7d48e03a6704b4a003f092743a18c53154e29059 --- /dev/null +++ b/model.layers.4.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb65b49928e07b44b4e394730ee9fdd624232bbc08b06091ef99921de059ce6 +size 8390469 diff --git a/model.layers.4.self_attn.v_proj/NVFP4.pth b/model.layers.4.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..e3ba99a7deca5ecc909a03601d94ebf7d952699a --- /dev/null +++ b/model.layers.4.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71e1644023e41a782003944547212f541d4d2734196402e011b7146f04a16253 +size 8390363 diff --git a/model.layers.5.mlp.down_proj/FP8_Block.pth b/model.layers.5.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..c70b059918773c7f70e1f14118373483cd3a2ca4 --- /dev/null +++ b/model.layers.5.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:642e5ca7681bf2d4b12ae822a41e4b264260524a502c2dd4e5b9c5885457e8d6 +size 117442359 diff --git a/model.layers.5.mlp.down_proj/FP8_Dynamic.pth b/model.layers.5.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..245038c32c6c02bd0ff9491e9da0b53337d0266c --- /dev/null +++ b/model.layers.5.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3482f9d2194a725b7e448a5a1e64732799158e54ba00787e674bb95ff4ed9ba +size 117442373 diff --git a/model.layers.5.mlp.down_proj/NVFP4.pth b/model.layers.5.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..b01c22dafac548e5aeec57a059a461e1a09fcd53 --- /dev/null +++ b/model.layers.5.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:051dff4862434356e866cc22d16b1641b69f97ed891c4508b62488d6597d547c +size 117442267 diff --git a/model.layers.5.mlp.gate_proj/FP8_Block.pth b/model.layers.5.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..24e4103834af85a8662492829b2dc7226c456881 --- /dev/null +++ b/model.layers.5.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed3396f5133a596561601e52a60e12c64489a278a0dd03ec792ee053c9b29f08 +size 117442359 diff --git a/model.layers.5.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.5.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..5d116d5270c0cb570a238ef0fb58958fbd5232ea --- /dev/null +++ b/model.layers.5.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f892ddd669c87448eb613362cf040c18da0c930b86e0752bc4c19ba0adcc04 +size 117442373 diff --git a/model.layers.5.mlp.gate_proj/NVFP4.pth b/model.layers.5.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..5d23c0c33fa02cab831dd1de45eb6210c3278d23 --- /dev/null +++ b/model.layers.5.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fa7724602d5db3eda2b7e786818fe38bc5c61a71f5168b74e37d0815b164ecc +size 117442267 diff --git a/model.layers.5.mlp.up_proj/FP8_Block.pth b/model.layers.5.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..29059e0c36338cfb6f56a47da8c69c8801ec7c90 --- /dev/null +++ b/model.layers.5.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:254b85290b0ed597678e267ea15d96970c8667f92436c3c1080e2201e6c71551 +size 117442359 diff --git a/model.layers.5.mlp.up_proj/FP8_Dynamic.pth b/model.layers.5.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..228a2465587e384c9645fd7462ee74024c678921 --- /dev/null +++ b/model.layers.5.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39eb6c2f1206fcb22309b8b611b49264d5911f3a8c7cb45a747405b6f1504909 +size 117442373 diff --git a/model.layers.5.mlp.up_proj/NVFP4.pth b/model.layers.5.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..03814a5c4b55e45cbb6fe722addabf6d6ab3de00 --- /dev/null +++ b/model.layers.5.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb06ae87b15bc6710a6c4a19a0076adc1419f7836c36f44991861010aee2baa9 +size 117442267 diff --git a/model.layers.5.self_attn.k_proj/FP8_Block.pth b/model.layers.5.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..84b2692adc55bca0b51a0f388078336bb1236c12 --- /dev/null +++ b/model.layers.5.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c8f89a9c0dccd9a3ced7c0e80f72c2b7344ff8191aa66de94a89b272496fa86 +size 8390455 diff --git a/model.layers.5.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.5.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..9c1d25222b287a704d0aac6d9d8177f365078429 --- /dev/null +++ b/model.layers.5.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f63419d5d0ddccea6b9a0f5028c5d28929d8df8eb47731d9fb9759e0b7747359 +size 8390469 diff --git a/model.layers.5.self_attn.k_proj/NVFP4.pth b/model.layers.5.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..df5419ef803b2643786daf6187dfcd663cd7a249 --- /dev/null +++ b/model.layers.5.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dd6414fddb3ea2294c367e77b83a5b514d9a5f08fa2bb4d10b5d7f1ae22cf7f +size 8390363 diff --git a/model.layers.5.self_attn.o_proj/FP8_Block.pth b/model.layers.5.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..a12df21cdc0b9a87cd5889453bb613ebe6e07d13 --- /dev/null +++ b/model.layers.5.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d39a22503ccdf9e71f550dd6af011b2fcbcff15923354fea1eda70e0805ecc66 +size 33556279 diff --git a/model.layers.5.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.5.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..1f25d551676857a2097f603a3e7f1e0117649093 --- /dev/null +++ b/model.layers.5.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ecc8ca7669a4d24a1446b51e700c665b680b0c053e6493d3bf043af831e1e56 +size 33556293 diff --git a/model.layers.5.self_attn.o_proj/NVFP4.pth b/model.layers.5.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..7a4d5b9ec632b94a5e95453d2eb912f7e5539942 --- /dev/null +++ b/model.layers.5.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f98e334da4092f83ce6ae99dae02ca8e091d136d7e2483775c85811adfe7dacc +size 33556187 diff --git a/model.layers.5.self_attn.q_proj/FP8_Block.pth b/model.layers.5.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..fd55fd8c7a54ed795e91ce1823aa6a3a67fa2b25 --- /dev/null +++ b/model.layers.5.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ec9d0ea5dad2e5829c759ce64b0a63a7c9fc167465acb47a5d3b7ad6f315541 +size 33556279 diff --git a/model.layers.5.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.5.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..90c47c4143f6d18a5ef96c67df557be56a11f176 --- /dev/null +++ b/model.layers.5.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b11866cf8305e50aabe7b3b9cd2afc7f2668099d2aff99a86ac7e1a9a20dc21 +size 33556293 diff --git a/model.layers.5.self_attn.q_proj/NVFP4.pth b/model.layers.5.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..22747e4001a48c8fc2ee43bf576d296acf0cb2df --- /dev/null +++ b/model.layers.5.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34d09c55a2925ba4bb63f33380212f77cbc5658196eec77f26aba49b6d5a85ae +size 33556187 diff --git a/model.layers.5.self_attn.v_proj/FP8_Block.pth b/model.layers.5.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..acbae4c1b49e6b752c1eb6266d9213377b046abb --- /dev/null +++ b/model.layers.5.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb782ff8fc8c211d06bd911dca3674883207c66276090bc7c0d36270dbc94ae +size 8390455 diff --git a/model.layers.5.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.5.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..08a605ce6e81aa71037ea308355683d4374369a8 --- /dev/null +++ b/model.layers.5.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92890151833be93f1e7b3658d72ae097da174b4df055c30faa842373b5690a51 +size 8390469 diff --git a/model.layers.5.self_attn.v_proj/NVFP4.pth b/model.layers.5.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..2e37c7f464c00a3b7ce4a70a7430811ba60aa7e1 --- /dev/null +++ b/model.layers.5.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b2d77db359eee6d9c897a5286ca0132a6e3f26cd812545f446fb60ec95b35bd +size 8390363 diff --git a/model.layers.6.mlp.down_proj/FP8_Block.pth b/model.layers.6.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..9c2bdadaec9b1f93e7fab662d067fe93d5398255 --- /dev/null +++ b/model.layers.6.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55d5a1f7621170e2df7deb5ca1add6fd2fbebe557e039f2b3a50dcc2eabed9b5 +size 117442359 diff --git a/model.layers.6.mlp.down_proj/FP8_Dynamic.pth b/model.layers.6.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..5232d8a384e2d1d7db63e944a45291738bd65033 --- /dev/null +++ b/model.layers.6.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4844b1e18c2eb7ec53864890d57806570157630ddbdb991998d9ef5c1aab0186 +size 117442373 diff --git a/model.layers.6.mlp.down_proj/NVFP4.pth b/model.layers.6.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..fcd7cab74076c0eccdf325450e7735849526b80a --- /dev/null +++ b/model.layers.6.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40d727d69e5a12c797e7e4aa9ed172423d31dd44af96238a3d02142d64643890 +size 117442267 diff --git a/model.layers.6.mlp.gate_proj/FP8_Block.pth b/model.layers.6.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..41924ede507cd8b8a4009774cc5718f046f6f034 --- /dev/null +++ b/model.layers.6.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:559487035e88a619c0f746ea93dfe5888f026dc2e150c94a480e1940e6a27c41 +size 117442359 diff --git a/model.layers.6.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.6.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..bc6aeedf4981f54ba2ac8897ba9ee0042827d21c --- /dev/null +++ b/model.layers.6.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e77f6de4ffcc65e0ae5a665f88c96cb5f07857ee942fa69f719d4139b4c7b640 +size 117442373 diff --git a/model.layers.6.mlp.gate_proj/NVFP4.pth b/model.layers.6.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..b99a94b30b47cb1c29e4c9613fc485f601bd2e45 --- /dev/null +++ b/model.layers.6.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb947dc631e5a81370c89abc5ed8d54cd5cfc942837b5a2b51357b4fb2d30634 +size 117442267 diff --git a/model.layers.6.mlp.up_proj/FP8_Block.pth b/model.layers.6.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..95c8fe859e3007c98e53cfc1fa1f0d6314fd3fcb --- /dev/null +++ b/model.layers.6.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:442a03486c75dc1edfba78fb6fa4a692b276457f8611473608f7a008bdbaa53d +size 117442359 diff --git a/model.layers.6.mlp.up_proj/FP8_Dynamic.pth b/model.layers.6.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b41ad5e4150f7b6a62da4de4a9b60224476d949e --- /dev/null +++ b/model.layers.6.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:867b1c58f3c27254d421954b34ba4d2e01338994373d478e16476d08630ec9d4 +size 117442373 diff --git a/model.layers.6.mlp.up_proj/NVFP4.pth b/model.layers.6.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..c59d6e1c9086b5c46718992bec22391c34a7aaa2 --- /dev/null +++ b/model.layers.6.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01b6a5919a1266e111de62cb61cd4db8355c2f40e0aa45a8990f45dbd1577195 +size 117442267 diff --git a/model.layers.6.self_attn.k_proj/FP8_Block.pth b/model.layers.6.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..c97fe471e30cace8435edec4c993754453797efa --- /dev/null +++ b/model.layers.6.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffb2f1c75a1aa53ddd84275d64db43711844bd3f53ad1a0e6ff7c0b2da1017c1 +size 8390455 diff --git a/model.layers.6.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.6.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..b60d45f07a916be6d813269d086f09b853b239d8 --- /dev/null +++ b/model.layers.6.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8a1141029a76b03d3dba6d7c647dadb3d8db19d399a86a16af718177021e963 +size 8390469 diff --git a/model.layers.6.self_attn.k_proj/NVFP4.pth b/model.layers.6.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..0aa08aeb11d15be4fa6332c6153d28ab26d491fb --- /dev/null +++ b/model.layers.6.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ac17fff98fad39d4d572cb0788caa1b513a85540fdfcff1e2facfd77f6a43b5 +size 8390363 diff --git a/model.layers.6.self_attn.o_proj/FP8_Block.pth b/model.layers.6.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..614c55b14ec234f9abfb06056e3939f41388e6c7 --- /dev/null +++ b/model.layers.6.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d78944074ca230036795aa716aca1b6d844dd9f7746af7298ad37de1e5cab25 +size 33556279 diff --git a/model.layers.6.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.6.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..f4600b7f8e3137f46186a6889e7a052f7b00a9a5 --- /dev/null +++ b/model.layers.6.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:132b6347f2b39d7c81144a4fdb1ce8fa3140f651a36948263a21bf970fb79c88 +size 33556293 diff --git a/model.layers.6.self_attn.o_proj/NVFP4.pth b/model.layers.6.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..2187c1304681a95af5cb30557da15534dd288a5f --- /dev/null +++ b/model.layers.6.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8461bf27b38e573080d827c29207e1f55a1378857935ea660d0ae833ca9d8be +size 33556187 diff --git a/model.layers.6.self_attn.q_proj/FP8_Block.pth b/model.layers.6.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..41fa34c9d2f59ed8f4441b9efda2b83b1f3374cb --- /dev/null +++ b/model.layers.6.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03d6b6f6bac3f87311ff13604f4721d2def2f1c01b14c5f5ce1f502fc591b22c +size 33556279 diff --git a/model.layers.6.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.6.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..3ac09f82d0e23a64049e1a9545e160ecf2e3e5fb --- /dev/null +++ b/model.layers.6.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2de989764768ebd171924a7ce346ee97fec5090bcf17375cec0dc602a3e98db6 +size 33556293 diff --git a/model.layers.6.self_attn.q_proj/NVFP4.pth b/model.layers.6.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..55c10b7916a2fb90b1d12230c49acc48a89a4126 --- /dev/null +++ b/model.layers.6.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b84e33bdc3b40655d3b5c433af82305c0324219513974b590fcc12a58319ccf8 +size 33556187 diff --git a/model.layers.6.self_attn.v_proj/FP8_Block.pth b/model.layers.6.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..20abd50a26e4c6148d75f233288c792641c08c86 --- /dev/null +++ b/model.layers.6.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c38828ae494503efa7a3136439029151797d9bdf650f0a4d59159753a42e6f5 +size 8390455 diff --git a/model.layers.6.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.6.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..39b644b6d329119096514ab68f6ba30ce25b807e --- /dev/null +++ b/model.layers.6.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd0f3bd1c569b17e14ee4d874d706df390ac77e4b64f76b9051bf49e36805ee6 +size 8390469 diff --git a/model.layers.6.self_attn.v_proj/NVFP4.pth b/model.layers.6.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..6cd54f06aafe031e99db5e469bf5144ab96bb6ad --- /dev/null +++ b/model.layers.6.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464ca863bf41629680c0f6cc849f38184ef3a17b36a1d8fcc3c0986838034563 +size 8390363 diff --git a/model.layers.7.mlp.down_proj/FP8_Block.pth b/model.layers.7.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..b84afdb216bd26fa60d2a42156a73a09b9ece615 --- /dev/null +++ b/model.layers.7.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec1d1ee5642299597c1aa44f533eafe1fbb3a779332d662e30cd8945467e4998 +size 117442359 diff --git a/model.layers.7.mlp.down_proj/FP8_Dynamic.pth b/model.layers.7.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..15ccce9141a9846243faed62029c64dd4fdb78e7 --- /dev/null +++ b/model.layers.7.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a587b2f593a608025c7ffb9fb1363c8ead95e98e4f6683640c2320e07b9a0f2c +size 117442373 diff --git a/model.layers.7.mlp.down_proj/NVFP4.pth b/model.layers.7.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..72f591f977e591a8ff9ce87244d16a96bac14528 --- /dev/null +++ b/model.layers.7.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76596b638ab6f61a5ffdfd654a5f7a7737cf92811355760365f3fcc73fc59640 +size 117442267 diff --git a/model.layers.7.mlp.gate_proj/FP8_Block.pth b/model.layers.7.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..33c3326280d0d3a5d24c9e12b5fdbf8db629ae64 --- /dev/null +++ b/model.layers.7.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1c01b8eb8184ed348070b9a4793299fd7fd447d45c80ee0f8d72c4ff174d813 +size 117442359 diff --git a/model.layers.7.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.7.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..68cd5da43f6bdead4a763269574156a667b24424 --- /dev/null +++ b/model.layers.7.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:416b27cf978b8a23ed00453564f56cdcff5099fa31bcaebd76d8cce3b0514388 +size 117442373 diff --git a/model.layers.7.mlp.gate_proj/NVFP4.pth b/model.layers.7.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..cf13fca1631624ccba1f7050aad94f17bd41f5e3 --- /dev/null +++ b/model.layers.7.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:566b13bfa54113e9b06c40dd7eae90f1a044c322d7ea5e8e45fc21a0b1f89aa4 +size 117442267 diff --git a/model.layers.7.mlp.up_proj/FP8_Block.pth b/model.layers.7.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..e1a677469d5d5c433acc54dd25b3ab469964b697 --- /dev/null +++ b/model.layers.7.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85ba2414bb5d8eb80b01462de438fc256c7c3021073dc0d046ef563063ed5f4d +size 117442359 diff --git a/model.layers.7.mlp.up_proj/FP8_Dynamic.pth b/model.layers.7.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..28dd279f2dfbedb01712069431ca8f0e67b79463 --- /dev/null +++ b/model.layers.7.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82ae3df2331df4d193ff777150c42f4dba89b729c71e668e5ba161e10a2410d6 +size 117442373 diff --git a/model.layers.7.mlp.up_proj/NVFP4.pth b/model.layers.7.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..8fb36e2937232404aff7798f2be6f0e584243eac --- /dev/null +++ b/model.layers.7.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01b0f4a4a213f2b6103d9e5dd821c82bf22233744b6475869c7ed65de61e9201 +size 117442267 diff --git a/model.layers.7.self_attn.k_proj/FP8_Block.pth b/model.layers.7.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..608dceff72fb4ccffc3d49f8584a66af53955532 --- /dev/null +++ b/model.layers.7.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e4bb312ca13601f0910c4502f75b41d5411c9ea2bea76b1884a206b8e447287 +size 8390455 diff --git a/model.layers.7.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.7.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..20e20ea3ceaa4fdbec64920072d3501db017c611 --- /dev/null +++ b/model.layers.7.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38ab4b46a867473ab4f1ef2b9008582b704296e9c21275fef488dce8ed0a1710 +size 8390469 diff --git a/model.layers.7.self_attn.k_proj/NVFP4.pth b/model.layers.7.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..21009a9c6eb373a43c9602afaa458f770683ea22 --- /dev/null +++ b/model.layers.7.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abe510eada6948604545c5c0a9f490eabb73cfee223f3ae52817e5b63804f8f0 +size 8390363 diff --git a/model.layers.7.self_attn.o_proj/FP8_Block.pth b/model.layers.7.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..4f1ecfc10af76689e774a3c19b158472f0798735 --- /dev/null +++ b/model.layers.7.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d4d4be26965d80cc0f4d60b702f07cd1d9bf4b6e636a16dcb6c213eedd4cb7d +size 33556279 diff --git a/model.layers.7.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.7.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..75da5a7f266ab70c6352bd5f3ea6a530de3c0843 --- /dev/null +++ b/model.layers.7.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3d388efbe1d1711f8e2fe4d83e39b1b88c95063f5566d99047a157e674ec068 +size 33556293 diff --git a/model.layers.7.self_attn.o_proj/NVFP4.pth b/model.layers.7.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..7ca268e3bc1602eb4e6241f277e088dd54b476c9 --- /dev/null +++ b/model.layers.7.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2b5a7170b38707552004629f6fb947c07d884c5e42ef5f1cae6a663998ded59 +size 33556187 diff --git a/model.layers.7.self_attn.q_proj/FP8_Block.pth b/model.layers.7.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..efba982f4e907da64677dea04fe54391d460dde0 --- /dev/null +++ b/model.layers.7.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bea6a86eab1b02d118b586090a468cabbbf6052cf3411efb4e440b645f233a4c +size 33556279 diff --git a/model.layers.7.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.7.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..375d33d82b78f9c0c2d2ff0afc9ab50af1b55403 --- /dev/null +++ b/model.layers.7.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:807e92d2441548f42570046273e9a79e0a9f30c8820d91b4b8fc753164f5df8b +size 33556293 diff --git a/model.layers.7.self_attn.q_proj/NVFP4.pth b/model.layers.7.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..da0cac89e6f98136a1828107a2188dbf9da86329 --- /dev/null +++ b/model.layers.7.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5046152bbc7c1e1b24896853a6c338242be35457ee5b9b74a129761ccc3d33e +size 33556187 diff --git a/model.layers.7.self_attn.v_proj/FP8_Block.pth b/model.layers.7.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..cfacb4d1ca6c3f7a42f99be9425d91f5888b9187 --- /dev/null +++ b/model.layers.7.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efdaac66a4ca0d4fae309c23308085d108a5229932ef632b0b219e0ae901d77b +size 8390455 diff --git a/model.layers.7.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.7.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..be850664d45b724195052e409182e182f34d2e9a --- /dev/null +++ b/model.layers.7.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72be1b4f7b217aff0a5be8c15300d4cf7b1b7f513e22d24ab5d6d2bfffa6c18f +size 8390469 diff --git a/model.layers.7.self_attn.v_proj/NVFP4.pth b/model.layers.7.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..c1b383854e635a939669c048e606c56ed0dd2467 --- /dev/null +++ b/model.layers.7.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2f470f6b8d405a45db02b3c127bb0704d1ac791893c923d1cf25e8d8bade87d +size 8390363 diff --git a/model.layers.8.mlp.down_proj/FP8_Block.pth b/model.layers.8.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..5969c2643c431056a3da54d5211c97f5bf1daa00 --- /dev/null +++ b/model.layers.8.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bfc82a14c2828d7b4ad53cfb500be92ba190fddc0455e1bb51c0ecbe2d790fc +size 117442359 diff --git a/model.layers.8.mlp.down_proj/FP8_Dynamic.pth b/model.layers.8.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..3606084bda5577fe8e0ab595cc05d2589541b568 --- /dev/null +++ b/model.layers.8.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:374116c449b4014309fb0551d7995f78d74a0fe2a010eab4169562e3af773883 +size 117442373 diff --git a/model.layers.8.mlp.down_proj/NVFP4.pth b/model.layers.8.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..4f4037388fdcd0c90294466fec7326122ceab9a4 --- /dev/null +++ b/model.layers.8.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a1f0ac1f956296f62dfb19456adf4230a1accd42c6cb26cf00873ba939da8bc +size 117442267 diff --git a/model.layers.8.mlp.gate_proj/FP8_Block.pth b/model.layers.8.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..7024f703178f59cacb6adfa9a3f8d9ba95c35e97 --- /dev/null +++ b/model.layers.8.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d332f6b6e9506007510a752bb74cd90a5cab362d3cfe52010a424f699d9b8e5a +size 117442359 diff --git a/model.layers.8.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.8.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..3e832c616c939f677ce6cc53f3d64b4cce808708 --- /dev/null +++ b/model.layers.8.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec5298bc1be6e53e727214a03bc84c88373b1c0e6bb1437008d6495d6631219b +size 117442373 diff --git a/model.layers.8.mlp.gate_proj/NVFP4.pth b/model.layers.8.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..045e0127ab5f96db7f172e3851464fc01aca0d45 --- /dev/null +++ b/model.layers.8.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0309f88f1f203f4e68739e357a69668aff0abcb8749eba5a37c66d1e1eaeb4e4 +size 117442267 diff --git a/model.layers.8.mlp.up_proj/FP8_Block.pth b/model.layers.8.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..fa4604e7e7ed4209a05830d5a4dad21093c2b73b --- /dev/null +++ b/model.layers.8.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c1a727b2bf019b2eb294e8a8c631fdcba56fc7e60346c3f68af87928afa96c9 +size 117442359 diff --git a/model.layers.8.mlp.up_proj/FP8_Dynamic.pth b/model.layers.8.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..16db3dac5cd27d07992343863ef38cd82403b472 --- /dev/null +++ b/model.layers.8.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c15315243970c9345fb63b75231ec7e8da015c8458b45169c7471fd29927ee0 +size 117442373 diff --git a/model.layers.8.mlp.up_proj/NVFP4.pth b/model.layers.8.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..d56ff9c2effed64ef652f9faedbe66e84c1a0596 --- /dev/null +++ b/model.layers.8.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac2014b0ef2c35089e3a76669378c06e7747a8b8298fd2392c101553d9912269 +size 117442267 diff --git a/model.layers.8.self_attn.k_proj/FP8_Block.pth b/model.layers.8.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..7c971f3ae5ad915c6b0b2c6ad9d4977fc1cbba5f --- /dev/null +++ b/model.layers.8.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a74a1b12dc04df5f9767afa36156119ff9156432d51d4d0569e8db9a3901ba03 +size 8390455 diff --git a/model.layers.8.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.8.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..3a95ee53daf2953790940813dc0f65104a9139e6 --- /dev/null +++ b/model.layers.8.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db160483f9166b118e13d736cdb1b1ab219bfce3cff53eb4ebfa2d8e862641a +size 8390469 diff --git a/model.layers.8.self_attn.k_proj/NVFP4.pth b/model.layers.8.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..f34c45b2344b94320ec13f25d64016cd370ff22f --- /dev/null +++ b/model.layers.8.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81c01427ce4bf6942a5128ac6ade447577c1220175fb3b8dfb2a317061887d39 +size 8390363 diff --git a/model.layers.8.self_attn.o_proj/FP8_Block.pth b/model.layers.8.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..61a4e76c7aae2107d4d167654d64e8a06aacf42b --- /dev/null +++ b/model.layers.8.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:655f11149d1a111f4e078f072dc5b297d006fb78d60f0c59e363b6cd9cafb3b9 +size 33556279 diff --git a/model.layers.8.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.8.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..0f5b185e88c8e7f57ed1429d6c1f13e3628f9510 --- /dev/null +++ b/model.layers.8.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4413ee1218093dde83c839c35551e205005bc14f93a755081d4c7c85a649e48d +size 33556293 diff --git a/model.layers.8.self_attn.o_proj/NVFP4.pth b/model.layers.8.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..bd3cc2766edc61350df3d20557c6b3c67c97cbac --- /dev/null +++ b/model.layers.8.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b25407d4c1ca3fa2955da590a116ce26f36d1fc58a8ec930b53c22d6887e0eb0 +size 33556187 diff --git a/model.layers.8.self_attn.q_proj/FP8_Block.pth b/model.layers.8.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..42063e1cc491de3b9257bdb78701e65065786c52 --- /dev/null +++ b/model.layers.8.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dca4fc716ab8accba3970808af6bd45da2194b79a963aaf69bd0fee657cc4fcf +size 33556279 diff --git a/model.layers.8.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.8.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..be0758132c363525f5182d6650f38e46ba505fce --- /dev/null +++ b/model.layers.8.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d511d054f04aadd00d3c668d908c31e2d198537955fbfead4f58856cbda7a7ac +size 33556293 diff --git a/model.layers.8.self_attn.q_proj/NVFP4.pth b/model.layers.8.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..7da46d04e88224bb5f19db5743244a3f1296f2b1 --- /dev/null +++ b/model.layers.8.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e33904cdc43e8422af13209c4e694f2bd91635799e5d6f166f422f2d3b0b6a7 +size 33556187 diff --git a/model.layers.8.self_attn.v_proj/FP8_Block.pth b/model.layers.8.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..8ef479495d1ba21f5fe4c7573e9e2acfa62ef185 --- /dev/null +++ b/model.layers.8.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:077c748e1635e789c58f79ef7aba27a0934e8168d260767968e6f017f9b92f6b +size 8390455 diff --git a/model.layers.8.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.8.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..d276e1f07679c668f87b35671adcf088f1cfd610 --- /dev/null +++ b/model.layers.8.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80ae54768d5085da3ea5b57b1756a5fd3e120a813415ca457340ef7dda9481c9 +size 8390469 diff --git a/model.layers.8.self_attn.v_proj/NVFP4.pth b/model.layers.8.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..7c5bde79bd7b2a803d92e0689a2584a7be0bbc9a --- /dev/null +++ b/model.layers.8.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac9abbe008364e6b6b04b876d88ae3879741ee09374ee8b577897e0478a6abd +size 8390363 diff --git a/model.layers.9.mlp.down_proj/FP8_Block.pth b/model.layers.9.mlp.down_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..eeeac7323787fe7baeca84bb675f17d6501886b4 --- /dev/null +++ b/model.layers.9.mlp.down_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11029d065c1908cd27abcc18e2de91b82067cd7288801353fcad376d3b83fe43 +size 117442359 diff --git a/model.layers.9.mlp.down_proj/FP8_Dynamic.pth b/model.layers.9.mlp.down_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..95ab780175a344822d964300cca4d4e62fcbec58 --- /dev/null +++ b/model.layers.9.mlp.down_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1d6a70a4816816e33af620344c0be859e7fea75202ebef61224502246654a45 +size 117442373 diff --git a/model.layers.9.mlp.down_proj/NVFP4.pth b/model.layers.9.mlp.down_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..94635722c506d93b6192dd56e741865a5af2191b --- /dev/null +++ b/model.layers.9.mlp.down_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c7fd625b906c18f3232ef17f8c7ff74ee1da8910c0112750d081777e48f3cf +size 117442267 diff --git a/model.layers.9.mlp.gate_proj/FP8_Block.pth b/model.layers.9.mlp.gate_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..4dfce2c984c8c1da0792023629689158104cae55 --- /dev/null +++ b/model.layers.9.mlp.gate_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f727fe9f94dbf6a885121e6370ed7e0b53eb5d9bd3ddf347cfba3e76ab7b83d +size 117442359 diff --git a/model.layers.9.mlp.gate_proj/FP8_Dynamic.pth b/model.layers.9.mlp.gate_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..948fa2a6ec2617effe4d3cc62c0c4f1309863c84 --- /dev/null +++ b/model.layers.9.mlp.gate_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cb5f95fd17d12a13ae36a28146a9ecda7aa994739a3dbce3404669ed13f4cd1 +size 117442373 diff --git a/model.layers.9.mlp.gate_proj/NVFP4.pth b/model.layers.9.mlp.gate_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..356ccd12bd7796935f643f7f6f69b71d0078b731 --- /dev/null +++ b/model.layers.9.mlp.gate_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc97d8b6afbaec9494e9d6a7384ce865fd27168eb378ab210c84d2f952a9092b +size 117442267 diff --git a/model.layers.9.mlp.up_proj/FP8_Block.pth b/model.layers.9.mlp.up_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..2a50a1a904515e6057053b3a4337a54f418f758d --- /dev/null +++ b/model.layers.9.mlp.up_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:615d7cc16af257bf8d5d406e73902f3a77dd8d1d41a30d1bf407ac15ebc8db21 +size 117442359 diff --git a/model.layers.9.mlp.up_proj/FP8_Dynamic.pth b/model.layers.9.mlp.up_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..604f39cec8700512bde6da56fde9e502a7f2163f --- /dev/null +++ b/model.layers.9.mlp.up_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f32071f74ffedc4f4f8a1b0089df092fc652a967bd337cf17d778b205c57ce9 +size 117442373 diff --git a/model.layers.9.mlp.up_proj/NVFP4.pth b/model.layers.9.mlp.up_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..275ebf17f4717cb32e529bed2e6749a80bbde636 --- /dev/null +++ b/model.layers.9.mlp.up_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be73bb11621c4f13f77c48c946b15799595a34d75aa813db86b023555e25297c +size 117442267 diff --git a/model.layers.9.self_attn.k_proj/FP8_Block.pth b/model.layers.9.self_attn.k_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..5fc9f5c92f3f39158a050b06d1e2c167e12c8a2f --- /dev/null +++ b/model.layers.9.self_attn.k_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6283f74a88998736b07ab13d3dcac63ae7df548de2ad46ba0cfd2e5291437bbc +size 8390455 diff --git a/model.layers.9.self_attn.k_proj/FP8_Dynamic.pth b/model.layers.9.self_attn.k_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..143f4c32bbb3bd19b43b04c9c899bb407849da48 --- /dev/null +++ b/model.layers.9.self_attn.k_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6108ff8dd935ef7175e107fbeb95ed32b0e64648e4e65ee4155415e6e9a23a73 +size 8390469 diff --git a/model.layers.9.self_attn.k_proj/NVFP4.pth b/model.layers.9.self_attn.k_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..534527b2c094675459b142fb31af255482bfad70 --- /dev/null +++ b/model.layers.9.self_attn.k_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b2510656df679916c9d7c12a39d11076bc6e12d1336ad14a7f64a07b4410248 +size 8390363 diff --git a/model.layers.9.self_attn.o_proj/FP8_Block.pth b/model.layers.9.self_attn.o_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..fdd740bab3bc0938f73d25cfef350d2ac143cf80 --- /dev/null +++ b/model.layers.9.self_attn.o_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:399040ee2885642a46ff071ba42df0b4833ca44144a565e6d229915f7eafeb5e +size 33556279 diff --git a/model.layers.9.self_attn.o_proj/FP8_Dynamic.pth b/model.layers.9.self_attn.o_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..8228e93d1a0e68a56e8e996b261dd750cc4285d5 --- /dev/null +++ b/model.layers.9.self_attn.o_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b02efee1fc6ce4bcaf284cd8b1adf2c65da19e49bea80e5e7a38ec98371cbe6 +size 33556293 diff --git a/model.layers.9.self_attn.o_proj/NVFP4.pth b/model.layers.9.self_attn.o_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..7b4471b7fcb7a1d04da545ce2f16650984bf5d30 --- /dev/null +++ b/model.layers.9.self_attn.o_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cd442479911443526dcdaf02ee6cd6362c440e9c6bb94ee05fb324741d3a1de +size 33556187 diff --git a/model.layers.9.self_attn.q_proj/FP8_Block.pth b/model.layers.9.self_attn.q_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..219f7a61fabd7852c5917c2774f0c6d745b06ea1 --- /dev/null +++ b/model.layers.9.self_attn.q_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d922c27f81e3d9510a7547a1e71d4e1855497b6378f5f342d589288a01d3ea9 +size 33556279 diff --git a/model.layers.9.self_attn.q_proj/FP8_Dynamic.pth b/model.layers.9.self_attn.q_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..08274e6fd0885e1af7176877ec251cf13e3c71ce --- /dev/null +++ b/model.layers.9.self_attn.q_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3e77d5eb291a44de7948c218216beb8908912b316eb9e9b9bfc61f0d2497541 +size 33556293 diff --git a/model.layers.9.self_attn.q_proj/NVFP4.pth b/model.layers.9.self_attn.q_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..9bb5eebf530778c356e1a03ddea5aab78a5694ec --- /dev/null +++ b/model.layers.9.self_attn.q_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ee20b6a4a4952accabf5244bec472602a674fefe6894ee06bee16411678561a +size 33556187 diff --git a/model.layers.9.self_attn.v_proj/FP8_Block.pth b/model.layers.9.self_attn.v_proj/FP8_Block.pth new file mode 100644 index 0000000000000000000000000000000000000000..7c0614b4d792850a59bfeb42c96f63968cc2b199 --- /dev/null +++ b/model.layers.9.self_attn.v_proj/FP8_Block.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae91aefea770254195b70bb74b2ab2b3188ec1ca58b6cca88bccc1c58aa46123 +size 8390455 diff --git a/model.layers.9.self_attn.v_proj/FP8_Dynamic.pth b/model.layers.9.self_attn.v_proj/FP8_Dynamic.pth new file mode 100644 index 0000000000000000000000000000000000000000..2f445843e7a02d05d407f58ae5635bdd66382e31 --- /dev/null +++ b/model.layers.9.self_attn.v_proj/FP8_Dynamic.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e27ead2ef1f5a85af3f313736c216622d5422c913b869c8d8ee17cb84273f9f2 +size 8390469 diff --git a/model.layers.9.self_attn.v_proj/NVFP4.pth b/model.layers.9.self_attn.v_proj/NVFP4.pth new file mode 100644 index 0000000000000000000000000000000000000000..3940b120fc5b751c7ce7320ada696653dec3d2f4 --- /dev/null +++ b/model.layers.9.self_attn.v_proj/NVFP4.pth @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:143d1184b0fd2b58cf7f106bed25168cadc12518797e13c5d58bfefcb86f0bb6 +size 8390363