Ba2han committed on
Commit
41c596b
·
verified ·
1 Parent(s): 6300618

Training in progress, step 291

Browse files
README.md CHANGED
@@ -1,18 +1,18 @@
1
  ---
2
- base_model: qwen
3
  library_name: transformers
4
  model_name: m_augment
5
  tags:
6
  - generated_from_trainer
7
  - trl
8
- - unsloth
9
  - sft
 
10
  licence: license
11
  ---
12
 
13
  # Model Card for m_augment
14
 
15
- This model is a fine-tuned version of [qwen](https://huggingface.co/qwen).
16
  It has been trained using [TRL](https://github.com/huggingface/trl).
17
 
18
  ## Quick start
@@ -28,16 +28,16 @@ print(output["generated_text"])
28
 
29
  ## Training procedure
30
 
31
- [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/batuhan409/huggingface/runs/stynr6zo)
32
 
33
 
34
  This model was trained with SFT.
35
 
36
  ### Framework versions
37
 
38
- - TRL: 0.23.1
39
- - Transformers: 5.0.0rc2
40
- - Pytorch: 2.9.0+cu128
41
  - Datasets: 4.3.0
42
  - Tokenizers: 0.22.2
43
 
 
1
  ---
2
+ base_model: Ba2han/qwen-augment-2511
3
  library_name: transformers
4
  model_name: m_augment
5
  tags:
6
  - generated_from_trainer
7
  - trl
 
8
  - sft
9
+ - unsloth
10
  licence: license
11
  ---
12
 
13
  # Model Card for m_augment
14
 
15
+ This model is a fine-tuned version of [Ba2han/qwen-augment-2511](https://huggingface.co/Ba2han/qwen-augment-2511).
16
  It has been trained using [TRL](https://github.com/huggingface/trl).
17
 
18
  ## Quick start
 
28
 
29
  ## Training procedure
30
 
31
+ [<img src="https://raw.githubusercontent.com/wandb/assets/main/wandb-github-badge-28.svg" alt="Visualize in Weights & Biases" width="150" height="24"/>](https://wandb.ai/batuhan409/huggingface/runs/s1imxy2a)
32
 
33
 
34
  This model was trained with SFT.
35
 
36
  ### Framework versions
37
 
38
+ - TRL: 0.24.0
39
+ - Transformers: 5.0.0
40
+ - Pytorch: 2.10.0
41
  - Datasets: 4.3.0
42
  - Tokenizers: 0.22.2
43
 
adapter_config.json ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alora_invocation_tokens": null,
3
+ "alpha_pattern": {},
4
+ "arrow_config": null,
5
+ "auto_mapping": {
6
+ "base_model_class": "Qwen3ForCausalLM",
7
+ "parent_library": "transformers.models.qwen3.modeling_qwen3",
8
+ "unsloth_fixed": true
9
+ },
10
+ "base_model_name_or_path": "Ba2han/qwen-augment-2511",
11
+ "bias": "none",
12
+ "corda_config": null,
13
+ "ensure_weight_tying": false,
14
+ "eva_config": null,
15
+ "exclude_modules": null,
16
+ "fan_in_fan_out": false,
17
+ "inference_mode": true,
18
+ "init_lora_weights": true,
19
+ "layer_replication": null,
20
+ "layers_pattern": null,
21
+ "layers_to_transform": null,
22
+ "loftq_config": {},
23
+ "lora_alpha": 64,
24
+ "lora_bias": false,
25
+ "lora_dropout": 0,
26
+ "megatron_config": null,
27
+ "megatron_core": "megatron.core",
28
+ "modules_to_save": null,
29
+ "peft_type": "LORA",
30
+ "peft_version": "0.18.1",
31
+ "qalora_group_size": 16,
32
+ "r": 64,
33
+ "rank_pattern": {},
34
+ "revision": null,
35
+ "target_modules": [
36
+ "gate_proj",
37
+ "k_proj",
38
+ "up_proj",
39
+ "v_proj",
40
+ "o_proj",
41
+ "down_proj",
42
+ "q_proj"
43
+ ],
44
+ "target_parameters": null,
45
+ "task_type": "CAUSAL_LM",
46
+ "trainable_token_indices": null,
47
+ "use_dora": true,
48
+ "use_qalora": false,
49
+ "use_rslora": false
50
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a82542a3e6c5ad0ca85df359d7d9aff75e81685dbd375c3f64d3c0945757c3f
3
+ size 533009160
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:be75606093db2094d7cd20f3c2f385c212750648bd6ea4fb2bf507a6a4c55506
3
- size 11422650
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:476870a1f2fb6f6a2759a6ede2383bf9d5d738f17844563b65c91965b722ae09
3
+ size 11422924
tokenizer_config.json CHANGED
@@ -20,7 +20,7 @@
20
  "<|image_pad|>",
21
  "<|video_pad|>"
22
  ],
23
- "is_local": true,
24
  "model_max_length": 32768,
25
  "model_specific_special_tokens": {},
26
  "pad_token": "<|vision_pad|>",
 
20
  "<|image_pad|>",
21
  "<|video_pad|>"
22
  ],
23
+ "is_local": false,
24
  "model_max_length": 32768,
25
  "model_specific_special_tokens": {},
26
  "pad_token": "<|vision_pad|>",
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c79d9e3b60f9ae736e60257b55244a1f4a487531095b2990f156ad6ec799a46d
3
  size 5713
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:943c26076dfdedd9e28c802520a1c026bc1af685198b510701a3ead07fd3b809
3
  size 5713