raniero committed on
Commit
d1378de
·
1 Parent(s): 7671ece

Nuovo training DPO con Mistral-7B-Instruct-v0.2, modelli aggiornati

Browse files
Files changed (3) hide show
  1. README.md +1 -22
  2. adapter_config.json +8 -3
  3. adapter_model.safetensors +1 -1
README.md CHANGED
@@ -1,22 +1 @@
1
- ---
2
- base_model: meta-llama/Llama-2-7b-hf
3
- tags:
4
- - LoRA
5
- - bittensor
6
- - gradients
7
- license: apache-2.0
8
- ---
9
-
10
- # Submission for task `dpo_test_finale_007`
11
-
12
- Fine-tuned using LoRA on dynamic dataset.
13
-
14
- - Task ID: `dpo_test_finale_007`
15
- - Repo: `dpo_test_finale_007`
16
- - SHA256: 5fa30211ee0266cbc3c9828a45679020d334b290c39d60fd8666fbe8c510af75
17
- - Timestamp: 2025-07-30T17:24:34.233691
18
- ## URLs per validator
19
-
20
- - [Adapter Model](https://huggingface.co/raniero/dpo_test_finale_007/resolve/main/adapter_model.safetensors)
21
- - [Adapter Config](https://huggingface.co/raniero/dpo_test_finale_007/raw/main/adapter_config.json)
22
- - [README](https://huggingface.co/raniero/dpo_test_finale_007/raw/main/README.md)
 
1
+ Modello addestrato con DPOTask
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "peft_type": "LORA",
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "meta-llama/Llama-2-7b-hf",
5
  "revision": null,
6
  "task_type": "CAUSAL_LM",
7
  "inference_mode": false,
@@ -17,5 +17,10 @@
17
  "modules_to_save": null,
18
  "init_lora_weights": true,
19
  "layers_to_transform": null,
20
- "layers_pattern": null
21
- }
 
 
 
 
 
 
1
  {
2
  "peft_type": "LORA",
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "mistralai/Mistral-7B-Instruct-v0.2",
5
  "revision": null,
6
  "task_type": "CAUSAL_LM",
7
  "inference_mode": false,
 
17
  "modules_to_save": null,
18
  "init_lora_weights": true,
19
  "layers_to_transform": null,
20
+ "layers_pattern": null,
21
+ "rank_pattern": {},
22
+ "alpha_pattern": {},
23
+ "megatron_config": null,
24
+ "megatron_core": "megatron.core",
25
+ "loftq_config": {}
26
+ }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fa30211ee0266cbc3c9828a45679020d334b290c39d60fd8666fbe8c510af75
3
  size 13648400
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:160e8454f5c4745fe0d9954328e167444c9193b788f1f1042ada27485b551a07
3
  size 13648400