| | --- |
| | language: |
| | - en |
| | license: llama3 |
| | library_name: transformers |
| | tags: |
| | - axolotl |
| | - finetune |
| | - dpo |
| | - facebook |
| | - meta |
| | - pytorch |
| | - llama |
| | - llama-3 |
| | base_model: meta-llama/Meta-Llama-3-8B-Instruct |
| | model_name: Llama-3-8B-Instruct-DPO-v0.3 |
| | pipeline_tag: text-generation |
| | license_name: llama3 |
| | license_link: LICENSE |
| | inference: true |
| |
|
| | --- |
| | |
| | <img src="./llama-3-merges.webp" alt="Llama-3 DPO Logo" width="500" style="margin-left:auto; margin-right:auto; display:block"/> |
| |
|
| |
|
| | # StudyBuddy! |
| |
|
| | This model is a DPO fine-tune of the `meta-llama/Meta-Llama-3-8B-Instruct` model. |