4bits-quantized
#2
by alphrc - opened
This view is limited to 50 files because it contains too many changes. See the raw diff here.
- .DS_Store +0 -0
- README.md +0 -208
- config.json +0 -42
- model-00001-of-00046.safetensors +0 -3
- model-00002-of-00046.safetensors +0 -3
- model-00003-of-00046.safetensors +0 -3
- model-00004-of-00046.safetensors +0 -3
- model-00005-of-00046.safetensors +0 -3
- model-00006-of-00046.safetensors +0 -3
- model-00007-of-00046.safetensors +0 -3
- model-00008-of-00046.safetensors +0 -3
- model-00009-of-00046.safetensors +0 -3
- model-00010-of-00046.safetensors +0 -3
- model-00011-of-00046.safetensors +0 -3
- model-00012-of-00046.safetensors +0 -3
- model-00013-of-00046.safetensors +0 -3
- model-00014-of-00046.safetensors +0 -3
- model-00015-of-00046.safetensors +0 -3
- model-00016-of-00046.safetensors +0 -3
- model-00017-of-00046.safetensors +0 -3
- model-00018-of-00046.safetensors +0 -3
- model-00019-of-00046.safetensors +0 -3
- model-00020-of-00046.safetensors +0 -3
- model-00021-of-00046.safetensors +0 -3
- model-00022-of-00046.safetensors +0 -3
- model-00023-of-00046.safetensors +0 -3
- model-00024-of-00046.safetensors +0 -3
- model-00025-of-00046.safetensors +0 -3
- model-00026-of-00046.safetensors +0 -3
- model-00027-of-00046.safetensors +0 -3
- model-00028-of-00046.safetensors +0 -3
- model-00029-of-00046.safetensors +0 -3
- model-00030-of-00046.safetensors +0 -3
- model-00031-of-00046.safetensors +0 -3
- model-00032-of-00046.safetensors +0 -3
- model-00033-of-00046.safetensors +0 -3
- model-00034-of-00046.safetensors +0 -3
- model-00035-of-00046.safetensors +0 -3
- model-00036-of-00046.safetensors +0 -3
- model-00037-of-00046.safetensors +0 -3
- model-00038-of-00046.safetensors +0 -3
- model-00039-of-00046.safetensors +0 -3
- model-00040-of-00046.safetensors +0 -3
- model-00041-of-00046.safetensors +0 -3
- model-00042-of-00046.safetensors +0 -3
- model-00043-of-00046.safetensors +0 -3
- model-00044-of-00046.safetensors +0 -3
- model-00045-of-00046.safetensors +0 -3
- model-00046-of-00046.safetensors +0 -3
- model.safetensors.index.json +0 -0
.DS_Store
DELETED
|
Binary file (6.15 kB)
|
|
|
README.md
DELETED
|
@@ -1,208 +0,0 @@
|
|
| 1 |
-
---
|
| 2 |
-
language:
|
| 3 |
-
- en
|
| 4 |
-
- de
|
| 5 |
-
- fr
|
| 6 |
-
- it
|
| 7 |
-
- pt
|
| 8 |
-
- hi
|
| 9 |
-
- es
|
| 10 |
-
- th
|
| 11 |
-
library_name: transformers
|
| 12 |
-
license: llama3.1
|
| 13 |
-
pipeline_tag: text-generation
|
| 14 |
-
tags:
|
| 15 |
-
- facebook
|
| 16 |
-
- meta
|
| 17 |
-
- pytorch
|
| 18 |
-
- llama
|
| 19 |
-
- llama-3
|
| 20 |
-
- mlx
|
| 21 |
-
extra_gated_prompt: "### LLAMA 3.1 COMMUNITY LICENSE AGREEMENT\nLlama 3.1 Version\
|
| 22 |
-
\ Release Date: July 23, 2024\n\"Agreement\" means the terms and conditions for\
|
| 23 |
-
\ use, reproduction, distribution and modification of the Llama Materials set forth\
|
| 24 |
-
\ herein.\n\"Documentation\" means the specifications, manuals and documentation\
|
| 25 |
-
\ accompanying Llama 3.1 distributed by Meta at https://llama.meta.com/doc/overview.\n\
|
| 26 |
-
\"Licensee\" or \"you\" means you, or your employer or any other person or entity\
|
| 27 |
-
\ (if you are entering into this Agreement on such person or entity’s behalf), of\
|
| 28 |
-
\ the age required under applicable laws, rules or regulations to provide legal\
|
| 29 |
-
\ consent and that has legal authority to bind your employer or such other person\
|
| 30 |
-
\ or entity if you are entering in this Agreement on their behalf.\n\"Llama 3.1\"\
|
| 31 |
-
\ means the foundational large language models and software and algorithms, including\
|
| 32 |
-
\ machine-learning model code, trained model weights, inference-enabling code, training-enabling\
|
| 33 |
-
\ code, fine-tuning enabling code and other elements of the foregoing distributed\
|
| 34 |
-
\ by Meta at https://llama.meta.com/llama-downloads.\n\"Llama Materials\" means,\
|
| 35 |
-
\ collectively, Meta’s proprietary Llama 3.1 and Documentation (and any portion\
|
| 36 |
-
\ thereof) made available under this Agreement.\n\"Meta\" or \"we\" means Meta Platforms\
|
| 37 |
-
\ Ireland Limited (if you are located in or, if you are an entity, your principal\
|
| 38 |
-
\ place of business is in the EEA or Switzerland) and Meta Platforms, Inc. (if you\
|
| 39 |
-
\ are located outside of the EEA or Switzerland).\n \n1. License Rights and Redistribution.\n\
|
| 40 |
-
a. Grant of Rights. You are granted a non-exclusive, worldwide, non-transferable\
|
| 41 |
-
\ and royalty-free limited license under Meta’s intellectual property or other rights\
|
| 42 |
-
\ owned by Meta embodied in the Llama Materials to use, reproduce, distribute, copy,\
|
| 43 |
-
\ create derivative works of, and make modifications to the Llama Materials.\nb.\
|
| 44 |
-
\ Redistribution and Use.\ni. If you distribute or make available the Llama Materials\
|
| 45 |
-
\ (or any derivative works thereof), or a product or service (including another\
|
| 46 |
-
\ AI model) that contains any of them, you shall (A) provide a copy of this Agreement\
|
| 47 |
-
\ with any such Llama Materials; and (B) prominently display “Built with Llama”\
|
| 48 |
-
\ on a related website, user interface, blogpost, about page, or product documentation.\
|
| 49 |
-
\ If you use the Llama Materials or any outputs or results of the Llama Materials\
|
| 50 |
-
\ to create, train, fine tune, or otherwise improve an AI model, which is distributed\
|
| 51 |
-
\ or made available, you shall also include “Llama” at the beginning of any such\
|
| 52 |
-
\ AI model name.\nii. If you receive Llama Materials, or any derivative works thereof,\
|
| 53 |
-
\ from a Licensee as part of an integrated end user product, then Section 2 of\
|
| 54 |
-
\ this Agreement will not apply to you.\niii. You must retain in all copies of the\
|
| 55 |
-
\ Llama Materials that you distribute the following attribution notice within a\
|
| 56 |
-
\ “Notice” text file distributed as a part of such copies: “Llama 3.1 is licensed\
|
| 57 |
-
\ under the Llama 3.1 Community License, Copyright © Meta Platforms, Inc. All Rights\
|
| 58 |
-
\ Reserved.”\niv. Your use of the Llama Materials must comply with applicable laws\
|
| 59 |
-
\ and regulations (including trade compliance laws and regulations) and adhere to\
|
| 60 |
-
\ the Acceptable Use Policy for the Llama Materials (available at https://llama.meta.com/llama3_1/use-policy),\
|
| 61 |
-
\ which is hereby incorporated by reference into this Agreement.\n2. Additional\
|
| 62 |
-
\ Commercial Terms. If, on the Llama 3.1 version release date, the monthly active\
|
| 63 |
-
\ users of the products or services made available by or for Licensee, or Licensee’s\
|
| 64 |
-
\ affiliates, is greater than 700 million monthly active users in the preceding\
|
| 65 |
-
\ calendar month, you must request a license from Meta, which Meta may grant to\
|
| 66 |
-
\ you in its sole discretion, and you are not authorized to exercise any of the\
|
| 67 |
-
\ rights under this Agreement unless or until Meta otherwise expressly grants you\
|
| 68 |
-
\ such rights.\n3. Disclaimer of Warranty. UNLESS REQUIRED BY APPLICABLE LAW, THE\
|
| 69 |
-
\ LLAMA MATERIALS AND ANY OUTPUT AND RESULTS THEREFROM ARE PROVIDED ON AN “AS IS”\
|
| 70 |
-
\ BASIS, WITHOUT WARRANTIES OF ANY KIND, AND META DISCLAIMS ALL WARRANTIES OF ANY\
|
| 71 |
-
\ KIND, BOTH EXPRESS AND IMPLIED, INCLUDING, WITHOUT LIMITATION, ANY WARRANTIES\
|
| 72 |
-
\ OF TITLE, NON-INFRINGEMENT, MERCHANTABILITY, OR FITNESS FOR A PARTICULAR PURPOSE.\
|
| 73 |
-
\ YOU ARE SOLELY RESPONSIBLE FOR DETERMINING THE APPROPRIATENESS OF USING OR REDISTRIBUTING\
|
| 74 |
-
\ THE LLAMA MATERIALS AND ASSUME ANY RISKS ASSOCIATED WITH YOUR USE OF THE LLAMA\
|
| 75 |
-
\ MATERIALS AND ANY OUTPUT AND RESULTS.\n4. Limitation of Liability. IN NO EVENT\
|
| 76 |
-
\ WILL META OR ITS AFFILIATES BE LIABLE UNDER ANY THEORY OF LIABILITY, WHETHER IN\
|
| 77 |
-
\ CONTRACT, TORT, NEGLIGENCE, PRODUCTS LIABILITY, OR OTHERWISE, ARISING OUT OF THIS\
|
| 78 |
-
\ AGREEMENT, FOR ANY LOST PROFITS OR ANY INDIRECT, SPECIAL, CONSEQUENTIAL, INCIDENTAL,\
|
| 79 |
-
\ EXEMPLARY OR PUNITIVE DAMAGES, EVEN IF META OR ITS AFFILIATES HAVE BEEN ADVISED\
|
| 80 |
-
\ OF THE POSSIBILITY OF ANY OF THE FOREGOING.\n5. Intellectual Property.\na. No\
|
| 81 |
-
\ trademark licenses are granted under this Agreement, and in connection with the\
|
| 82 |
-
\ Llama Materials, neither Meta nor Licensee may use any name or mark owned by or\
|
| 83 |
-
\ associated with the other or any of its affiliates, except as required for reasonable\
|
| 84 |
-
\ and customary use in describing and redistributing the Llama Materials or as set\
|
| 85 |
-
\ forth in this Section 5(a). Meta hereby grants you a license to use “Llama” (the\
|
| 86 |
-
\ “Mark”) solely as required to comply with the last sentence of Section 1.b.i.\
|
| 87 |
-
\ You will comply with Meta’s brand guidelines (currently accessible at https://about.meta.com/brand/resources/meta/company-brand/\
|
| 88 |
-
\ ). All goodwill arising out of your use of the Mark will inure to the benefit\
|
| 89 |
-
\ of Meta.\nb. Subject to Meta’s ownership of Llama Materials and derivatives made\
|
| 90 |
-
\ by or for Meta, with respect to any derivative works and modifications of the\
|
| 91 |
-
\ Llama Materials that are made by you, as between you and Meta, you are and will\
|
| 92 |
-
\ be the owner of such derivative works and modifications.\nc. If you institute\
|
| 93 |
-
\ litigation or other proceedings against Meta or any entity (including a cross-claim\
|
| 94 |
-
\ or counterclaim in a lawsuit) alleging that the Llama Materials or Llama 3.1 outputs\
|
| 95 |
-
\ or results, or any portion of any of the foregoing, constitutes infringement of\
|
| 96 |
-
\ intellectual property or other rights owned or licensable by you, then any licenses\
|
| 97 |
-
\ granted to you under this Agreement shall terminate as of the date such litigation\
|
| 98 |
-
\ or claim is filed or instituted. You will indemnify and hold harmless Meta from\
|
| 99 |
-
\ and against any claim by any third party arising out of or related to your use\
|
| 100 |
-
\ or distribution of the Llama Materials.\n6. Term and Termination. The term of\
|
| 101 |
-
\ this Agreement will commence upon your acceptance of this Agreement or access\
|
| 102 |
-
\ to the Llama Materials and will continue in full force and effect until terminated\
|
| 103 |
-
\ in accordance with the terms and conditions herein. Meta may terminate this Agreement\
|
| 104 |
-
\ if you are in breach of any term or condition of this Agreement. Upon termination\
|
| 105 |
-
\ of this Agreement, you shall delete and cease use of the Llama Materials. Sections\
|
| 106 |
-
\ 3, 4 and 7 shall survive the termination of this Agreement.\n7. Governing Law\
|
| 107 |
-
\ and Jurisdiction. This Agreement will be governed and construed under the laws\
|
| 108 |
-
\ of the State of California without regard to choice of law principles, and the\
|
| 109 |
-
\ UN Convention on Contracts for the International Sale of Goods does not apply\
|
| 110 |
-
\ to this Agreement. The courts of California shall have exclusive jurisdiction\
|
| 111 |
-
\ of any dispute arising out of this Agreement.\n### Llama 3.1 Acceptable Use Policy\n\
|
| 112 |
-
Meta is committed to promoting safe and fair use of its tools and features, including\
|
| 113 |
-
\ Llama 3.1. If you access or use Llama 3.1, you agree to this Acceptable Use Policy\
|
| 114 |
-
\ (“Policy”). The most recent copy of this policy can be found at [https://llama.meta.com/llama3_1/use-policy](https://llama.meta.com/llama3_1/use-policy)\n\
|
| 115 |
-
#### Prohibited Uses\nWe want everyone to use Llama 3.1 safely and responsibly.\
|
| 116 |
-
\ You agree you will not use, or allow others to use, Llama 3.1 to:\n 1. Violate\
|
| 117 |
-
\ the law or others’ rights, including to:\n 1. Engage in, promote, generate,\
|
| 118 |
-
\ contribute to, encourage, plan, incite, or further illegal or unlawful activity\
|
| 119 |
-
\ or content, such as:\n 1. Violence or terrorism\n 2. Exploitation\
|
| 120 |
-
\ or harm to children, including the solicitation, creation, acquisition, or dissemination\
|
| 121 |
-
\ of child exploitative content or failure to report Child Sexual Abuse Material\n\
|
| 122 |
-
\ 3. Human trafficking, exploitation, and sexual violence\n 4. The\
|
| 123 |
-
\ illegal distribution of information or materials to minors, including obscene\
|
| 124 |
-
\ materials, or failure to employ legally required age-gating in connection with\
|
| 125 |
-
\ such information or materials.\n 5. Sexual solicitation\n 6. Any\
|
| 126 |
-
\ other criminal activity\n 3. Engage in, promote, incite, or facilitate the\
|
| 127 |
-
\ harassment, abuse, threatening, or bullying of individuals or groups of individuals\n\
|
| 128 |
-
\ 4. Engage in, promote, incite, or facilitate discrimination or other unlawful\
|
| 129 |
-
\ or harmful conduct in the provision of employment, employment benefits, credit,\
|
| 130 |
-
\ housing, other economic benefits, or other essential goods and services\n 5.\
|
| 131 |
-
\ Engage in the unauthorized or unlicensed practice of any profession including,\
|
| 132 |
-
\ but not limited to, financial, legal, medical/health, or related professional\
|
| 133 |
-
\ practices\n 6. Collect, process, disclose, generate, or infer health, demographic,\
|
| 134 |
-
\ or other sensitive personal or private information about individuals without rights\
|
| 135 |
-
\ and consents required by applicable laws\n 7. Engage in or facilitate any action\
|
| 136 |
-
\ or generate any content that infringes, misappropriates, or otherwise violates\
|
| 137 |
-
\ any third-party rights, including the outputs or results of any products or services\
|
| 138 |
-
\ using the Llama Materials\n 8. Create, generate, or facilitate the creation\
|
| 139 |
-
\ of malicious code, malware, computer viruses or do anything else that could disable,\
|
| 140 |
-
\ overburden, interfere with or impair the proper working, integrity, operation\
|
| 141 |
-
\ or appearance of a website or computer system\n2. Engage in, promote, incite,\
|
| 142 |
-
\ facilitate, or assist in the planning or development of activities that present\
|
| 143 |
-
\ a risk of death or bodily harm to individuals, including use of Llama 3.1 related\
|
| 144 |
-
\ to the following:\n 1. Military, warfare, nuclear industries or applications,\
|
| 145 |
-
\ espionage, use for materials or activities that are subject to the International\
|
| 146 |
-
\ Traffic Arms Regulations (ITAR) maintained by the United States Department of\
|
| 147 |
-
\ State\n 2. Guns and illegal weapons (including weapon development)\n 3.\
|
| 148 |
-
\ Illegal drugs and regulated/controlled substances\n 4. Operation of critical\
|
| 149 |
-
\ infrastructure, transportation technologies, or heavy machinery\n 5. Self-harm\
|
| 150 |
-
\ or harm to others, including suicide, cutting, and eating disorders\n 6. Any\
|
| 151 |
-
\ content intended to incite or promote violence, abuse, or any infliction of bodily\
|
| 152 |
-
\ harm to an individual\n3. Intentionally deceive or mislead others, including use\
|
| 153 |
-
\ of Llama 3.1 related to the following:\n 1. Generating, promoting, or furthering\
|
| 154 |
-
\ fraud or the creation or promotion of disinformation\n 2. Generating, promoting,\
|
| 155 |
-
\ or furthering defamatory content, including the creation of defamatory statements,\
|
| 156 |
-
\ images, or other content\n 3. Generating, promoting, or further distributing\
|
| 157 |
-
\ spam\n 4. Impersonating another individual without consent, authorization,\
|
| 158 |
-
\ or legal right\n 5. Representing that the use of Llama 3.1 or outputs are human-generated\n\
|
| 159 |
-
\ 6. Generating or facilitating false online engagement, including fake reviews\
|
| 160 |
-
\ and other means of fake online engagement\n4. Fail to appropriately disclose to\
|
| 161 |
-
\ end users any known dangers of your AI system\nPlease report any violation of\
|
| 162 |
-
\ this Policy, software “bug,” or other problems that could lead to a violation\
|
| 163 |
-
\ of this Policy through one of the following means:\n * Reporting issues with\
|
| 164 |
-
\ the model: [https://github.com/meta-llama/llama-models/issues](https://github.com/meta-llama/llama-models/issues)\n\
|
| 165 |
-
\ * Reporting risky content generated by the model:\n developers.facebook.com/llama_output_feedback\n\
|
| 166 |
-
\ * Reporting bugs and security concerns: facebook.com/whitehat/info\n * Reporting\
|
| 167 |
-
\ violations of the Acceptable Use Policy or unlicensed uses of Meta Llama 3: LlamaUseReport@meta.com"
|
| 168 |
-
extra_gated_fields:
|
| 169 |
-
First Name: text
|
| 170 |
-
Last Name: text
|
| 171 |
-
Date of birth: date_picker
|
| 172 |
-
Country: country
|
| 173 |
-
Affiliation: text
|
| 174 |
-
Job title:
|
| 175 |
-
type: select
|
| 176 |
-
options:
|
| 177 |
-
- Student
|
| 178 |
-
- Research Graduate
|
| 179 |
-
- AI researcher
|
| 180 |
-
- AI developer/engineer
|
| 181 |
-
- Reporter
|
| 182 |
-
- Other
|
| 183 |
-
geo: ip_location
|
| 184 |
-
? By clicking Submit below I accept the terms of the license and acknowledge that
|
| 185 |
-
the information I provide will be collected stored processed and shared in accordance
|
| 186 |
-
with the Meta Privacy Policy
|
| 187 |
-
: checkbox
|
| 188 |
-
extra_gated_description: The information you provide will be collected, stored, processed
|
| 189 |
-
and shared in accordance with the [Meta Privacy Policy](https://www.facebook.com/privacy/policy/).
|
| 190 |
-
extra_gated_button_content: Submit
|
| 191 |
-
---
|
| 192 |
-
|
| 193 |
-
# mlx-community/Meta-Llama-3.1-405B-4bit
|
| 194 |
-
|
| 195 |
-
The Model [mlx-community/Meta-Llama-3.1-405B-4bit](https://huggingface.co/mlx-community/Meta-Llama-3.1-405B-4bit) was converted to MLX format from [meta-llama/Meta-Llama-3.1-405B-Instruct](https://huggingface.co/meta-llama/Meta-Llama-3.1-405B-Instruct) using mlx-lm version **0.16.0**.
|
| 196 |
-
|
| 197 |
-
## Use with mlx
|
| 198 |
-
|
| 199 |
-
```bash
|
| 200 |
-
pip install mlx-lm
|
| 201 |
-
```
|
| 202 |
-
|
| 203 |
-
```python
|
| 204 |
-
from mlx_lm import load, generate
|
| 205 |
-
|
| 206 |
-
model, tokenizer = load("mlx-community/Meta-Llama-3.1-405B-4bit")
|
| 207 |
-
response = generate(model, tokenizer, prompt="hello", verbose=True)
|
| 208 |
-
```
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
config.json
DELETED
|
@@ -1,42 +0,0 @@
|
|
| 1 |
-
{
|
| 2 |
-
"architectures": [
|
| 3 |
-
"LlamaForCausalLM"
|
| 4 |
-
],
|
| 5 |
-
"attention_bias": false,
|
| 6 |
-
"attention_dropout": 0.0,
|
| 7 |
-
"bos_token_id": 128000,
|
| 8 |
-
"eos_token_id": [
|
| 9 |
-
128001,
|
| 10 |
-
128008,
|
| 11 |
-
128009
|
| 12 |
-
],
|
| 13 |
-
"hidden_act": "silu",
|
| 14 |
-
"hidden_size": 16384,
|
| 15 |
-
"initializer_range": 0.02,
|
| 16 |
-
"intermediate_size": 53248,
|
| 17 |
-
"max_position_embeddings": 131072,
|
| 18 |
-
"mlp_bias": false,
|
| 19 |
-
"model_type": "llama",
|
| 20 |
-
"num_attention_heads": 128,
|
| 21 |
-
"num_hidden_layers": 126,
|
| 22 |
-
"num_key_value_heads": 16,
|
| 23 |
-
"pretraining_tp": 1,
|
| 24 |
-
"quantization": {
|
| 25 |
-
"group_size": 64,
|
| 26 |
-
"bits": 4
|
| 27 |
-
},
|
| 28 |
-
"rms_norm_eps": 1e-05,
|
| 29 |
-
"rope_scaling": {
|
| 30 |
-
"factor": 8.0,
|
| 31 |
-
"low_freq_factor": 1.0,
|
| 32 |
-
"high_freq_factor": 4.0,
|
| 33 |
-
"original_max_position_embeddings": 8192,
|
| 34 |
-
"rope_type": "llama3"
|
| 35 |
-
},
|
| 36 |
-
"rope_theta": 500000.0,
|
| 37 |
-
"tie_word_embeddings": false,
|
| 38 |
-
"torch_dtype": "bfloat16",
|
| 39 |
-
"transformers_version": "4.42.3",
|
| 40 |
-
"use_cache": true,
|
| 41 |
-
"vocab_size": 128256
|
| 42 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
model-00001-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:268097ba386415bb23a5ef1b152de35b38b5520275046077b5c731ee721b147c
|
| 3 |
-
size 5145762627
|
|
|
|
|
|
|
|
|
|
|
|
model-00002-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:a7876692da74b40fe070617b31c2d0f29659186d67837e4cae67cd20a695c7b9
|
| 3 |
-
size 5285027186
|
|
|
|
|
|
|
|
|
|
|
|
model-00003-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:717c03e181a9cb48047cf4af02acb231a41f3718770e0040711c0a8db815ac83
|
| 3 |
-
size 5247277780
|
|
|
|
|
|
|
|
|
|
|
|
model-00004-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:4cf0c6237d38f692695ab2268fb3cf4a85958a4336af496a700514d38d1ae5ea
|
| 3 |
-
size 4945222858
|
|
|
|
|
|
|
|
|
|
|
|
model-00005-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:c18258d23019872ecfee5caddd045c7be7642453bcc693c757188fa24df94295
|
| 3 |
-
size 4945288661
|
|
|
|
|
|
|
|
|
|
|
|
model-00006-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:246a89743cc9fb1edde7c5900dbd1350a0560595f3fbd0fbe5103cd912446081
|
| 3 |
-
size 4945288655
|
|
|
|
|
|
|
|
|
|
|
|
model-00007-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:beb791f71a5353fa80b9cc3e3a03d85d49897bc3c3c480fd7c271fc341d2eeee
|
| 3 |
-
size 5285027250
|
|
|
|
|
|
|
|
|
|
|
|
model-00008-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:763228be7259c199327373f1b7c88748507fd2be76576d702c6425768815199d
|
| 3 |
-
size 5247277832
|
|
|
|
|
|
|
|
|
|
|
|
model-00009-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:dd11eca4fdbd6260a202b3efce39c34b2bcc1835188b5e6cc76aba5f977dceeb
|
| 3 |
-
size 4945222908
|
|
|
|
|
|
|
|
|
|
|
|
model-00010-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:5668d5881b2ec384472aa2da4ffb5f3bee136a13390c979d03395c68334cac16
|
| 3 |
-
size 4945288665
|
|
|
|
|
|
|
|
|
|
|
|
model-00011-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:f2d3e52ed41f153217b2d7733aeea2de6c7f13fb229714778eebe34e6fc7cde1
|
| 3 |
-
size 4945288651
|
|
|
|
|
|
|
|
|
|
|
|
model-00012-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:36e1490b2075dfd959e5e686ed7ec3b04bd83fcdcb134b6b4cde3bf0038f8d9d
|
| 3 |
-
size 5285027248
|
|
|
|
|
|
|
|
|
|
|
|
model-00013-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:f156ef76a9c4b129c4c71e713faf466684a31e95325201c93f87cfd6e5eb8984
|
| 3 |
-
size 5247277822
|
|
|
|
|
|
|
|
|
|
|
|
model-00014-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:e49f8ac24640653003d2fa14a3b2004d344bd619bca385e286c1be91786a4215
|
| 3 |
-
size 4945222900
|
|
|
|
|
|
|
|
|
|
|
|
model-00015-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:6b4e1f720976bda0c4c67590ee41c8a39db03e4bca94bc776fe19d35e0c2382f
|
| 3 |
-
size 4945288657
|
|
|
|
|
|
|
|
|
|
|
|
model-00016-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:f17c5d446d6344891cb0d44b5d0677bba269c2611e66ab61cadcbe54451ea8e3
|
| 3 |
-
size 4945288667
|
|
|
|
|
|
|
|
|
|
|
|
model-00017-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:bbec628e1c188cbfb0a2f92ad08ff2f4a09d8e802a10d0cdc9bbc0a9546f73ea
|
| 3 |
-
size 5285027268
|
|
|
|
|
|
|
|
|
|
|
|
model-00018-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:876fd572c22dec3bc10b99a5fb9dbc303ab15310f59778c22a710a649bcb4e19
|
| 3 |
-
size 5247277834
|
|
|
|
|
|
|
|
|
|
|
|
model-00019-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:9d5544e53401058c49d79d0e4dfcf105452a73753c1383b7bb37e3a78be47e30
|
| 3 |
-
size 4945222890
|
|
|
|
|
|
|
|
|
|
|
|
model-00020-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:66eea6378ed4f969098d1f999690f34b115f37156d1a86288d69858e06d55e3b
|
| 3 |
-
size 4945288665
|
|
|
|
|
|
|
|
|
|
|
|
model-00021-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:e5ce0c3544bb4bf8b7795704dd7a63012606669359f6962a24da3c60ce3e3926
|
| 3 |
-
size 4945288643
|
|
|
|
|
|
|
|
|
|
|
|
model-00022-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:b3ad9e986d45ab4267b22056661f603afe964e9aeedb956f2e99b9a49e786051
|
| 3 |
-
size 5285027256
|
|
|
|
|
|
|
|
|
|
|
|
model-00023-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:8c7d53004e94688fbd3fee63981652ac0ce596f1f0d77ccf04a989045586db76
|
| 3 |
-
size 5247277830
|
|
|
|
|
|
|
|
|
|
|
|
model-00024-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:0d50b89a547e0dd2ff1c2f520ad06f9c611c529669e16d10b2698ad7d4d7eaf7
|
| 3 |
-
size 4945222912
|
|
|
|
|
|
|
|
|
|
|
|
model-00025-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:71bc832eff038e3104bdb301c06eb0a985a3b324664edb5f3ab748c26dd82669
|
| 3 |
-
size 4945288659
|
|
|
|
|
|
|
|
|
|
|
|
model-00026-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:6fc422642b46abe7cdf0e53f34e857a8d9f7d96d1e64a70cdea04694093abab2
|
| 3 |
-
size 4945288645
|
|
|
|
|
|
|
|
|
|
|
|
model-00027-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:78f9203d5986ce4c37f43134cb1d7f4257a87de021ea01277d74b77c6882f2e0
|
| 3 |
-
size 5285027256
|
|
|
|
|
|
|
|
|
|
|
|
model-00028-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:8ddd7f803a8966e254b1ff434690f35efeb07be2bd5c9b8a2b9d9a945e628739
|
| 3 |
-
size 5247277828
|
|
|
|
|
|
|
|
|
|
|
|
model-00029-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:c1e91ed0054c35887226166f1d3fec120a3587fb8f60384d8648a3294ff5c977
|
| 3 |
-
size 4945222890
|
|
|
|
|
|
|
|
|
|
|
|
model-00030-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:1f0be9829f46e1ce872274c198cd5c2d7802074f75cce830054c28ca0f9443df
|
| 3 |
-
size 4945288649
|
|
|
|
|
|
|
|
|
|
|
|
model-00031-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:81241ab3b7831569a371fd25b03568649598345be551ee3dc4bbd0273b0850c9
|
| 3 |
-
size 4945288637
|
|
|
|
|
|
|
|
|
|
|
|
model-00032-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:00fab98ab224be34c0e5fa1a87099bc73535299d0cbd48f76c7611b7c8e9d468
|
| 3 |
-
size 5285027272
|
|
|
|
|
|
|
|
|
|
|
|
model-00033-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:9cba63880493b3d5bd487d009cd64777b0436197fcf44744f542cb9daa5e4f92
|
| 3 |
-
size 5247277832
|
|
|
|
|
|
|
|
|
|
|
|
model-00034-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:46dfee6401f487976effe9abb88a410fde1cf72c60046cc501bfe89863350e10
|
| 3 |
-
size 4945222894
|
|
|
|
|
|
|
|
|
|
|
|
model-00035-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:f0a1fa4ece2105d504eda39cdaca997b53b8c706975ff0b1cf0a4a41b23165f6
|
| 3 |
-
size 4945288661
|
|
|
|
|
|
|
|
|
|
|
|
model-00036-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:14a1946196dc28d961914215c78f872a70180e17bd21faeb16507a993e5ed709
|
| 3 |
-
size 4945288653
|
|
|
|
|
|
|
|
|
|
|
|
model-00037-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:8f1160cdf984866b74b850232df106bd235b5fd3a6e4f87902b8ad958ed27857
|
| 3 |
-
size 5285027330
|
|
|
|
|
|
|
|
|
|
|
|
model-00038-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:00c661bb35b49fb0fab9d42a1c718bda9a3f31a14b0a59a8b582daa34412d7dd
|
| 3 |
-
size 5247277904
|
|
|
|
|
|
|
|
|
|
|
|
model-00039-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:e19182258a20bdfab54d68a034ff4024c92a1d7f7ccb3bb14533cdf7043d2f6f
|
| 3 |
-
size 4945222950
|
|
|
|
|
|
|
|
|
|
|
|
model-00040-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:2f2a9721724a9c41007c7ae28f32ff241d7f676d967ead8ef88e306eeb47cfb9
|
| 3 |
-
size 4945288695
|
|
|
|
|
|
|
|
|
|
|
|
model-00041-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:648141d00f12e65b7891016ac63cb81c6e41a3867bbc974d5268933061101ff1
|
| 3 |
-
size 4945288701
|
|
|
|
|
|
|
|
|
|
|
|
model-00042-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:e40fd5c164c1b179e4d0f4eba8e3cf7ffae8ea3dc76343fba24f9ce7b05cfe2d
|
| 3 |
-
size 5285027324
|
|
|
|
|
|
|
|
|
|
|
|
model-00043-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:02f093161344f80f5b5dff2b53184fe154d5c5206e1b63e7119222051d01e6d3
|
| 3 |
-
size 5247277896
|
|
|
|
|
|
|
|
|
|
|
|
model-00044-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:f2d9db2f3ab81738250d5072c04a6bf2ae7d19510fcfc45d2ade4e6bb5d8dd74
|
| 3 |
-
size 4945222960
|
|
|
|
|
|
|
|
|
|
|
|
model-00045-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:5f7de4567b170757badbea019d6c2e3ddf839b45107cee1552819cfbcdd0ec85
|
| 3 |
-
size 4945288715
|
|
|
|
|
|
|
|
|
|
|
|
model-00046-of-00046.safetensors
DELETED
|
@@ -1,3 +0,0 @@
|
|
| 1 |
-
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:9f644cf79faf6f2bda1d13721fa9c174eabf953c5c6d2cdff948796e6884d7aa
|
| 3 |
-
size 2163574046
|
|
|
|
|
|
|
|
|
|
|
|
model.safetensors.index.json
DELETED
|
The diff for this file is too large to render.
See raw diff
|
|
|