Update README.md
Browse files
README.md
CHANGED
|
@@ -1,3 +1,47 @@
|
|
| 1 |
-
---
|
| 2 |
-
|
| 3 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
---
|
| 2 |
+
library_name: sentis
|
| 3 |
+
tags:
|
| 4 |
+
- unity-sentis
|
| 5 |
+
- onnx
|
| 6 |
+
- smollm
|
| 7 |
+
- causal-lm
|
| 8 |
+
license: apache-2.0
|
| 9 |
+
language:
|
| 10 |
+
- en
|
| 11 |
+
base_model: HuggingFaceTB/SmolLM3-3B
|
| 12 |
+
pipeline_tag: text-generation
|
| 13 |
+
---
|
| 14 |
+
|
| 15 |
+
# SmolLM3-3B for Unity Sentis
|
| 16 |
+
|
| 17 |
+
This repository contains optimized versions of the [SmolLM3-3B](https://huggingface.co/HuggingFaceTB/SmolLM3-3B) model, specifically formatted for use in **Unity Sentis**.
|
| 18 |
+
|
| 19 |
+
## Available Versions
|
| 20 |
+
|
| 21 |
+
| File Name | Format | Precision | Size | Best For |
|
| 22 |
+
| :--- | :--- | :--- | :--- | :--- |
|
| 23 |
+
| `model.onnx` | ONNX | FP32 | ~12GB | High-fidelity source / Desktop |
|
| 24 |
+
| `model_FP16.sentis` | Sentis | FP16 | ~6GB | Balanced Performance / Modern GPUs |
|
| 25 |
+
| `model_Uint8.sentis` | Sentis | Uint8 | ~3GB | Maximum Performance / Mobile / Low-end PC |
|
| 26 |
+
|
| 27 |
+
## How to use in Unity
|
| 28 |
+
|
| 29 |
+
1. **Install Sentis**: Ensure you have the `com.unity.sentis` package installed via the Unity Package Manager (2.1.0+ recommended).
|
| 30 |
+
2. **Download Model**: Download the `.sentis` file of your choice.
|
| 31 |
+
3. **Import**: Drag the `.sentis` file into your Unity Project.
|
| 32 |
+
4. **Setup Tokenizer**: You will need a compatible tokenizer (like the `tokenizer.json` from the base SmolLM3 repo) to convert text to tokens.
|
| 33 |
+
|
| 34 |
+
### Basic C# Loading Snippet
|
| 35 |
+
```csharp
|
| 36 |
+
using Unity.Sentis;
|
| 37 |
+
using UnityEngine;
|
| 38 |
+
|
| 39 |
+
public class MyLLM : MonoBehaviour {
|
| 40 |
+
public ModelAsset modelAsset;
|
| 41 |
+
private Worker engine;
|
| 42 |
+
|
| 43 |
+
void Start() {
|
| 44 |
+
Model runtimeModel = ModelLoader.Load(modelAsset);
|
| 45 |
+
engine = new Worker(runtimeModel, BackendType.GPUCompute);
|
| 46 |
+
}
|
| 47 |
+
}
```
|