Upload README.md
Browse files
README.md
CHANGED
|
@@ -67,7 +67,48 @@ generated_text = generate_text(
|
|
| 67 |
print(generated_text)
|
| 68 |
```
|
| 69 |
|
| 70 |
-
### Method 2:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 71 |
```python
|
| 72 |
from deepseek_tinystories.modeling_deepseek import DeepseekInspiredModel, DeepSeekModelConfig
|
| 73 |
from deepseek_tinystories.processor import TinyStoriesProcesssor
|
|
|
|
| 67 |
print(generated_text)
|
| 68 |
```
|
| 69 |
|
| 70 |
+
### Method 2: Using snapshot_download
|
| 71 |
+
```python
|
| 72 |
+
from huggingface_hub import snapshot_download
|
| 73 |
+
import sys
|
| 74 |
+
import torch, json
|
| 75 |
+
|
| 76 |
+
# Download the entire repository
|
| 77 |
+
repo_id = "sky-2002/deepseek-tinystories-60M"
|
| 78 |
+
repo_dir = snapshot_download(repo_id)
|
| 79 |
+
|
| 80 |
+
# Add the downloaded repo to sys.path so its local package can be imported
|
| 81 |
+
sys.path.append(str(repo_dir))
|
| 82 |
+
|
| 83 |
+
from deepseek_tinystories import DeepseekInspiredModel, DeepSeekModelConfig, TinyStoriesProcesssor, generate_text
|
| 84 |
+
|
| 85 |
+
# Locate the config and weights in the downloaded repo, then build the model and load its weights
|
| 86 |
+
config_path = f"{repo_dir}/config.json"
|
| 87 |
+
model_path = f"{repo_dir}/pytorch_model.bin"
|
| 88 |
+
|
| 89 |
+
config = DeepSeekModelConfig(**json.load(open(config_path)))
|
| 90 |
+
model = DeepseekInspiredModel(config)
|
| 91 |
+
model.load_state_dict(torch.load(model_path, map_location="cpu"))
|
| 92 |
+
model.eval()
|
| 93 |
+
|
| 94 |
+
# Initialize processor
|
| 95 |
+
processor = TinyStoriesProcesssor()
|
| 96 |
+
|
| 97 |
+
# Generate text
|
| 98 |
+
prompt = "Once upon a time, there was a little girl..."
|
| 99 |
+
generated_text = generate_text(
|
| 100 |
+
model=model,
|
| 101 |
+
data_processor=processor,
|
| 102 |
+
prompt=prompt,
|
| 103 |
+
max_new_tokens=50,
|
| 104 |
+
temperature=0.8,
|
| 105 |
+
top_k=40,
|
| 106 |
+
device="cpu"
|
| 107 |
+
)
|
| 108 |
+
print(generated_text)
|
| 109 |
+
```
|
| 110 |
+
|
| 111 |
+
### Method 3: Module-specific imports
|
| 112 |
```python
|
| 113 |
from deepseek_tinystories.modeling_deepseek import DeepseekInspiredModel, DeepSeekModelConfig
|
| 114 |
from deepseek_tinystories.processor import TinyStoriesProcesssor
|