sky-2002 committed on
Commit
9f68fac
·
verified ·
1 Parent(s): be75a6d

Upload README.md

Browse files
Files changed (1) hide show
  1. README.md +42 -1
README.md CHANGED
@@ -67,7 +67,48 @@ generated_text = generate_text(
67
  print(generated_text)
68
  ```
69
 
70
- ### Method 2: Module-specific imports
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
71
  ```python
72
  from deepseek_tinystories.modeling_deepseek import DeepseekInspiredModel, DeepSeekModelConfig
73
  from deepseek_tinystories.processor import TinyStoriesProcesssor
 
67
  print(generated_text)
68
  ```
69
 
70
+ ### Method 2: Using snapshot_download
71
+ ```python
72
+ from huggingface_hub import snapshot_download
73
+ import sys
74
+ import torch, json
75
+
76
+ # Download the entire repository
77
+ repo_id = "sky-2002/deepseek-tinystories-60M"
78
+ repo_dir = snapshot_download(repo_id)
79
+
80
+ # Import the local package from the downloaded repo
81
+ sys.path.append(str(repo_dir))
82
+
83
+ from deepseek_tinystories import DeepseekInspiredModel, DeepSeekModelConfig, TinyStoriesProcesssor, generate_text
84
+
85
+ # Load config & model
86
+ config_path = f"{repo_dir}/config.json"
87
+ model_path = f"{repo_dir}/pytorch_model.bin"
88
+
89
+ config = DeepSeekModelConfig(**json.load(open(config_path)))
90
+ model = DeepseekInspiredModel(config)
91
+ model.load_state_dict(torch.load(model_path, map_location="cpu"))
92
+ model.eval()
93
+
94
+ # Initialize processor
95
+ processor = TinyStoriesProcesssor()
96
+
97
+ # Generate text
98
+ prompt = "Once upon a time, there was a little girl..."
99
+ generated_text = generate_text(
100
+ model=model,
101
+ data_processor=processor,
102
+ prompt=prompt,
103
+ max_new_tokens=50,
104
+ temperature=0.8,
105
+ top_k=40,
106
+ device="cpu"
107
+ )
108
+ print(generated_text)
109
+ ```
110
+
111
+ ### Method 3: Module-specific imports
112
  ```python
113
  from deepseek_tinystories.modeling_deepseek import DeepseekInspiredModel, DeepSeekModelConfig
114
  from deepseek_tinystories.processor import TinyStoriesProcesssor