Instructions to use SkyworkAIGC/SkyCode with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use SkyworkAIGC/SkyCode with Transformers:
# Use a pipeline as a high-level helper from transformers import pipeline pipe = pipeline("text-generation", model="SkyworkAIGC/SkyCode")# Load model directly from transformers import AutoTokenizer, AutoModelForCausalLM tokenizer = AutoTokenizer.from_pretrained("SkyworkAIGC/SkyCode") model = AutoModelForCausalLM.from_pretrained("SkyworkAIGC/SkyCode") - Notebooks
- Google Colab
- Kaggle
- Local Apps
- vLLM
How to use SkyworkAIGC/SkyCode with vLLM:
Install from pip and serve model
# Install vLLM from pip: pip install vllm # Start the vLLM server: vllm serve "SkyworkAIGC/SkyCode" # Call the server using curl (OpenAI-compatible API): curl -X POST "http://localhost:8000/v1/completions" \ -H "Content-Type: application/json" \ --data '{ "model": "SkyworkAIGC/SkyCode", "prompt": "Once upon a time,", "max_tokens": 512, "temperature": 0.5 }'Use Docker
docker model run hf.co/SkyworkAIGC/SkyCode
- SGLang
How to use SkyworkAIGC/SkyCode with SGLang:
Install from pip and serve model
# Install SGLang from pip: pip install sglang # Start the SGLang server: python3 -m sglang.launch_server \ --model-path "SkyworkAIGC/SkyCode" \ --host 0.0.0.0 \ --port 30000 # Call the server using curl (OpenAI-compatible API): curl -X POST "http://localhost:30000/v1/completions" \ -H "Content-Type: application/json" \ --data '{ "model": "SkyworkAIGC/SkyCode", "prompt": "Once upon a time,", "max_tokens": 512, "temperature": 0.5 }'Use Docker images
docker run --gpus all \ --shm-size 32g \ -p 30000:30000 \ -v ~/.cache/huggingface:/root/.cache/huggingface \ --env "HF_TOKEN=<secret>" \ --ipc=host \ lmsysorg/sglang:latest \ python3 -m sglang.launch_server \ --model-path "SkyworkAIGC/SkyCode" \ --host 0.0.0.0 \ --port 30000 # Call the server using curl (OpenAI-compatible API): curl -X POST "http://localhost:30000/v1/completions" \ -H "Content-Type: application/json" \ --data '{ "model": "SkyworkAIGC/SkyCode", "prompt": "Once upon a time,", "max_tokens": 512, "temperature": 0.5 }' - Docker Model Runner
How to use SkyworkAIGC/SkyCode with Docker Model Runner:
docker model run hf.co/SkyworkAIGC/SkyCode
SkyWork commited on
Commit ·
a852f27
1
Parent(s): 6fcd10a
Update tokenization_sky.py
Browse files- tokenization_sky.py +3 -3
tokenization_sky.py
CHANGED
|
@@ -325,7 +325,7 @@ class SkyTokenizer(PreTrainedTokenizer):
|
|
| 325 |
|
| 326 |
def _tokenize(self, text, **kwargs):
|
| 327 |
"""Tokenize a string."""
|
| 328 |
-
return self.trie.match(text, **kwargs)
|
| 329 |
|
| 330 |
def _decode(self,
|
| 331 |
token_ids: Union[int, List[int], "np.ndarray", "torch.Tensor", "tf.Tensor"],
|
|
@@ -393,7 +393,7 @@ class SkyTokenizer(PreTrainedTokenizer):
|
|
| 393 |
) -> BatchEncoding:
|
| 394 |
def get_input_ids(text):
|
| 395 |
if isinstance(text, str):
|
| 396 |
-
text_id = self.trie.match(text)
|
| 397 |
return text_id
|
| 398 |
elif isinstance(text, list) and len(text) > 0 and isinstance(text[0], str):
|
| 399 |
return [self.trie.match(t, unk_id=self.unk_token_id) for t in text]
|
|
@@ -458,7 +458,7 @@ class SkyTokenizer(PreTrainedTokenizer):
|
|
| 458 |
) -> BatchEncoding:
|
| 459 |
def get_input_ids(text):
|
| 460 |
if isinstance(text, str):
|
| 461 |
-
text_id = self.trie.match(text)
|
| 462 |
return text_id
|
| 463 |
elif isinstance(text, list) and len(text) > 0 and isinstance(text[0], str):
|
| 464 |
return [self.trie.match(t, unk_id=self.unk_token_id) for t in text]
|
|
|
|
| 325 |
|
| 326 |
def _tokenize(self, text, **kwargs):
|
| 327 |
"""Tokenize a string."""
|
| 328 |
+
return self.trie.match(text, unk_id=self.unk_token_id, **kwargs)
|
| 329 |
|
| 330 |
def _decode(self,
|
| 331 |
token_ids: Union[int, List[int], "np.ndarray", "torch.Tensor", "tf.Tensor"],
|
|
|
|
| 393 |
) -> BatchEncoding:
|
| 394 |
def get_input_ids(text):
|
| 395 |
if isinstance(text, str):
|
| 396 |
+
text_id = self.trie.match(text, unk_id=self.unk_token_id)
|
| 397 |
return text_id
|
| 398 |
elif isinstance(text, list) and len(text) > 0 and isinstance(text[0], str):
|
| 399 |
return [self.trie.match(t, unk_id=self.unk_token_id) for t in text]
|
|
|
|
| 458 |
) -> BatchEncoding:
|
| 459 |
def get_input_ids(text):
|
| 460 |
if isinstance(text, str):
|
| 461 |
+
text_id = self.trie.match(text, unk_id=self.unk_token_id)
|
| 462 |
return text_id
|
| 463 |
elif isinstance(text, list) and len(text) > 0 and isinstance(text[0], str):
|
| 464 |
return [self.trie.match(t, unk_id=self.unk_token_id) for t in text]
|