Staticaliza
/

ReyaChat

Text Generation

compressed-tensors

Model card Files Files and versions

Staticaliza committed on Jun 23, 2025

Commit

41df97e

·

verified ·

1 Parent(s): b322146

Update README.md

Files changed (1) hide show

README.md +8 -0

README.md CHANGED Viewed

@@ -25,6 +25,14 @@ from vllm import LLM, SamplingParams
 repo = snapshot_download(repo_id="Staticaliza/Reya-Human", allow_patterns=["*.json", "*.bin", "*.safetensors"])
 llm = LLM(model=repo, dtype="auto", tensor_parallel_size=torch.cuda.device_count(), enforce_eager=True, trust_remote_code=True)
 params = SamplingParams(
     max_tokens=256,
     temperature=1,

 repo = snapshot_download(repo_id="Staticaliza/Reya-Human", allow_patterns=["*.json", "*.bin", "*.safetensors"])
 llm = LLM(model=repo, dtype="auto", tensor_parallel_size=torch.cuda.device_count(), enforce_eager=True, trust_remote_code=True)
+# The ChatML prompt format is recommended
+input = """<|im_start|>system
+You are Reya.<|im_end|>
+<|im_start|>user
+Hi.<|im_end|>
+<|im_start|>assistant
+"""
 params = SamplingParams(
     max_tokens=256,
     temperature=1,