update readme
README.md CHANGED
@@ -152,6 +152,7 @@ MOSS-TTSD uses a **continuation** workflow: provide reference audio for each spe
 
 ```python
 from pathlib import Path
+import importlib.util
 import torch
 import torchaudio
 from transformers import AutoModel, AutoProcessor
@@ -166,6 +167,28 @@ pretrained_model_name_or_path = "OpenMOSS-Team/MOSS-TTSD-v1.0"
 device = "cuda" if torch.cuda.is_available() else "cpu"
 dtype = torch.bfloat16 if device == "cuda" else torch.float32
 
+def resolve_attn_implementation() -> str:
+    # Prefer FlashAttention 2 when package + device conditions are met.
+    if (
+        device == "cuda"
+        and importlib.util.find_spec("flash_attn") is not None
+        and dtype in {torch.float16, torch.bfloat16}
+    ):
+        major, _ = torch.cuda.get_device_capability()
+        if major >= 8:
+            return "flash_attention_2"
+
+    # CUDA fallback: use PyTorch SDPA kernels.
+    if device == "cuda":
+        return "sdpa"
+
+    # CPU fallback.
+    return "eager"
+
+
+attn_implementation = resolve_attn_implementation()
+print(f"[INFO] Using attn_implementation={attn_implementation}")
+
 processor = AutoProcessor.from_pretrained(
     pretrained_model_name_or_path,
     trust_remote_code=True,
@@ -176,7 +199,7 @@ model = AutoModel.from_pretrained(
     pretrained_model_name_or_path,
     trust_remote_code=True,
     # If FlashAttention 2 is installed, you can set attn_implementation="flash_attention_2"
-    attn_implementation=
+    attn_implementation=attn_implementation,
     torch_dtype=dtype,
 ).to(device)
 model.eval()
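A note on the added fallback logic: the `major >= 8` guard corresponds to FlashAttention 2's requirement for Ampere-or-newer GPUs (compute capability 8.0+), and the dtype check matches its fp16/bf16-only support. To confirm which backend transformers actually selected after loading, one option is the sketch below; it continues from the snippet above, and `model.config._attn_implementation` is an internal attribute of recent transformers releases, so treat it as a debugging aid rather than a stable API.

```python
# Debugging sketch (continues from the loading snippet above).
# Assumes a recent transformers release that records the resolved
# attention backend on the model config; `_attn_implementation`
# is internal and may change between versions.
resolved = getattr(model.config, "_attn_implementation", None)
print(f"[INFO] transformers resolved attention backend: {resolved}")
# Expected: "flash_attention_2" on Ampere+ GPUs with flash-attn installed,
# "sdpa" on other CUDA devices, and "eager" on CPU.
```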