idah4
/

byteetm-korean-tiny

+from transformers import PreTrainedModel, PretrainedConfig
+import torch.nn as nn, torch.nn.functional as F, torch
+class ByteETMConfig(PretrainedConfig):
+    model_type = "byteetm"
+    def __init__(self, vocab_size=258, n_embd=512, n_head=8, n_layer=6, block_size=256, **kwargs):
+        super().__init__(**kwargs)
+        self.vocab_size = vocab_size
+        self.n_embd = n_embd
+        self.n_head = n_head
+        self.n_layer = n_layer
+        self.block_size = block_size
+class HFByteETM(PreTrainedModel):
+    config_class = ByteETMConfig
+    def __init__(self, config):
+        super().__init__(config)
+        from .model import ByteETM     # 네가 정의한 실제 모델
+        self.model = ByteETM(
+            vocab_size=config.vocab_size,
+            n_embd=config.n_embd,
+            n_head=config.n_head,
+            n_layer=config.n_layer,
+            block_size=config.block_size
+        )
+    def forward(self, input_ids, **kwargs):
+        logits, _ = self.model(input_ids)
+        return {"logits": logits}