Upload folder using huggingface_hub

Browse files

Files changed (19) hide show

__pycache__/handler.cpython-38.pyc +0 -0
rnnlm_model/__pycache__/__init__.cpython-311.pyc +0 -0
rnnlm_model/__pycache__/__init__.cpython-312.pyc +0 -0
rnnlm_model/__pycache__/configuration_rnnlm.cpython-311.pyc +0 -0
rnnlm_model/__pycache__/configuration_rnnlm.cpython-312.pyc +0 -0
rnnlm_model/__pycache__/modeling_rnnlm.cpython-311.pyc +0 -0
rnnlm_model/__pycache__/modeling_rnnlm.cpython-312.pyc +0 -0
rnnlm_model/__pycache__/modeling_rnnlm.cpython-38.pyc +0 -0
rnnlm_model/__pycache__/pipeline_rnnlm.cpython-311.pyc +0 -0
rnnlm_model/__pycache__/pipeline_rnnlm.cpython-312.pyc +0 -0
rnnlm_model/__pycache__/pipeline_rnnlm.cpython-38.pyc +0 -0
rnnlm_model/__pycache__/tokenization_rnnlm.cpython-311.pyc +0 -0
rnnlm_model/__pycache__/tokenization_rnnlm.cpython-312.pyc +0 -0
rnnlm_model/__pycache__/tokenization_utils.cpython-311.pyc +0 -0
rnnlm_model/__pycache__/tokenization_utils.cpython-312.pyc +0 -0
rnnlm_model/__pycache__/tokenization_utils.cpython-38.pyc +0 -0
rnnlm_model/modeling_rnnlm.py +14 -3
rnnlm_model/pipeline_rnnlm.py +18 -0
rnnlm_model/tokenization_utils.py +9 -9

__pycache__/handler.cpython-38.pyc ADDED Viewed

Binary file (2.88 kB). View file

rnnlm_model/__pycache__/__init__.cpython-311.pyc ADDED Viewed

Binary file (576 Bytes). View file

rnnlm_model/__pycache__/__init__.cpython-312.pyc ADDED Viewed

Binary file (530 Bytes). View file

rnnlm_model/__pycache__/configuration_rnnlm.cpython-311.pyc ADDED Viewed

Binary file (2.11 kB). View file

rnnlm_model/__pycache__/configuration_rnnlm.cpython-312.pyc ADDED Viewed

Binary file (1.87 kB). View file

rnnlm_model/__pycache__/modeling_rnnlm.cpython-311.pyc ADDED Viewed

Binary file (17.4 kB). View file

rnnlm_model/__pycache__/modeling_rnnlm.cpython-312.pyc ADDED Viewed

Binary file (16.6 kB). View file

rnnlm_model/__pycache__/modeling_rnnlm.cpython-38.pyc CHANGED Viewed

Binary files a/rnnlm_model/__pycache__/modeling_rnnlm.cpython-38.pyc and b/rnnlm_model/__pycache__/modeling_rnnlm.cpython-38.pyc differ

rnnlm_model/__pycache__/pipeline_rnnlm.cpython-311.pyc ADDED Viewed

Binary file (6.17 kB). View file

rnnlm_model/__pycache__/pipeline_rnnlm.cpython-312.pyc ADDED Viewed

Binary file (5.38 kB). View file

rnnlm_model/__pycache__/pipeline_rnnlm.cpython-38.pyc CHANGED Viewed

Binary files a/rnnlm_model/__pycache__/pipeline_rnnlm.cpython-38.pyc and b/rnnlm_model/__pycache__/pipeline_rnnlm.cpython-38.pyc differ

rnnlm_model/__pycache__/tokenization_rnnlm.cpython-311.pyc ADDED Viewed

Binary file (17.4 kB). View file

rnnlm_model/__pycache__/tokenization_rnnlm.cpython-312.pyc ADDED Viewed

Binary file (15.3 kB). View file

rnnlm_model/__pycache__/tokenization_utils.cpython-311.pyc ADDED Viewed

Binary file (24.6 kB). View file

rnnlm_model/__pycache__/tokenization_utils.cpython-312.pyc ADDED Viewed

Binary file (18.1 kB). View file

rnnlm_model/__pycache__/tokenization_utils.cpython-38.pyc CHANGED Viewed

Binary files a/rnnlm_model/__pycache__/tokenization_utils.cpython-38.pyc and b/rnnlm_model/__pycache__/tokenization_utils.cpython-38.pyc differ

rnnlm_model/modeling_rnnlm.py CHANGED Viewed

@@ -6,14 +6,18 @@ import torch.nn as nn
 try:
     from transformers import PreTrainedModel
     from transformers.modeling_outputs import CausalLMOutputWithPast
-    from transformers.generation import LogitsProcessor, LogitsProcessorList
 except ImportError:
     from transformers.modeling_utils import PreTrainedModel
     from transformers.modeling_outputs import CausalLMOutputWithPast
     try:
-        from transformers.generation import LogitsProcessor, LogitsProcessorList
     except ImportError:
-        from transformers.generation_utils import LogitsProcessor, LogitsProcessorList
 from .configuration_rnnlm import RNNLMConfig
@@ -113,6 +117,8 @@ class RNNLMForCausalLM(PreTrainedModel):
     def __init__(self, config: RNNLMConfig, **kwargs):
         super().__init__(config)
         self.config = config
         self.vocab_size = config.vocab_size
         self.embedding_dim = config.embedding_dim
         self.hidden_size = config.hidden_size
@@ -299,4 +305,9 @@ class RNNLMForCausalLM(PreTrainedModel):
             logits_processor = LogitsProcessorList(logits_processor)
         logits_processor.insert(0, processor)
         kwargs["logits_processor"] = logits_processor
         return super().generate(inputs, **kwargs)

 try:
     from transformers import PreTrainedModel
     from transformers.modeling_outputs import CausalLMOutputWithPast
+    from transformers.generation import GenerationMixin, LogitsProcessor, LogitsProcessorList
 except ImportError:
     from transformers.modeling_utils import PreTrainedModel
     from transformers.modeling_outputs import CausalLMOutputWithPast
     try:
+        from transformers.generation import GenerationMixin, LogitsProcessor, LogitsProcessorList
     except ImportError:
+        try:
+            from transformers.generation_utils import GenerationMixin, LogitsProcessor, LogitsProcessorList
+        except ImportError:
+            from transformers.generation_utils import LogitsProcessor, LogitsProcessorList
+            GenerationMixin = None
 from .configuration_rnnlm import RNNLMConfig
     def __init__(self, config: RNNLMConfig, **kwargs):
         super().__init__(config)
         self.config = config
+        # RNNLM has no tied weights; transformers expects this attribute (dict) for .update()
+        self.all_tied_weights_keys = {}
         self.vocab_size = config.vocab_size
         self.embedding_dim = config.embedding_dim
         self.hidden_size = config.hidden_size
             logits_processor = LogitsProcessorList(logits_processor)
         logits_processor.insert(0, processor)
         kwargs["logits_processor"] = logits_processor
+        # RNNLM uses tuple cache (hidden states), not DynamicCache; avoid cache to prevent "not subscriptable" error
+        kwargs.setdefault("use_cache", False)
+        # Call GenerationMixin.generate explicitly (super() can fail in some loading contexts)
+        if GenerationMixin is not None:
+            return GenerationMixin.generate(self, inputs, **kwargs)
         return super().generate(inputs, **kwargs)

rnnlm_model/pipeline_rnnlm.py CHANGED Viewed

@@ -3,6 +3,7 @@
 from transformers.pipelines.text_generation import TextGenerationPipeline
 from transformers.pipelines.text_generation import ReturnType
 class RNNLMTextGenerationPipeline(TextGenerationPipeline):
@@ -14,6 +15,23 @@ class RNNLMTextGenerationPipeline(TextGenerationPipeline):
     When the tokenizer has generalize_ents=True, entities are extracted from the
     prompt and used to replace ENT_PERSON_0, ENT_GPE_0, etc. in the generated output.
     """
     def postprocess(
         self,

 from transformers.pipelines.text_generation import TextGenerationPipeline
 from transformers.pipelines.text_generation import ReturnType
+from transformers import GenerationConfig
 class RNNLMTextGenerationPipeline(TextGenerationPipeline):
     When the tokenizer has generalize_ents=True, entities are extracted from the
     prompt and used to replace ENT_PERSON_0, ENT_GPE_0, etc. in the generated output.
     """
+    assistant_model = None  # Class default for transformers compatibility (assisted decoding)
+    assistant_tokenizer = None
+    prefix = None  # For XLNet/TransfoXL; RNNLM doesn't use it
+    def __init__(self, *args, **kwargs):
+        super().__init__(*args, **kwargs)
+        # Newer transformers expect these; RNNLM doesn't use them
+        self.assistant_model = None
+        self.assistant_tokenizer = None
+        self.prefix = getattr(self, "prefix", None)
+        if not hasattr(self, "generation_config") or self.generation_config is None:
+            self.generation_config = GenerationConfig(
+                pad_token_id=getattr(self.tokenizer, "pad_token_id", 0),
+                max_new_tokens=256,
+                do_sample=True,
+                temperature=0.7,
+            )
     def postprocess(
         self,

rnnlm_model/tokenization_utils.py CHANGED Viewed

@@ -265,14 +265,14 @@ def detokenize_tok_seq(encoder, seq, ents=[], begin_sentence=True):
         # capitalize first-person "I" pronoun
         detok_sent = re.sub(r"(^| )i ", r"\1I ", detok_sent)
-        # rules for contractions
-        detok_sent = re.sub(" n\'\s*t ", "n\'t ", detok_sent)
-        detok_sent = re.sub(" \'\s*d ", "\'d ", detok_sent)
-        detok_sent = re.sub(" \'\s*s ", "\'s ", detok_sent)
-        detok_sent = re.sub(" \'\s*ve ", "\'ve ", detok_sent)
-        detok_sent = re.sub(" \'\s*ll ", "\'ll ", detok_sent)
-        detok_sent = re.sub(" \'\s*m ", "\'m ", detok_sent)
-        detok_sent = re.sub(" \'\s*re ", "\'re ", detok_sent)
         # rules for formatting punctuation
         detok_sent = re.sub(" \.", ".", detok_sent)
@@ -291,7 +291,7 @@ def detokenize_tok_seq(encoder, seq, ents=[], begin_sentence=True):
         detok_sent = re.sub("\`\`", "\"", detok_sent)
         # filter repetitive characters
-        detok_sent = re.sub("([\"\']\s*){2,}", "\" ", detok_sent)
         # map each opening punctuation mark to closing mark
         punc_pairs = {"\'": "\'", "\'": "\'",

         # capitalize first-person "I" pronoun
         detok_sent = re.sub(r"(^| )i ", r"\1I ", detok_sent)
+        # rules for contractions (pattern: raw string for \s; replacement: no backslash)
+        detok_sent = re.sub(r" n'\s*t ", "n't ", detok_sent)
+        detok_sent = re.sub(r" '\s*d ", "'d ", detok_sent)
+        detok_sent = re.sub(r" '\s*s ", "'s ", detok_sent)
+        detok_sent = re.sub(r" '\s*ve ", "'ve ", detok_sent)
+        detok_sent = re.sub(r" '\s*ll ", "'ll ", detok_sent)
+        detok_sent = re.sub(r" '\s*m ", "'m ", detok_sent)
+        detok_sent = re.sub(r" '\s*re ", "'re ", detok_sent)
         # rules for formatting punctuation
         detok_sent = re.sub(" \.", ".", detok_sent)
         detok_sent = re.sub("\`\`", "\"", detok_sent)
         # filter repetitive characters
+        detok_sent = re.sub(r'(["\']\s*){2,}', '" ', detok_sent)
         # map each opening punctuation mark to closing mark
         punc_pairs = {"\'": "\'", "\'": "\'",