Spaces:

sourize
/

DeepTalks

Sleeping

App Files Community

sourize committed on Apr 30, 2025

Commit

55faf97

1 Parent(s): 857744a

Commit

Browse files

Files changed (11) hide show

app.py +60 -50
models/phi2-deeptalk-lora/README.md +0 -202
models/phi2-deeptalk-lora/adapter_config.json +0 -36
models/phi2-deeptalk-lora/adapter_model.safetensors +0 -3
models/phi2-deeptalk-lora/added_tokens.json +0 -41
models/phi2-deeptalk-lora/merges.txt +0 -0
models/phi2-deeptalk-lora/special_tokens_map.json +0 -30
models/phi2-deeptalk-lora/tokenizer.json +0 -0
models/phi2-deeptalk-lora/tokenizer_config.json +0 -335
models/phi2-deeptalk-lora/training_args.bin +0 -3
models/phi2-deeptalk-lora/vocab.json +0 -0

app.py CHANGED Viewed

@@ -7,36 +7,39 @@ from transformers import (
     AutoModelForCausalLM,
     BitsAndBytesConfig,
 )
-from peft import LoraConfig, get_peft_model
-from safetensors.torch import load_file as safe_load
 # ── Configuration ──────────────────────────────────────────────────────────
-BASE_MODEL      = "microsoft/phi-2"
-ADAPTER_DIR     = os.path.join(os.path.dirname(__file__), "models", "phi2-deeptalk-lora")
-CONTEXT_TURNS   = 6
-MAX_NEW_TOKENS  = 32
-DEVICE_MAP      = "auto"
 SYSTEM = (
-    "You are a helpful assistant for DeepTalks with base Phi-2 fine-tuned "
-    "by Sourish for domain support.\n"
-    "Answer only using the conversation context below.\n"
     "If you don’t know, say “I don't know.”\n"
 )
-# ── Model loader (cached) ──────────────────────────────────────────────────
 @st.cache_resource(show_spinner=False)
-def load_generator():
-    # 1) Tokenizer (from official HF cache)
     tokenizer = AutoTokenizer.from_pretrained(
-        BASE_MODEL, trust_remote_code=True, padding_side="left"
     )
     if tokenizer.pad_token_id is None:
         tokenizer.add_special_tokens({"pad_token": "[PAD]"})
-    # 2) Base model (4-bit on GPU, else FP16/FP32)
     if torch.cuda.is_available():
-        bnb = BitsAndBytesConfig(
             load_in_4bit=True,
             bnb_4bit_quant_type="nf4",
             bnb_4bit_compute_dtype="float16",
@@ -45,8 +48,10 @@ def load_generator():
         base = AutoModelForCausalLM.from_pretrained(
             BASE_MODEL,
             trust_remote_code=True,
-            quantization_config=bnb,
-            device_map=DEVICE_MAP,
         )
     else:
         dtype = torch.float16 if torch.cuda.is_available() else torch.float32
@@ -54,76 +59,81 @@ def load_generator():
             BASE_MODEL,
             trust_remote_code=True,
             torch_dtype=dtype,
-            device_map=DEVICE_MAP,
         )
-    # 3) Resize embeddings & wrap LoRA
     base.resize_token_embeddings(len(tokenizer))
-    peft_config = LoraConfig.from_pretrained(ADAPTER_DIR, local_files_only=True)
-    model       = get_peft_model(base, peft_config)
-    # 4) Load adapter weights (.safetensors)
-    adapter_file = os.path.join(ADAPTER_DIR, "adapter_model.safetensors")
-    state_dict   = safe_load(adapter_file)
-    model.load_state_dict(state_dict, strict=False)
     model.eval()
-    # 5) Build a **greedy** pipeline for max speed
     gen = pipeline(
         "text-generation",
         model=model,
         tokenizer=tokenizer,
-        device_map=DEVICE_MAP,
         max_new_tokens=MAX_NEW_TOKENS,
-        do_sample=False,     # greedy
         use_cache=True,
         return_full_text=False,
     )
-    return tokenizer, gen
-tokenizer, generator = load_generator()
 # ── Streamlit UI ──────────────────────────────────────────────────────────
 st.set_page_config(layout="centered")
 st.title("🧠 Memory-Aware Phi-2 Chat")
-# Initialize chat history
 if "history" not in st.session_state:
-    st.session_state.history = []  # list of (role, text)
-# Render past messages
 for role, text in st.session_state.history:
-    st.chat_message("user" if role=="You" else "assistant").write(text)
-# User input at bottom
 user_input = st.chat_input("Your message…")
 if user_input:
-    # Show/store user turn
     st.chat_message("user").write(user_input)
     st.session_state.history.append(("You", user_input))
-    # Build context from last N turns
     recent = st.session_state.history[-CONTEXT_TURNS*2:]
-    ctx = "\n".join(
-        f"{'User' if r=='You' else 'Assistant'}: {t}"
-        for r,t in recent
-    )
     prompt = f"""{SYSTEM}
 Context:
-{ctx}
 User: {user_input}
 Assistant:"""
-    # Generate reply (spinner)
     with st.spinner("Thinking…"):
         try:
-            out = generator(prompt)[0]["generated_text"].strip()
         except Exception as e:
-            out = "I’m sorry, something went wrong."
-            st.error(f"Error: {e}")
-    # Show/store assistant
-    st.chat_message("assistant").write(out)
-    st.session_state.history.append(("Bot", out))

     AutoModelForCausalLM,
     BitsAndBytesConfig,
 )
+from peft import PeftModel
+import logging
 # ── Configuration ──────────────────────────────────────────────────────────
+BASE_MODEL     = "microsoft/phi-2"
+ADAPTER_REPO   = "sourize/phi2-memory-lora"
+CONTEXT_TURNS  = 6
+MAX_NEW_TOKENS = 32
+OFFLOAD_DIR    = "offload"
 SYSTEM = (
+    "You are a helpful assistant for DeepTalks with base Phi-2 "
+    "fine-tuned by Sourish for domain support.\n"
+    "Answer **only** using the conversation context below.\n"
+    "Do NOT output any lines beginning with 'User:' or 'Assistant:'.\n"
     "If you don’t know, say “I don't know.”\n"
 )
 @st.cache_resource(show_spinner=False)
+def load_pipeline():
+    # 1) Tokenizer
     tokenizer = AutoTokenizer.from_pretrained(
+        BASE_MODEL,
+        trust_remote_code=True,
+        padding_side="left",
     )
     if tokenizer.pad_token_id is None:
         tokenizer.add_special_tokens({"pad_token": "[PAD]"})
+    # 2) Base model (4-bit quant on GPU, else FP16/FP32)
     if torch.cuda.is_available():
+        bnb_config = BitsAndBytesConfig(
             load_in_4bit=True,
             bnb_4bit_quant_type="nf4",
             bnb_4bit_compute_dtype="float16",
         base = AutoModelForCausalLM.from_pretrained(
             BASE_MODEL,
             trust_remote_code=True,
+            quantization_config=bnb_config,
+            device_map="auto",
+            offload_folder=OFFLOAD_DIR,
+            offload_state_dict=True,
         )
     else:
         dtype = torch.float16 if torch.cuda.is_available() else torch.float32
             BASE_MODEL,
             trust_remote_code=True,
             torch_dtype=dtype,
+            device_map="auto",
+            offload_folder=OFFLOAD_DIR,
+            offload_state_dict=True,
         )
+    # 3) Resize embeddings
     base.resize_token_embeddings(len(tokenizer))
+    # 4) Overlay LoRA adapter from Hugging Face Hub
+    model = PeftModel.from_pretrained(
+        base,
+        ADAPTER_REPO,
+        trust_remote_code=True,
+        device_map="auto",
+        torch_dtype="auto",
+        offload_folder=OFFLOAD_DIR,
+        offload_state_dict=True,
+    )
     model.eval()
+    # 5) Build generation pipeline (greedy for speed)
     gen = pipeline(
         "text-generation",
         model=model,
         tokenizer=tokenizer,
+        device_map="auto",
         max_new_tokens=MAX_NEW_TOKENS,
+        do_sample=False,      # greedy decoding
         use_cache=True,
         return_full_text=False,
     )
+    logging.info(f"Loaded pipeline with model {BASE_MODEL} + adapter {ADAPTER_REPO}")
+    return gen
+generator = load_pipeline()
 # ── Streamlit UI ──────────────────────────────────────────────────────────
 st.set_page_config(layout="centered")
 st.title("🧠 Memory-Aware Phi-2 Chat")
+# initialize chat history
 if "history" not in st.session_state:
+    st.session_state.history = []  # List of (role, text)
+# render chat history
 for role, text in st.session_state.history:
+    st.chat_message("user" if role == "You" else "assistant").write(text)
+# user input
 user_input = st.chat_input("Your message…")
 if user_input:
+    # show & store user turn
     st.chat_message("user").write(user_input)
     st.session_state.history.append(("You", user_input))
+    # build context from last CONTEXT_TURNS
     recent = st.session_state.history[-CONTEXT_TURNS*2:]
+    context = "\n".join(t for _, t in recent)
     prompt = f"""{SYSTEM}
 Context:
+{context}
 User: {user_input}
 Assistant:"""
+    # generate reply
     with st.spinner("Thinking…"):
         try:
+            output = generator(prompt)[0]["generated_text"].strip()
         except Exception as e:
+            output = "I’m sorry, something went wrong."
+            st.error(f"Generation error: {e}")
+    # show & store assistant turn
+    st.chat_message("assistant").write(output)
+    st.session_state.history.append(("Bot", output))

models/phi2-deeptalk-lora/README.md DELETED Viewed

@@ -1,202 +0,0 @@
----
-base_model: microsoft/phi-2
-library_name: peft
----
-# Model Card for Model ID
-<!-- Provide a quick summary of what the model is/does. -->
-## Model Details
-### Model Description
-<!-- Provide a longer summary of what this model is. -->
-- **Developed by:** [More Information Needed]
-- **Funded by [optional]:** [More Information Needed]
-- **Shared by [optional]:** [More Information Needed]
-- **Model type:** [More Information Needed]
-- **Language(s) (NLP):** [More Information Needed]
-- **License:** [More Information Needed]
-- **Finetuned from model [optional]:** [More Information Needed]
-### Model Sources [optional]
-<!-- Provide the basic links for the model. -->
-- **Repository:** [More Information Needed]
-- **Paper [optional]:** [More Information Needed]
-- **Demo [optional]:** [More Information Needed]
-## Uses
-<!-- Address questions around how the model is intended to be used, including the foreseeable users of the model and those affected by the model. -->
-### Direct Use
-<!-- This section is for the model use without fine-tuning or plugging into a larger ecosystem/app. -->
-[More Information Needed]
-### Downstream Use [optional]
-<!-- This section is for the model use when fine-tuned for a task, or when plugged into a larger ecosystem/app -->
-[More Information Needed]
-### Out-of-Scope Use
-<!-- This section addresses misuse, malicious use, and uses that the model will not work well for. -->
-[More Information Needed]
-## Bias, Risks, and Limitations
-<!-- This section is meant to convey both technical and sociotechnical limitations. -->
-[More Information Needed]
-### Recommendations
-<!-- This section is meant to convey recommendations with respect to the bias, risk, and technical limitations. -->
-Users (both direct and downstream) should be made aware of the risks, biases and limitations of the model. More information needed for further recommendations.
-## How to Get Started with the Model
-Use the code below to get started with the model.
-[More Information Needed]
-## Training Details
-### Training Data
-<!-- This should link to a Dataset Card, perhaps with a short stub of information on what the training data is all about as well as documentation related to data pre-processing or additional filtering. -->
-[More Information Needed]
-### Training Procedure
-<!-- This relates heavily to the Technical Specifications. Content here should link to that section when it is relevant to the training procedure. -->
-#### Preprocessing [optional]
-[More Information Needed]
-#### Training Hyperparameters
-- **Training regime:** [More Information Needed] <!--fp32, fp16 mixed precision, bf16 mixed precision, bf16 non-mixed precision, fp16 non-mixed precision, fp8 mixed precision -->
-#### Speeds, Sizes, Times [optional]
-<!-- This section provides information about throughput, start/end time, checkpoint size if relevant, etc. -->
-[More Information Needed]
-## Evaluation
-<!-- This section describes the evaluation protocols and provides the results. -->
-### Testing Data, Factors & Metrics
-#### Testing Data
-<!-- This should link to a Dataset Card if possible. -->
-[More Information Needed]
-#### Factors
-<!-- These are the things the evaluation is disaggregating by, e.g., subpopulations or domains. -->
-[More Information Needed]
-#### Metrics
-<!-- These are the evaluation metrics being used, ideally with a description of why. -->
-[More Information Needed]
-### Results
-[More Information Needed]
-#### Summary
-## Model Examination [optional]
-<!-- Relevant interpretability work for the model goes here -->
-[More Information Needed]
-## Environmental Impact
-<!-- Total emissions (in grams of CO2eq) and additional considerations, such as electricity usage, go here. Edit the suggested text below accordingly -->
-Carbon emissions can be estimated using the [Machine Learning Impact calculator](https://mlco2.github.io/impact#compute) presented in [Lacoste et al. (2019)](https://arxiv.org/abs/1910.09700).
-- **Hardware Type:** [More Information Needed]
-- **Hours used:** [More Information Needed]
-- **Cloud Provider:** [More Information Needed]
-- **Compute Region:** [More Information Needed]
-- **Carbon Emitted:** [More Information Needed]
-## Technical Specifications [optional]
-### Model Architecture and Objective
-[More Information Needed]
-### Compute Infrastructure
-[More Information Needed]
-#### Hardware
-[More Information Needed]
-#### Software
-[More Information Needed]
-## Citation [optional]
-<!-- If there is a paper or blog post introducing the model, the APA and Bibtex information for that should go in this section. -->
-**BibTeX:**
-[More Information Needed]
-**APA:**
-[More Information Needed]
-## Glossary [optional]
-<!-- If relevant, include terms and calculations in this section that can help readers understand the model or model card. -->
-[More Information Needed]
-## More Information [optional]
-[More Information Needed]
-## Model Card Authors [optional]
-[More Information Needed]
-## Model Card Contact
-[More Information Needed]
-### Framework versions
-- PEFT 0.14.0

models/phi2-deeptalk-lora/adapter_config.json DELETED Viewed

@@ -1,36 +0,0 @@
-{
-  "alpha_pattern": {},
-  "auto_mapping": null,
-  "base_model_name_or_path": "microsoft/phi-2",
-  "bias": "none",
-  "eva_config": null,
-  "exclude_modules": null,
-  "fan_in_fan_out": false,
-  "inference_mode": true,
-  "init_lora_weights": true,
-  "layer_replication": null,
-  "layers_pattern": null,
-  "layers_to_transform": null,
-  "loftq_config": {},
-  "lora_alpha": 32,
-  "lora_bias": false,
-  "lora_dropout": 0.05,
-  "megatron_config": null,
-  "megatron_core": "megatron.core",
-  "modules_to_save": null,
-  "peft_type": "LORA",
-  "r": 4,
-  "rank_pattern": {},
-  "revision": null,
-  "target_modules": [
-    "dense",
-    "k_proj",
-    "fc2",
-    "fc1",
-    "v_proj",
-    "q_proj"
-  ],
-  "task_type": "CAUSAL_LM",
-  "use_dora": false,
-  "use_rslora": false
-}

models/phi2-deeptalk-lora/adapter_model.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:7aa408089fb13fb4630b32e35cf2ccaec31e99aa519c3c0ec24ce465179ac34b
-size 538774784

models/phi2-deeptalk-lora/added_tokens.json DELETED Viewed

@@ -1,41 +0,0 @@
-{
-  "\t\t": 50294,
-  "\t\t\t": 50293,
-  "\t\t\t\t": 50292,
-  "\t\t\t\t\t": 50291,
-  "\t\t\t\t\t\t": 50290,
-  "\t\t\t\t\t\t\t": 50289,
-  "\t\t\t\t\t\t\t\t": 50288,
-  "\t\t\t\t\t\t\t\t\t": 50287,
-  "  ": 50286,
-  "   ": 50285,
-  "    ": 50284,
-  "     ": 50283,
-  "      ": 50282,
-  "       ": 50281,
-  "        ": 50280,
-  "         ": 50279,
-  "          ": 50278,
-  "           ": 50277,
-  "            ": 50276,
-  "             ": 50275,
-  "              ": 50274,
-  "               ": 50273,
-  "                ": 50272,
-  "                 ": 50271,
-  "                  ": 50270,
-  "                   ": 50269,
-  "                    ": 50268,
-  "                     ": 50267,
-  "                      ": 50266,
-  "                       ": 50265,
-  "                        ": 50264,
-  "                         ": 50263,
-  "                          ": 50262,
-  "                           ": 50261,
-  "                            ": 50260,
-  "                             ": 50259,
-  "                              ": 50258,
-  "                               ": 50257,
-  "[PAD]": 50295
-}

models/phi2-deeptalk-lora/merges.txt DELETED Viewed

The diff for this file is too large to render. See raw diff

models/phi2-deeptalk-lora/special_tokens_map.json DELETED Viewed

@@ -1,30 +0,0 @@
-{
-  "bos_token": {
-    "content": "<|endoftext|>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "eos_token": {
-    "content": "<|endoftext|>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "pad_token": {
-    "content": "[PAD]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "unk_token": {
-    "content": "<|endoftext|>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  }
-}

models/phi2-deeptalk-lora/tokenizer.json DELETED Viewed

The diff for this file is too large to render. See raw diff

models/phi2-deeptalk-lora/tokenizer_config.json DELETED Viewed

@@ -1,335 +0,0 @@
-{
-  "add_prefix_space": false,
-  "added_tokens_decoder": {
-    "50256": {
-      "content": "<|endoftext|>",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    },
-    "50257": {
-      "content": "                               ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50258": {
-      "content": "                              ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50259": {
-      "content": "                             ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50260": {
-      "content": "                            ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50261": {
-      "content": "                           ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50262": {
-      "content": "                          ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50263": {
-      "content": "                         ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50264": {
-      "content": "                        ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50265": {
-      "content": "                       ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50266": {
-      "content": "                      ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50267": {
-      "content": "                     ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50268": {
-      "content": "                    ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50269": {
-      "content": "                   ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50270": {
-      "content": "                  ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50271": {
-      "content": "                 ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50272": {
-      "content": "                ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50273": {
-      "content": "               ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50274": {
-      "content": "              ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50275": {
-      "content": "             ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50276": {
-      "content": "            ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50277": {
-      "content": "           ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50278": {
-      "content": "          ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50279": {
-      "content": "         ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50280": {
-      "content": "        ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50281": {
-      "content": "       ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50282": {
-      "content": "      ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50283": {
-      "content": "     ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50284": {
-      "content": "    ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50285": {
-      "content": "   ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50286": {
-      "content": "  ",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50287": {
-      "content": "\t\t\t\t\t\t\t\t\t",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50288": {
-      "content": "\t\t\t\t\t\t\t\t",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50289": {
-      "content": "\t\t\t\t\t\t\t",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50290": {
-      "content": "\t\t\t\t\t\t",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50291": {
-      "content": "\t\t\t\t\t",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50292": {
-      "content": "\t\t\t\t",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50293": {
-      "content": "\t\t\t",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50294": {
-      "content": "\t\t",
-      "lstrip": false,
-      "normalized": true,
-      "rstrip": false,
-      "single_word": false,
-      "special": false
-    },
-    "50295": {
-      "content": "[PAD]",
-      "lstrip": false,
-      "normalized": false,
-      "rstrip": false,
-      "single_word": false,
-      "special": true
-    }
-  },
-  "bos_token": "<|endoftext|>",
-  "clean_up_tokenization_spaces": true,
-  "eos_token": "<|endoftext|>",
-  "extra_special_tokens": {},
-  "model_max_length": 2048,
-  "pad_token": "[PAD]",
-  "padding_side": "left",
-  "return_token_type_ids": false,
-  "tokenizer_class": "CodeGenTokenizer",
-  "unk_token": "<|endoftext|>"
-}

models/phi2-deeptalk-lora/training_args.bin DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:3fa1d3e24dbecb64fba08308dbfbc755a81ffcfafe47980e4bbfb871f79b0ebd
-size 5304

models/phi2-deeptalk-lora/vocab.json DELETED Viewed

The diff for this file is too large to render. See raw diff