{
 "nbformat": 4,
 "nbformat_minor": 0,
 "metadata": {
  "colab": {
   "provenance": [],
   "gpuType": "T4"
  },
  "kernelspec": {
   "name": "python3",
   "display_name": "Python 3"
  },
  "language_info": {
   "name": "python"
  },
  "accelerator": "GPU"
 },
 "cells": [
  {
   "cell_type": "markdown",
   "source": [
    "First of all we need to install requied **libraries**"
   ],
   "metadata": {
    "id": "k3d4WSh2zKRR"
   }
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "tIdoqVV1izoz",
    "outputId": "392af71f-8313-4be0-c1da-6334550bc69d"
   },
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "\u001b[?25l   \u001b[90m\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u001b[0m \u001b[32m0.0/84.1 kB\u001b[0m \u001b[31m?\u001b[0m eta \u001b[36m-:--:--\u001b[0m\r\u001b[2K   \u001b[90m\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u2501\u001b[0m \u001b[32m84.1/84.1 kB\u001b[0m \u001b[31m9.1 MB/s\u001b[0m eta \u001b[36m0:00:00\u001b[0m\n",
      "\u001b[?25h"
     ]
    }
   ],
   "source": [
    "!pip install transformers datasets peft evaluate accelerate -q"
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    "Verifying Installations"
   ],
   "metadata": {
    "id": "Ym_FNQY4zU3y"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "import transformers\n",
    "import datasets\n",
    "import peft\n",
    "import evaluate\n",
    "print(f\"Tramsformers: {transformers.__version__}\")\n",
    "print(f\"Datasets: {datasets.__version__}\")\n",
    "print(f\"PEFT: {peft.__version__}\")\n",
    "print(f\"Evaluate: {evaluate.__version__}\")"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "wOie5cSZxVIZ",
    "outputId": "e208377e-dcac-4a59-cc15-6f99bc018284"
   },
   "execution_count": 22,
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Tramsformers: 5.0.0\n",
      "Datasets: 4.0.0\n",
      "PEFT: 0.18.1\n",
      "Evaluate: 0.4.6\n"
     ]
    }
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    "**Load the datasets**"
   ],
   "metadata": {
    "id": "77A5H5jUzinc"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "from datasets import load_dataset"
   ],
   "metadata": {
    "id": "101qqBCBz-JB"
   },
   "execution_count": 18,
   "outputs": []
  },
  {
   "cell_type": "markdown",
   "source": [
    "loading banking77 dataset"
   ],
   "metadata": {
    "id": "bEcOwfZV0IXa"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "dataset =load_dataset(\"legacy-datasets/banking77\")"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 177,
     "referenced_widgets": [
      "5655c5cca3d547b6a0ac08d1b1fbf008",
      "f9ec87bec967441f92f74b6518819709",
      "84a24ca325464e1db0cdb56f096c10fc",
      "e326b50a6a6f41f79d9af1e544645348",
      "cea5de85e6994e4ba40219434102842d",
      "c2a9c610fe1b4e93a7aacafeb22069ba",
      "aaa2991f6f854d188eb62177c0ccf457",
      "d069596b4ad54bb9a785403e0491fbef",
      "075bc577ced6404bb1e6a63b47c6139e",
      "5549923675df4864a223429518765dd2",
      "d0949c0967184dc097899dc1dffc0bd5",
      "e062cedda9ff4128b90dc0b76ce7d71c",
      "9f20dfd7ca6743338810ee564f1bbf95",
      "3589858387154504a9f7663935156d5c",
      "6af6400d7394437ea2aaa7816aab963f",
      "15b8413c1cb1464d9c5fbe0899d855e6",
      "7d04113fcd084ff09ea5fa7c5718680c",
      "ac29f3c9178041ed967f11aaa98195e8",
      "71b87b8a3c27421b9b3b0fa7f86b44c5",
      "8572d5854f2e4cc49ccf7ad17ee7ddd5",
      "5d2a532c7f52411a9d1e19fe58b44970",
      "fc1caa125cb04ef1a26c6018d2702e0d",
      "9ced219b80c74d5392c00c786dc3663a",
      "25f95444cec04b4fba706853567f0a31",
      "0cb3c9f5192548bcb970b06d71e1fe4b",
      "ebb6abfa10e4494480fcef655d7bc280",
      "ca9fd314395c4949b090ade258664516",
      "040f6956c7cb416dbca66863045d40e7",
      "3108dd45cc04481989000aec773bdc8b",
      "7803a811de55428abb91932f0a3c325e",
      "f34a912cde854e35a345ce5a807f27ea",
      "c339895ae7554611ae9679a6e80eaccb",
      "db0946daeef94404a0ba4ba58132ccbb",
      "5daf5aacab4c4028a127c4128e4a9c97",
      "7abc88f1c19b47449b924e183c42e21a",
      "d25694f9d9bc4bffb3f8a53ec5a58749",
      "ad5bd6f328ec41818e62602dbc53dc77",
      "f796fe7a076d409284f65fda06a96633",
      "ba6dfbc2bdf249c8b08b45c30495e684",
      "d96a1cae1c2846ca8243e4b9cf80f9a2",
      "32853e628e794361bee346a975a35534",
      "2ec24fdc2a5d47e7bd9224349535fd74",
      "bd57051fd3f544d7911b3c43a4b7a63b",
      "aa2e7b6a1a794c239e064988383918f6",
      "ce41312305a54e0e97b9d113a8245c34",
      "82293b8d416847dd96f71c0ed5e805fd",
      "57b3d091a24047a8ab97d5d6535a79ef",
      "3ba69b950f0848c89aa090f1a69fba57",
      "93db226d05cd4e9582cc685ec47dfeb2",
      "261c90036bd746ffb020e5f55e27a104",
      "0f3994568d514d30ba2e727c5a52c9bd",
      "2628185d0ede4f039eb7e38368761d73",
      "02771cfe0334486293ed5570c86f9f46",
      "fc512a98af3d426ba5be0278c3184398",
      "f4faf71ce3e6438b8a788cff559839b5"
     ]
    },
    "id": "HbYjKkL40NDQ",
    "outputId": "eaf2f031-5f62-4187-d930-5c3f3ce112fa"
   },
   "execution_count": 19,
   "outputs": [
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "README.md: 0.00B [00:00, ?B/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "5655c5cca3d547b6a0ac08d1b1fbf008"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "data/train-00000-of-00001.parquet:   0%|          | 0.00/298k [00:00<?, ?B/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "e062cedda9ff4128b90dc0b76ce7d71c"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "data/test-00000-of-00001.parquet:   0%|          | 0.00/93.9k [00:00<?, ?B/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "9ced219b80c74d5392c00c786dc3663a"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "Generating train split:   0%|          | 0/10003 [00:00<?, ? examples/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "5daf5aacab4c4028a127c4128e4a9c97"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "Generating test split:   0%|          | 0/3080 [00:00<?, ? examples/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "ce41312305a54e0e97b9d113a8245c34"
      }
     },
     "metadata": {}
    }
   ]
  },
  {
   "cell_type": "code",
   "source": [
    "print(dataset)\n",
    "print(\"\\nfirst training example:\")\n",
    "print(dataset[\"train\"][0])\n",
    "print(\"\\nNumber of classes:\")\n",
    "print(dataset[\"train\"].features[\"label\"].num_classes)\n",
    "print(\"\\nClass name sample:\")\n",
    "print(dataset[\"train\"].features[\"label\"].names[:10])"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "4NAVv8e12M-i",
    "outputId": "c4971df2-57d9-432f-aec8-facc8d81323f"
   },
   "execution_count": 23,
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "DatasetDict({\n",
      "    train: Dataset({\n",
      "        features: ['text', 'label'],\n",
      "        num_rows: 10003\n",
      "    })\n",
      "    test: Dataset({\n",
      "        features: ['text', 'label'],\n",
      "        num_rows: 3080\n",
      "    })\n",
      "})\n",
      "\n",
      "first training example:\n",
      "{'text': 'I am still waiting on my card?', 'label': 11}\n",
      "\n",
      "Number of classes:\n",
      "77\n",
      "\n",
      "Class name sample:\n",
      "['activate_my_card', 'age_limit', 'apple_pay_or_google_pay', 'atm_support', 'automatic_top_up', 'balance_not_updated_after_bank_transfer', 'balance_not_updated_after_cheque_or_cash_deposit', 'beneficiary_not_allowed', 'cancel_transfer', 'card_about_to_expire']\n"
     ]
    }
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    "Exploration of our data"
   ],
   "metadata": {
    "id": "8ljNKnLg8gpo"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "import pandas as pd\n",
    "from collections import Counter\n",
    "\n",
    "# Convert to pandas for easy exploration\n",
    "train_df = pd.DataFrame(dataset[\"train\"])\n",
    "\n",
    "# Check class distribution\n",
    "label_counts = Counter(train_df[\"label\"])\n",
    "print(f\"Most common class count: {max(label_counts.values())}\")\n",
    "print(f\"Least common class count: {min(label_counts.values())}\")\n",
    "print(f\"Average examples per class: {len(train_df) / 77:.1f}\")\n",
    "\n",
    "# Check text lengths\n",
    "train_df[\"text_length\"] = train_df[\"text\"].apply(len)\n",
    "print(f\"\\nAverage text length: {train_df['text_length'].mean():.1f} chars\")\n",
    "print(f\"Max text length: {train_df['text_length'].max()} chars\")\n",
    "print(f\"Min text length: {train_df['text_length'].min()} chars\")\n",
    "\n",
    "# Sample a few examples\n",
    "print(\"\\nSample examples:\")\n",
    "print(train_df.sample(3)[[\"text\", \"label\"]].to_string())"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "VMuS1YMs8gD0",
    "outputId": "e882392c-c480-49a0-cf23-22bf5d4f7719"
   },
   "execution_count": 24,
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Most common class count: 187\n",
      "Least common class count: 35\n",
      "Average examples per class: 129.9\n",
      "\n",
      "Average text length: 59.5 chars\n",
      "Max text length: 433 chars\n",
      "Min text length: 13 chars\n",
      "\n",
      "Sample examples:\n",
      "                                          text  label\n",
      "6323     What happens when I am charged twice?     63\n",
      "7588     I need to deposit money to my account     65\n",
      "8413  I need to get a disposable virtual card?     37\n"
     ]
    }
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    "Load Tokenizer"
   ],
   "metadata": {
    "id": "VY8TnPx59uHs"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "from transformers import AutoTokenizer\n",
    "\n",
    "# Load DistilBERT tokenizer\n",
    "tokenizer = AutoTokenizer.from_pretrained(\"distilbert-base-uncased\")\n",
    "\n",
    "# Test it on a sample\n",
    "sample_text = \"I am still waiting on my card\"\n",
    "tokens = tokenizer(sample_text, return_tensors=\"pt\")\n",
    "\n",
    "print(f\"Input IDs: {tokens['input_ids']}\")\n",
    "print(f\"Attention mask: {tokens['attention_mask']}\")\n",
    "print(f\"Number of tokens: {tokens['input_ids'].shape[1]}\")\n",
    "\n",
    "# Decode back to see what tokenization looks like\n",
    "decoded = tokenizer.convert_ids_to_tokens(tokens['input_ids'][0])\n",
    "print(f\"\\nTokens: {decoded}\")"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 200,
     "referenced_widgets": [
      "5d3515f5b99249118f03a3bba6337702",
      "caef023bb6724c7188dd3a04e7545e97",
      "b72c865e438f4cd5ab0354f0d295ed9a",
      "1e7f4e243238443cb7666f318f9d8668",
      "bff495be5cb74b8983841a5ecaf9873a",
      "090f9a5711ba4486b93b5fc1b71db5be",
      "358bdf0fc5584cc8932732e0a49b6ff7",
      "f4f74da3e2ca4f04840ff7bde9920861",
      "e545b1ddd9d842af95786ec85947cd9c",
      "928b3ea3a03340898aa5efe3c09ad50f",
      "3b053fc05dcd4dd1a77b4f518f19544c",
      "ef5b2ef23bd746e18dfc1c65d6610e78",
      "439eb1aa42f54840ac5859c9fdb1db3e",
      "af9d1abcdb6e43b0abb2229e2950ec8d",
      "1d27b8140f63419cb9eeec0d957928e0",
      "a95ab24b98364df0a3d3b014969b9282",
      "5a9c1b0354d34a6daee039680d0e6cbc",
      "c0bfd92cb2514eb8a725b9daf9a48706",
      "10815927eb7f4d969f894e231790de84",
      "1b71eb5b79564259a1d37ddfe914a96b",
      "de0e1a6ff6164057a4afe8d05810af27",
      "4611c210cb784302bab7a2a17f70ade5",
      "8c913887ace8439fad51f9c48a24b484",
      "c0bc4504f436443f81591c9cad717ae2",
      "299320c22d964963a17fa263f01ffeb1",
      "7b3c5bbf806541efa472b89a4ba8c5fb",
      "a5bc918affcd4363abaf5f6ae01fbe3e",
      "00ba7fabe034457295f054f5f305baec",
      "c020b2d2c22d442ba8014e7a2397c0e0",
      "ee1e7fac952c474fb8c8319c8b549a1d",
      "fa91ffd63341452cab732697435ab76e",
      "faa5c6c2c4e744d09c13bebbece0b7c7",
      "13924391b6134272bc7f36e17fcc1465"
     ]
    },
    "id": "fSySHvJV9xC6",
    "outputId": "dfb9be00-9e08-44de-bcd4-d7a753e7c313"
   },
   "execution_count": 13,
   "outputs": [
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "tokenizer_config.json:   0%|          | 0.00/48.0 [00:00<?, ?B/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "5d3515f5b99249118f03a3bba6337702"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "vocab.txt: 0.00B [00:00, ?B/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "ef5b2ef23bd746e18dfc1c65d6610e78"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "tokenizer.json: 0.00B [00:00, ?B/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "8c913887ace8439fad51f9c48a24b484"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Input IDs: tensor([[ 101, 1045, 2572, 2145, 3403, 2006, 2026, 4003,  102]])\n",
      "Attention mask: tensor([[1, 1, 1, 1, 1, 1, 1, 1, 1]])\n",
      "Number of tokens: 9\n",
      "\n",
      "Tokens: ['[CLS]', 'i', 'am', 'still', 'waiting', 'on', 'my', 'card', '[SEP]']\n"
     ]
    }
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    "Tokenizing full dataset"
   ],
   "metadata": {
    "id": "odj4nLnA_A0S"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "def tokenize_function(examples):\n",
    "    return tokenizer(\n",
    "        examples[\"text\"],\n",
    "        padding=\"max_length\",\n",
    "        truncation=True,\n",
    "        max_length=128\n",
    "    )\n",
    "\n",
    "# Apply tokenization to entire dataset\n",
    "tokenized_dataset = dataset.map(tokenize_function, batched=True)\n",
    "\n",
    "# Format for PyTorch\n",
    "tokenized_dataset = tokenized_dataset.rename_column(\"label\", \"labels\")\n",
    "tokenized_dataset.set_format(\"torch\",\n",
    "    columns=[\"input_ids\", \"attention_mask\", \"labels\"])\n",
    "\n",
    "print(\"Tokenization complete\")\n",
    "print(tokenized_dataset)"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 272,
     "referenced_widgets": [
      "3d3b4303c4084345b92dd994f8d6771e",
      "4070987387fe401c81d3a54d8e5c3ecf",
      "406aeedc023e43ddb502f3123683e90b",
      "4077bd422fb84cbfbfa5cb6c1dfb0348",
      "12e03c893c724b9b82dca8ad76883697",
      "3e2228d5ab694e959c6dcadb15778d1d",
      "23863c415a674344846d1880a2287863",
      "1f293d561028462b9d58953261cb8450",
      "a341a908e1244761af2029c9ae889f30",
      "b44449ffea8a463fbc7c1998f42afe8f",
      "76e943008cd742ddac2e196a12564527",
      "069d7689682640898a475a5c9b307948",
      "2e57cf4042f34d97b8d3f0664f844fea",
      "90b6944be5054513a454720d918ef05e",
      "8059c06376db454c86496ebf7508bcdd",
      "39a3b7ce8ef445b0908fbaf89aaa696d",
      "f402081cb93d41b5bc2302c12f8cc0df",
      "f3696cfa42554147b4e371169b6c21d2",
      "4868838542d0402fb9d6110cd5e501c0",
      "4c04f2bae3db4c97bb4ad896c70fde88",
      "30475722304246baa0bb481196a52f42",
      "2dcbb774a855432498b3bf61a43d524e"
     ]
    },
    "id": "Zq8IBR4G_Eph",
    "outputId": "0a01eb82-a0a0-41f4-bbf0-e5f9cf38ab87"
   },
   "execution_count": 25,
   "outputs": [
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "Map:   0%|          | 0/10003 [00:00<?, ? examples/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "3d3b4303c4084345b92dd994f8d6771e"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "Map:   0%|          | 0/3080 [00:00<?, ? examples/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "069d7689682640898a475a5c9b307948"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Tokenization complete\n",
      "DatasetDict({\n",
      "    train: Dataset({\n",
      "        features: ['text', 'labels', 'input_ids', 'token_type_ids', 'attention_mask'],\n",
      "        num_rows: 10003\n",
      "    })\n",
      "    test: Dataset({\n",
      "        features: ['text', 'labels', 'input_ids', 'token_type_ids', 'attention_mask'],\n",
      "        num_rows: 3080\n",
      "    })\n",
      "})\n"
     ]
    }
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    "Next we load D.Bert model"
   ],
   "metadata": {
    "id": "N0Zrh9f0BBkS"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "from transformers import AutoModelForSequenceClassification\n",
    "import torch\n",
    "\n",
    "# Load DistilBERT with classification head\n",
    "model = AutoModelForSequenceClassification.from_pretrained(\n",
    "    \"distilbert-base-uncased\",\n",
    "    num_labels=77\n",
    ")\n",
    "\n",
    "# Check model size\n",
    "total_params = sum(p.numel() for p in model.parameters())\n",
    "trainable_params = sum(p.numel() for p in model.parameters() if p.requires_grad)\n",
    "\n",
    "print(f\"Total parameters: {total_params:,}\")\n",
    "print(f\"Trainable parameters: {trainable_params:,}\")\n",
    "print(f\"\\nModel architecture:\")\n",
    "print(model)"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 1000,
     "referenced_widgets": [
      "83fca435c3524f5dbeedecd1c27e93c6",
      "669641020fdd4a888131fb973a0e3b78",
      "93caf7bedbd24892b1f62e3cc8ebea0c",
      "a65d0b219356463eb41a7ae68064e1d8",
      "1aa0bf6aab894ce3b5e1351141cde750",
      "3329862c824d41c297d30d85342a3112",
      "0cfc73b1d2934e35b335deb9720e6850",
      "34a42cb2c02f42c78748295f4b0d9abd",
      "988724583fd1492ca5afb282df022b54",
      "30b166b25cc748c68af7bb2dd2150e1b",
      "2c2b69d9109c45a7b0b4354310b46799",
      "b9f978dbfad94bc79124bff0f2b1cc21",
      "b54f7996d92746a4bd136eca6d171321",
      "e6946d5789d74179b4b0fff465645d60",
      "b8c624b4124a42399bc94351e2f01cbc",
      "66aa404df0854749ae1ccee3900d4fd6",
      "b4e708d619f94ad593ae3fd95950aa95",
      "56a38756f37b431fbc7d38609dda6351",
      "884a0768c0634d80a08cd151c1150baf",
      "3372b466426944fca669a2d75ae9897b",
      "5444e1997bd34a24b1b3f465a1433157",
      "7a49f4a8c9bf43b1b4341590648bba11",
      "b0116707b7914e09952aeaed53bc8b77",
      "211365c83af24826afd5c8335d44492b",
      "2be3baf810014eeeb1502bfae6a3a362",
      "417c846e302140498afe0ca730cdace2",
      "2e852df38b1b478aaa644da2b7eb03fe",
      "a7fef33895cc453194d30d0c12da43b4",
      "9d5a1a2087894cf0b0b9081901547f47",
      "64aed83b046a404eaa8ac0d7b0c819d3",
      "0a6c5caa64e24aaca5114384800f97c8",
      "4ccfdc8495f54e7c848cadb0f54cc7e4",
      "4e0a1a2e7db3408f855a7dbb38b5ab2c"
     ]
    },
    "id": "6m-wW5iMBFb4",
    "outputId": "3d9ce035-6dad-401e-f00b-5db1bc58b8e3"
   },
   "execution_count": 8,
   "outputs": [
    {
     "output_type": "stream",
     "name": "stderr",
     "text": [
      "/usr/local/lib/python3.12/dist-packages/huggingface_hub/utils/_auth.py:93: UserWarning: \n",
      "The secret `HF_TOKEN` does not exist in your Colab secrets.\n",
      "To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.\n",
      "You will be able to reuse this secret in all of your notebooks.\n",
      "Please note that authentication is recommended but still optional to access public models or datasets.\n",
      "  warnings.warn(\n",
      "Warning: You are sending unauthenticated requests to the HF Hub. Please set a HF_TOKEN to enable higher rate limits and faster downloads.\n",
      "WARNING:huggingface_hub.utils._http:Warning: You are sending unauthenticated requests to the HF Hub. Please set a HF_TOKEN to enable higher rate limits and faster downloads.\n"
     ]
    },
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "config.json:   0%|          | 0.00/483 [00:00<?, ?B/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "83fca435c3524f5dbeedecd1c27e93c6"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "model.safetensors:   0%|          | 0.00/268M [00:00<?, ?B/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "b9f978dbfad94bc79124bff0f2b1cc21"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "Loading weights:   0%|          | 0/100 [00:00<?, ?it/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "b0116707b7914e09952aeaed53bc8b77"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "stream",
     "name": "stderr",
     "text": [
      "DistilBertForSequenceClassification LOAD REPORT from: distilbert-base-uncased\n",
      "Key                     | Status     | \n",
      "------------------------+------------+-\n",
      "vocab_transform.bias    | UNEXPECTED | \n",
      "vocab_transform.weight  | UNEXPECTED | \n",
      "vocab_layer_norm.bias   | UNEXPECTED | \n",
      "vocab_projector.bias    | UNEXPECTED | \n",
      "vocab_layer_norm.weight | UNEXPECTED | \n",
      "classifier.weight       | MISSING    | \n",
      "pre_classifier.weight   | MISSING    | \n",
      "classifier.bias         | MISSING    | \n",
      "pre_classifier.bias     | MISSING    | \n",
      "\n",
      "Notes:\n",
      "- UNEXPECTED\t:can be ignored when loading from different task/architecture; not ok if you expect identical arch.\n",
      "- MISSING\t:those params were newly initialized because missing from the checkpoint. Consider training on your downstream task.\n"
     ]
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Total parameters: 67,012,685\n",
      "Trainable parameters: 67,012,685\n",
      "\n",
      "Model architecture:\n",
      "DistilBertForSequenceClassification(\n",
      "  (distilbert): DistilBertModel(\n",
      "    (embeddings): Embeddings(\n",
      "      (word_embeddings): Embedding(30522, 768, padding_idx=0)\n",
      "      (position_embeddings): Embedding(512, 768)\n",
      "      (LayerNorm): LayerNorm((768,), eps=1e-12, elementwise_affine=True)\n",
      "      (dropout): Dropout(p=0.1, inplace=False)\n",
      "    )\n",
      "    (transformer): Transformer(\n",
      "      (layer): ModuleList(\n",
      "        (0-5): 6 x TransformerBlock(\n",
      "          (attention): DistilBertSelfAttention(\n",
      "            (q_lin): Linear(in_features=768, out_features=768, bias=True)\n",
      "            (k_lin): Linear(in_features=768, out_features=768, bias=True)\n",
      "            (v_lin): Linear(in_features=768, out_features=768, bias=True)\n",
      "            (out_lin): Linear(in_features=768, out_features=768, bias=True)\n",
      "            (dropout): Dropout(p=0.1, inplace=False)\n",
      "          )\n",
      "          (sa_layer_norm): LayerNorm((768,), eps=1e-12, elementwise_affine=True)\n",
      "          (ffn): FFN(\n",
      "            (dropout): Dropout(p=0.1, inplace=False)\n",
      "            (lin1): Linear(in_features=768, out_features=3072, bias=True)\n",
      "            (lin2): Linear(in_features=3072, out_features=768, bias=True)\n",
      "            (activation): GELUActivation()\n",
      "          )\n",
      "          (output_layer_norm): LayerNorm((768,), eps=1e-12, elementwise_affine=True)\n",
      "        )\n",
      "      )\n",
      "    )\n",
      "  )\n",
      "  (pre_classifier): Linear(in_features=768, out_features=768, bias=True)\n",
      "  (classifier): Linear(in_features=768, out_features=77, bias=True)\n",
      "  (dropout): Dropout(p=0.2, inplace=False)\n",
      ")\n"
     ]
    }
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    "Apply LORA"
   ],
   "metadata": {
    "id": "GAPflyxgDi3z"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "from peft import LoraConfig, get_peft_model, TaskType\n",
    "\n",
    "# Define LoRA configuration\n",
    "lora_config = LoraConfig(\n",
    "    r=8,                     # rank\n",
    "    lora_alpha=16,           # scaling factor\n",
    "    target_modules=[\"q_lin\", \"v_lin\"],  # attention matrices\n",
    "    lora_dropout=0.1,        # dropout for regularization\n",
    "    bias=\"none\",             # don't train bias terms\n",
    "    task_type=TaskType.SEQ_CLS  # sequence classification\n",
    ")\n",
    "\n",
    "# Wrap model with LoRA\n",
    "model = get_peft_model(model, lora_config)\n",
    "\n",
    "# Verify trainable parameters\n",
    "model.print_trainable_parameters()"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "bBSDZW8cDl6S",
    "outputId": "5e49c45d-1d25-4ba7-b79a-39c083b7a0d1"
   },
   "execution_count": 10,
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "trainable params: 797,261 || all params: 67,809,946 || trainable%: 1.1757\n"
     ]
    }
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    "Handle Class Imbalance"
   ],
   "metadata": {
    "id": "d0bJwYzuED0y"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "import torch\n",
    "import numpy as np\n",
    "from torch.nn import CrossEntropyLoss\n",
    "\n",
    "# Calculate class weights\n",
    "label_counts = torch.zeros(77)\n",
    "for example in tokenized_dataset[\"train\"]:\n",
    "    label_counts[example[\"labels\"]] += 1\n",
    "\n",
    "# Inverse frequency weighting\n",
    "class_weights = 1.0 / label_counts\n",
    "class_weights = class_weights / class_weights.sum() * 77\n",
    "\n",
    "print(\"Class weights calculated\")\n",
    "print(f\"Max weight: {class_weights.max():.4f}\")\n",
    "print(f\"Min weight: {class_weights.min():.4f}\")\n",
    "print(f\"Weight ratio: {class_weights.max()/class_weights.min():.2f}x\")"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "2lW4p2NIEEwp",
    "outputId": "c6199a86-c6d7-4f0e-cf4d-0da1dc405ded"
   },
   "execution_count": 26,
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Class weights calculated\n",
      "Max weight: 3.3678\n",
      "Min weight: 0.6303\n",
      "Weight ratio: 5.34x\n"
     ]
    }
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    "Training Setup"
   ],
   "metadata": {
    "id": "woAiMK7CE5p4"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "from transformers import TrainingArguments, Trainer\n",
    "import evaluate\n",
    "import numpy as np\n",
    "\n",
    "# Load accuracy metric\n",
    "metric = evaluate.load(\"accuracy\")\n",
    "\n",
    "def compute_metrics(eval_pred):\n",
    "    logits, labels = eval_pred\n",
    "    predictions = np.argmax(logits, axis=-1)\n",
    "    return metric.compute(predictions=predictions, references=labels)\n",
    "\n",
    "# Training arguments\n",
    "training_args = TrainingArguments(\n",
    "    output_dir=\"./banking77-lora\",\n",
    "    num_train_epochs=5,\n",
    "    per_device_train_batch_size=32,\n",
    "    per_device_eval_batch_size=64,\n",
    "    warmup_steps=100,\n",
    "    weight_decay=0.01,\n",
    "    logging_dir=\"./logs\",\n",
    "    logging_steps=50,\n",
    "    eval_strategy=\"epoch\",\n",
    "    save_strategy=\"epoch\",\n",
    "    load_best_model_at_end=True,\n",
    "    metric_for_best_model=\"accuracy\",\n",
    "    fp16=True\n",
    ")\n",
    "\n",
    "print(\"Training arguments configured\")\n",
    "print(f\"Epochs: {training_args.num_train_epochs}\")\n",
    "print(f\"Batch size: {training_args.per_device_train_batch_size}\")"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 118,
     "referenced_widgets": [
      "30a35724f4ab47a79f986e445f9fb45a",
      "e0693b3f938b45efb3e9e4a57fdb271b",
      "ad6691d6dd9b4c238268285f4b904324",
      "75cf0ab190274751a2600973261cae5f",
      "7493d553c592409a9996fe3733862622",
      "bc4e07ef062e45559c45093ed6189ff1",
      "292d1e16fa4b4344b7911fab0f700bbf",
      "8e43b5e38ef443e8a3f39a950fbf71e8",
      "6765a4b2da96451382db666a2c254e31",
      "79400bfe8b79423aabc1bb84509be578",
      "49fc3dbd7b244374af8f38f6987adaa9"
     ]
    },
    "id": "qQGl2_JcE3B5",
    "outputId": "5a61e27b-cdbc-4044-a4ce-bf1816085d27"
   },
   "execution_count": 27,
   "outputs": [
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "Downloading builder script: 0.00B [00:00, ?B/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "30a35724f4ab47a79f986e445f9fb45a"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "stream",
     "name": "stderr",
     "text": [
      "`logging_dir` is deprecated and will be removed in v5.2. Please set `TENSORBOARD_LOGGING_DIR` instead.\n"
     ]
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Training arguments configured\n",
      "Epochs: 5\n",
      "Batch size: 32\n"
     ]
    }
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    " Create Weighted Trainer"
   ],
   "metadata": {
    "id": "ojEwhpP_GMST"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "from torch.nn import CrossEntropyLoss\n",
    "\n",
    "# Custom trainer to handle class imbalance\n",
    "class WeightedTrainer(Trainer):\n",
    "    def compute_loss(self, model, inputs, return_outputs=False, **kwargs):\n",
    "        labels = inputs.get(\"labels\")\n",
    "        outputs = model(**inputs)\n",
    "        logits = outputs.get(\"logits\")\n",
    "\n",
    "        # Apply class weights to loss\n",
    "        loss_fct = CrossEntropyLoss(\n",
    "            weight=class_weights.to(model.device)\n",
    "        )\n",
    "        loss = loss_fct(logits.view(-1, 77), labels.view(-1))\n",
    "\n",
    "        return (loss, outputs) if return_outputs else loss\n",
    "\n",
    "# Split validation set from training data\n",
    "train_val = tokenized_dataset[\"train\"].train_test_split(\n",
    "    test_size=0.1,\n",
    "    seed=42\n",
    ")\n",
    "\n",
    "# Initialize trainer\n",
    "trainer = WeightedTrainer(\n",
    "    model=model,\n",
    "    args=training_args,\n",
    "    train_dataset=train_val[\"train\"],\n",
    "    eval_dataset=train_val[\"test\"],\n",
    "    compute_metrics=compute_metrics,\n",
    ")\n",
    "\n",
    "print(\"Trainer initialized\")\n",
    "print(f\"Training examples: {len(train_val['train'])}\")\n",
    "print(f\"Validation examples: {len(train_val['test'])}\")"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/"
    },
    "id": "Dw_qRMBhGNuR",
    "outputId": "7fc393e4-7ba3-40d3-9d56-2b10d669f3d9"
   },
   "execution_count": 28,
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Trainer initialized\n",
      "Training examples: 9002\n",
      "Validation examples: 1001\n"
     ]
    }
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    "Training of model"
   ],
   "metadata": {
    "id": "oGcLNKgCGy_x"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "# Save model to Google Drive to prevent losing progress\n",
    "from google.colab import drive\n",
    "drive.mount('/content/drive')\n",
    "\n",
    "# Start training\n",
    "print(\"Starting training...\")\n",
    "trainer.train()\n",
    "\n",
    "# Save final model\n",
    "trainer.save_model(\"/content/drive/MyDrive/banking77-lora-final\")\n",
    "print(\"Model saved to Google Drive\")"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 285
    },
    "id": "Dn26Q34UG3px",
    "outputId": "c335d4d9-a1cc-47a7-9214-d44a79ae7a79"
   },
   "execution_count": 29,
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Mounted at /content/drive\n",
      "Starting training...\n"
     ]
    },
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ],
      "text/html": [
       "\n",
       "    <div>\n",
       "      \n",
       "      <progress value='1410' max='1410' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
       "      [1410/1410 01:45, Epoch 5/5]\n",
       "    </div>\n",
       "    <table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       " <tr style=\"text-align: left;\">\n",
       "      <th>Epoch</th>\n",
       "      <th>Training Loss</th>\n",
       "      <th>Validation Loss</th>\n",
       "      <th>Accuracy</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <td>1</td>\n",
       "      <td>3.995700</td>\n",
       "      <td>3.609172</td>\n",
       "      <td>0.293706</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <td>2</td>\n",
       "      <td>2.572789</td>\n",
       "      <td>2.307555</td>\n",
       "      <td>0.604396</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <td>3</td>\n",
       "      <td>2.008083</td>\n",
       "      <td>1.736333</td>\n",
       "      <td>0.693307</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <td>4</td>\n",
       "      <td>1.693004</td>\n",
       "      <td>1.496839</td>\n",
       "      <td>0.712288</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <td>5</td>\n",
       "      <td>1.582025</td>\n",
       "      <td>1.425961</td>\n",
       "      <td>0.735265</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table><p>"
      ]
     },
     "metadata": {}
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Model saved to Google Drive\n"
     ]
    }
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    "Model Evaluation"
   ],
   "metadata": {
    "id": "1xAONxM4H-U7"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "import numpy as np\n",
    "from sklearn.metrics import classification_report, confusion_matrix\n",
    "import matplotlib.pyplot as plt\n",
    "import seaborn as sns\n",
    "\n",
    "# Get predictions on test set\n",
    "predictions = trainer.predict(tokenized_dataset[\"test\"])\n",
    "pred_labels = np.argmax(predictions.predictions, axis=-1)\n",
    "true_labels = predictions.label_ids\n",
    "\n",
    "# Overall accuracy\n",
    "accuracy = (pred_labels == true_labels).mean()\n",
    "print(f\"Test Accuracy: {accuracy:.4f} ({accuracy*100:.2f}%)\")\n",
    "\n",
    "# Detailed per class report\n",
    "class_names = dataset[\"test\"].features[\"label\"].names\n",
    "report = classification_report(\n",
    "    true_labels,\n",
    "    pred_labels,\n",
    "    target_names=class_names,\n",
    "    output_dict=True\n",
    ")\n",
    "\n",
    "# Find best and worst performing intents\n",
    "report_df = pd.DataFrame(report).transpose()\n",
    "report_df = report_df.drop(\n",
    "    [\"accuracy\", \"macro avg\", \"weighted avg\"]\n",
    ")\n",
    "\n",
    "print(\"\\nTop 5 best performing intents:\")\n",
    "print(report_df.nlargest(5, \"f1-score\")[[\"f1-score\", \"support\"]])\n",
    "\n",
    "print(\"\\nTop 5 worst performing intents:\")\n",
    "print(report_df.nsmallest(5, \"f1-score\")[[\"f1-score\", \"support\"]])"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 312
    },
    "id": "NCqJLNLpIBdd",
    "outputId": "b9dd7cb3-7ee5-4c4c-d95f-2b54e2056cbe"
   },
   "execution_count": 30,
   "outputs": [
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "<IPython.core.display.HTML object>"
      ],
      "text/html": []
     },
     "metadata": {}
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Test Accuracy: 0.7175 (71.75%)\n",
      "\n",
      "Top 5 best performing intents:\n",
      "                    f1-score  support\n",
      "verify_top_up       1.000000     40.0\n",
      "age_limit           0.975610     40.0\n",
      "change_pin          0.950000     40.0\n",
      "passcode_forgotten  0.930233     40.0\n",
      "get_physical_card   0.928571     40.0\n",
      "\n",
      "Top 5 worst performing intents:\n",
      "                                    f1-score  support\n",
      "transfer_not_received_by_recipient  0.310345     40.0\n",
      "cash_withdrawal_not_recognised      0.338983     40.0\n",
      "supported_cards_and_currencies      0.339623     40.0\n",
      "topping_up_by_card                  0.339623     40.0\n",
      "top_up_by_bank_transfer_charge      0.392857     40.0\n"
     ]
    }
   ]
  },
  {
   "cell_type": "code",
   "source": [
    "model.save_pretrained(\"banking77-lora-final\")\n",
    "tokenizer.save_pretrained(\"banking77-lora-final\")\n",
    "print(\"Model saved locally\")"
   ],
   "metadata": {
    "id": "HXa6IDJnCjj3",
    "outputId": "0a070d10-f66f-4622-cbbd-aa03fd7a9fe2",
    "colab": {
     "base_uri": "https://localhost:8080/"
    }
   },
   "execution_count": 32,
   "outputs": [
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Model saved locally\n"
     ]
    }
   ]
  },
  {
   "cell_type": "markdown",
   "source": [
    "Inference Code"
   ],
   "metadata": {
    "id": "2TwhO54Px12T"
   }
  },
  {
   "cell_type": "code",
   "source": [
    "from peft import PeftModel, PeftConfig\n",
    "from transformers import AutoModelForSequenceClassification, AutoTokenizer\n",
    "import torch\n",
    "\n",
    "# Load your fine-tuned model\n",
    "def load_model(model_path=\"./banking77-lora-final\"):\n",
    "    tokenizer = AutoTokenizer.from_pretrained(model_path)\n",
    "    config = PeftConfig.from_pretrained(model_path)\n",
    "    model = AutoModelForSequenceClassification.from_pretrained(\n",
    "        config.base_model_name_or_path,\n",
    "        num_labels=77\n",
    "    )\n",
    "    model = PeftModel.from_pretrained(model, model_path)\n",
    "    model.eval()\n",
    "    return model, tokenizer\n",
    "\n",
    "# Predict intent\n",
    "def predict_intent(text, model, tokenizer):\n",
    "    class_names = dataset[\"test\"].features[\"label\"].names\n",
    "\n",
    "    inputs = tokenizer(\n",
    "        text,\n",
    "        return_tensors=\"pt\",\n",
    "        padding=True,\n",
    "        truncation=True,\n",
    "        max_length=128\n",
    "    )\n",
    "\n",
    "    with torch.no_grad():\n",
    "        outputs = model(**inputs)\n",
    "        probabilities = torch.softmax(outputs.logits, dim=-1)\n",
    "        confidence, predicted_class = torch.max(probabilities, dim=-1)\n",
    "\n",
    "    return {\n",
    "        \"intent\": class_names[predicted_class.item()],\n",
    "        \"confidence\": f\"{confidence.item()*100:.2f}%\",\n",
    "        \"text\": text\n",
    "    }\n",
    "\n",
    "# Load model\n",
    "model, tokenizer = load_model()\n",
    "\n",
    "# Test with real examples\n",
    "test_queries = [\n",
    "    \"I lost my card and need a replacement\",\n",
    "    \"Why was my payment declined?\",\n",
    "    \"How do I add money to my account?\",\n",
    "    \"I want to change my PIN number\",\n",
    "    \"What currencies do you support?\"\n",
    "]\n",
    "\n",
    "print(\"Intent Classification Results:\")\n",
    "print(\"=\"*50)\n",
    "for query in test_queries:\n",
    "    result = predict_intent(query, model, tokenizer)\n",
    "    print(f\"\\nText: {result['text']}\")\n",
    "    print(f\"Intent: {result['intent']}\")\n",
    "    print(f\"Confidence: {result['confidence']}\")"
   ],
   "metadata": {
    "colab": {
     "base_uri": "https://localhost:8080/",
     "height": 708,
     "referenced_widgets": [
      "6d1d9c5c8eef4194987337d6b9460eab",
      "c60e097ae7b74ce0b0643759a3d3b7e9",
      "76d184cb05634b18ae417b8e55e11969",
      "6055c976102140c486f4e7c5d7769d17",
      "43ff9fa4a0ab42aebc985ee1db03bd67",
      "1c4ed9c9153b4fffb0085f4bb7951c1a",
      "cc2a475498f040f4904916a3616fb63e",
      "9b9fed4da36f45c0b58bc93a025e4d4f",
      "bce6f1ae436f49ff93c9c1c806ac6481",
      "ddec6967ce674c7c89d68eaa05ede1c8",
      "ccf88702043a455abac5352aca0141a0"
     ]
    },
    "id": "MSa_7Zpcx4td",
    "outputId": "db9a8cee-ab7d-4654-cfbf-e0cad855a3b2"
   },
   "execution_count": 33,
   "outputs": [
    {
     "output_type": "display_data",
     "data": {
      "text/plain": [
       "Loading weights:   0%|          | 0/100 [00:00<?, ?it/s]"
      ],
      "application/vnd.jupyter.widget-view+json": {
       "version_major": 2,
       "version_minor": 0,
       "model_id": "6d1d9c5c8eef4194987337d6b9460eab"
      }
     },
     "metadata": {}
    },
    {
     "output_type": "stream",
     "name": "stderr",
     "text": [
      "DistilBertForSequenceClassification LOAD REPORT from: distilbert-base-uncased\n",
      "Key                     | Status     | \n",
      "------------------------+------------+-\n",
      "vocab_transform.bias    | UNEXPECTED | \n",
      "vocab_transform.weight  | UNEXPECTED | \n",
      "vocab_layer_norm.bias   | UNEXPECTED | \n",
      "vocab_projector.bias    | UNEXPECTED | \n",
      "vocab_layer_norm.weight | UNEXPECTED | \n",
      "classifier.weight       | MISSING    | \n",
      "pre_classifier.weight   | MISSING    | \n",
      "classifier.bias         | MISSING    | \n",
      "pre_classifier.bias     | MISSING    | \n",
      "\n",
      "Notes:\n",
      "- UNEXPECTED\t:can be ignored when loading from different task/architecture; not ok if you expect identical arch.\n",
      "- MISSING\t:those params were newly initialized because missing from the checkpoint. Consider training on your downstream task.\n"
     ]
    },
    {
     "output_type": "stream",
     "name": "stdout",
     "text": [
      "Intent Classification Results:\n",
      "==================================================\n",
      "\n",
      "Text: I lost my card and need a replacement\n",
      "Intent: card_not_working\n",
      "Confidence: 14.40%\n",
      "\n",
      "Text: Why was my payment declined?\n",
      "Intent: declined_card_payment\n",
      "Confidence: 19.94%\n",
      "\n",
      "Text: How do I add money to my account?\n",
      "Intent: transfer_into_account\n",
      "Confidence: 16.11%\n",
      "\n",
      "Text: I want to change my PIN number\n",
      "Intent: change_pin\n",
      "Confidence: 47.46%\n",
      "\n",
      "Text: What currencies do you support?\n",
      "Intent: fiat_currency_support\n",
      "Confidence: 35.15%\n"
     ]
    }
   ]
  }
 ]
}