Rishi-0812 committed on
Commit
933716f
·
verified ·
1 Parent(s): 5f38cfb

Upload 10 files

Browse files

- Added pre-trained BERT model files (config, checkpoints, vocab).
- Uploaded fine-tuned BERT model and weights.
- Included requirements.txt with specific dependencies.
- Added README.md with instructions on model usage and dependencies.
- Added Python script for running the model and making predictions.

.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ bert_model.ckpt.data-00000-of-00001 filter=lfs diff=lfs merge=lfs -text
Intent predictor.ipynb ADDED
@@ -0,0 +1,194 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cells": [
3
+ {
4
+ "cell_type": "code",
5
+ "execution_count": 1,
6
+ "metadata": {},
7
+ "outputs": [],
8
+ "source": [
9
+ "import os\n",
10
+ "import math\n",
11
+ "import datetime\n",
12
+ "\n",
13
+ "from tqdm import tqdm\n",
14
+ "\n",
15
+ "import pandas as pd\n",
16
+ "import numpy as np\n",
17
+ "\n",
18
+ "import tensorflow as tf\n",
19
+ "from tensorflow import keras\n",
20
+ "\n",
21
+ "import bert\n",
22
+ "from bert import BertModelLayer\n",
23
+ "from bert.loader import StockBertConfig, map_stock_config_to_params, load_stock_weights\n",
24
+ "from bert.tokenization.bert_tokenization import FullTokenizer"
25
+ ]
26
+ },
27
+ {
28
+ "cell_type": "code",
29
+ "execution_count": 2,
30
+ "metadata": {},
31
+ "outputs": [],
32
+ "source": [
33
+ "bert_model_name=\"uncased_L-12_H-768_A-12\"\n",
34
+ "\n",
35
+ "bert_ckpt_dir = os.path.join(\"model/\", bert_model_name)\n",
36
+ "bert_ckpt_file = os.path.join(bert_ckpt_dir, \"bert_model.ckpt\")\n",
37
+ "bert_config_file = os.path.join(bert_ckpt_dir, \"bert_config.json\")"
38
+ ]
39
+ },
40
+ {
41
+ "cell_type": "code",
42
+ "execution_count": 3,
43
+ "metadata": {},
44
+ "outputs": [],
45
+ "source": [
46
+ "tokenizer = FullTokenizer(vocab_file=os.path.join(bert_ckpt_dir, \"vocab.txt\"))"
47
+ ]
48
+ },
49
+ {
50
+ "cell_type": "code",
51
+ "execution_count": 4,
52
+ "metadata": {},
53
+ "outputs": [],
54
+ "source": [
55
+ "classes = ['service_availability_check',\n",
56
+ " 'billing_inquiry', \n",
57
+ " 'order_cancellation',\n",
58
+ " 'address_verification',\n",
59
+ " 'user_authentication',\n",
60
+ " 'account_information_update',\n",
61
+ " 'call_divert', \n",
62
+ " 'customer_service_escalation',\n",
63
+ " 'appointment_scheduling',\n",
64
+ " 'order_status_inquiry',\n",
65
+ " 'product_information_request',\n",
66
+ " 'complaint_registration',\n",
67
+ " 'call_disconnect',\n",
68
+ " 'appointment_confirmation', \n",
69
+ " 'appointment_cancellation']\n",
70
+ "\n",
71
+ "\n",
72
+ "max_seq_len = 200"
73
+ ]
74
+ },
75
+ {
76
+ "cell_type": "code",
77
+ "execution_count": 5,
78
+ "metadata": {},
79
+ "outputs": [],
80
+ "source": [
81
+ "def create_model(max_seq_len, bert_ckpt_file):\n",
82
+ " with tf.io.gfile.GFile(bert_config_file, \"r\") as reader:\n",
83
+ " bc = StockBertConfig.from_json_string(reader.read())\n",
84
+ " bert_params = map_stock_config_to_params(bc)\n",
85
+ " bert_params.adapter_size = None\n",
86
+ " bert = BertModelLayer.from_params(bert_params, name=\"bert\")\n",
87
+ " input_ids = keras.layers.Input(\n",
88
+ " shape=(max_seq_len, ),\n",
89
+ " dtype='int32',\n",
90
+ " name=\"input_ids\"\n",
91
+ " )\n",
92
+ " bert_output = bert(input_ids)\n",
93
+ " print(\"bert shape\", bert_output.shape)\n",
94
+ " cls_out = keras.layers.Lambda(lambda seq: seq[:, 0, :])(bert_output)\n",
95
+ " cls_out = keras.layers.Dropout(0.5)(cls_out)\n",
96
+ " logits = keras.layers.Dense(units=768, activation=\"tanh\")(cls_out)\n",
97
+ " logits = keras.layers.Dropout(0.5)(logits)\n",
98
+ " logits = keras.layers.Dense(\n",
99
+ " units=len(classes),\n",
100
+ " activation=\"softmax\"\n",
101
+ " )(logits)\n",
102
+ " model = keras.Model(inputs=input_ids, outputs=logits)\n",
103
+ " model.build(input_shape=(None, max_seq_len))\n",
104
+ " load_stock_weights(bert, bert_ckpt_file)\n",
105
+ " return model\n"
106
+ ]
107
+ },
108
+ {
109
+ "cell_type": "code",
110
+ "execution_count": null,
111
+ "metadata": {},
112
+ "outputs": [],
113
+ "source": [
114
+ "model = create_model(max_seq_len, bert_ckpt_file)"
115
+ ]
116
+ },
117
+ {
118
+ "cell_type": "code",
119
+ "execution_count": 7,
120
+ "metadata": {},
121
+ "outputs": [],
122
+ "source": [
123
+ "model.load_weights('bert_adv_synthetic_weights_v2(14).h5') "
124
+ ]
125
+ },
126
+ {
127
+ "cell_type": "code",
128
+ "execution_count": 17,
129
+ "metadata": {},
130
+ "outputs": [],
131
+ "source": [
132
+ "# Run this if you change the max_seq_len\n",
133
+ "#model.save('bert_200_max_seq_len_model.h5') \n",
134
+ " "
135
+ ]
136
+ },
137
+ {
138
+ "cell_type": "code",
139
+ "execution_count": 8,
140
+ "metadata": {},
141
+ "outputs": [],
142
+ "source": [
143
+ "def intent_recognizer(sentences):\n",
144
+ " pred_tokens = map(tokenizer.tokenize, sentences)\n",
145
+ " pred_tokens = map(lambda tok: [\"[CLS]\"] + tok + [\"[SEP]\"], pred_tokens)\n",
146
+ " pred_token_ids = list(map(tokenizer.convert_tokens_to_ids, pred_tokens))\n",
147
+ " pred_token_ids = map(lambda tids: tids +[0]*(max_seq_len-len(tids)),pred_token_ids)\n",
148
+ " pred_token_ids = np.array(list(pred_token_ids))\n",
149
+ " predictions = model.predict(pred_token_ids).argmax(axis=-1)\n",
150
+ " for text, label in zip(sentences, predictions):\n",
151
+ " print(\"text:\", text, \"\\nintent:\", classes[label])\n",
152
+ " print()"
153
+ ]
154
+ },
155
+ {
156
+ "cell_type": "code",
157
+ "execution_count": null,
158
+ "metadata": {},
159
+ "outputs": [],
160
+ "source": [
161
+ "sentences = [\"While I’ve been speaking with you, I realized that my particular request might be better handled by someone with a more specialized focus. I believe there’s another team, maybe the one that deals with customer inquiries more closely, that would be better suited to help me. It seems like my issue falls outside the general scope, and I’d really appreciate being put in touch with the department or individual who is more equipped to provide the support I’m looking for. I’m thinking maybe the sales or technical support team could be more in line with what I need.\"]\n",
162
+ "intent_recognizer(sentences)"
163
+ ]
164
+ },
165
+ {
166
+ "cell_type": "code",
167
+ "execution_count": null,
168
+ "metadata": {},
169
+ "outputs": [],
170
+ "source": []
171
+ }
172
+ ],
173
+ "metadata": {
174
+ "kernelspec": {
175
+ "display_name": "base",
176
+ "language": "python",
177
+ "name": "python3"
178
+ },
179
+ "language_info": {
180
+ "codemirror_mode": {
181
+ "name": "ipython",
182
+ "version": 3
183
+ },
184
+ "file_extension": ".py",
185
+ "mimetype": "text/x-python",
186
+ "name": "python",
187
+ "nbconvert_exporter": "python",
188
+ "pygments_lexer": "ipython3",
189
+ "version": "3.7.4"
190
+ }
191
+ },
192
+ "nbformat": 4,
193
+ "nbformat_minor": 2
194
+ }
README.md ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ # Custom BERT Model for Intent Recognition
3
+
4
+ This repository contains a custom fine-tuned BERT model for intent recognition. The model was trained to recognize a set of customer service-related intents, and it's based on the pre-trained BERT architecture (uncased_L-12_H-768_A-12).
5
+
6
+ ## Python Version
7
+
8
+ This project is compatible with **Python 3.7.4**. It is recommended to use this version for compatibility with the listed dependencies.
9
+
10
+ ## Model Information
11
+
12
+ - **Base Architecture**: BERT (uncased_L-12_H-768_A-12)
13
+ - **Max Sequence Length**: 200
14
+ - **Number of Intents**: 15
15
+
16
+ ## Classes
17
+
18
+ The model is trained to classify the following customer service-related intents:
19
+ Do not change the order of these classes when initializing — the model's output indices depend on it.
20
+
21
+ 1. `service_availability_check`
22
+ 2. `billing_inquiry`
23
+ 3. `order_cancellation`
24
+ 4. `address_verification`
25
+ 5. `user_authentication`
26
+ 6. `account_information_update`
27
+ 7. `call_divert`
28
+ 8. `customer_service_escalation`
29
+ 9. `appointment_scheduling`
30
+ 10. `order_status_inquiry`
31
+ 11. `product_information_request`
32
+ 12. `complaint_registration`
33
+ 13. `call_disconnect`
34
+ 14. `appointment_confirmation`
35
+ 15. `appointment_cancellation`
36
+
37
+ ## How to Use
38
+
39
+ To use the model, load the configuration file (bert_config.json), the checkpoint files (bert_model.ckpt*), and the vocabulary file (vocab.txt). Along with these, load the saved fine-tuned model or weights (if you plan to modify layers or change the max_seq_len [the length of input sentences]). This ensures that the model is correctly configured and functions as expected for your custom use case.
40
+
41
+ ## Intended Use
42
+
43
+ This model is designed for intent recognition in customer service applications and supports a variety of queries such as billing inquiries, order cancellations, service availability checks, and more.
44
+
45
+ .
bert_200_max_seq_len_model.h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5caa23740f8446cb18470b329be05337a7f6f9ff044cf9150beefa48e491ef7f
3
+ size 438221296
bert_adv_synthetic_weights_v2(14).h5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f2733aa63247a3f1e7671c8283521e94d552a12f0ad79cebd66502cd46902c7b
3
+ size 438219568
bert_config.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "attention_probs_dropout_prob": 0.1,
3
+ "hidden_act": "gelu",
4
+ "hidden_dropout_prob": 0.1,
5
+ "hidden_size": 768,
6
+ "initializer_range": 0.02,
7
+ "intermediate_size": 3072,
8
+ "max_position_embeddings": 512,
9
+ "num_attention_heads": 12,
10
+ "num_hidden_layers": 12,
11
+ "type_vocab_size": 2,
12
+ "vocab_size": 30522
13
+ }
bert_model.ckpt.data-00000-of-00001 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58580dc5e0bf0ae0d2efd51d0e8272b2f808857f0a43a88aaf7549da6d7a8a84
3
+ size 440425712
bert_model.ckpt.index ADDED
Binary file (8.53 kB). View file
 
bert_model.ckpt.meta ADDED
Binary file (904 kB). View file
 
requirements.txt ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+
2
+ # Python 3.7.4 required
3
+ tensorflow==2.2.0
4
+ keras==2.3.0-tf
5
+ bert-for-tf2==0.14.9
6
+ pandas==1.3.5
7
+ numpy==1.19.5
vocab.txt ADDED
The diff for this file is too large to render. See raw diff