Upload app.py
app.py
ADDED
@@ -0,0 +1,280 @@
#!/usr/bin/env python
# coding: utf-8

# # CHATBOTS - Using Natural Language Processing and TensorFlow
# In this notebook we build a chatbot that understands the context of a sentence and responds accordingly.
# These are the things we are going to do in this project:
# 1. Transform the conversational intents into a TensorFlow model (a neural network built with TFLearn) using NLP, and save the training data as a pickle.
# 2. Load that same pickle and model to build the framework that processes responses.
# 3. Finally, show how inputs are processed and responses are produced.
# -------------------------------------------------------------------------------------------------------
#
# ##### TFLEARN - TFLearn is a modular and transparent deep learning library built on top of TensorFlow. It was designed to provide a higher-level API to TensorFlow in order to facilitate and speed up experimentation, while remaining fully transparent and compatible with it. (http://tflearn.org/)
# -------------------------------------------------------------------------------------------------------
# ##### TENSORFLOW - TensorFlow is an end-to-end open source platform for machine learning. It has a comprehensive, flexible ecosystem of tools, libraries and community resources that lets researchers push the state of the art in ML and developers easily build and deploy ML-powered applications.

# In[5]:


# Used in the TensorFlow model
import numpy as np
import tensorflow.compat.v1 as tf
tf.disable_v2_behavior()
import tflearn
import random

# Used for contextualisation and other NLP tasks
import nltk
from nltk.stem.lancaster import LancasterStemmer
nltk.download('punkt', quiet=True)  # nltk.word_tokenize needs the punkt tokenizer models
stemmer = LancasterStemmer()

# Other
import json
import pickle
import warnings
warnings.filterwarnings("ignore")
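
# The import block above assumes these packages are available; the exact
# install line is a guess, not taken from the original repo (tflearn relies
# on the TF1 compatibility API used above):
#   pip install numpy nltk tflearn tensorflow gradio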


# In[6]:


print("Processing the Intents.....")
with open('intents.json') as json_data:
    intents = json.load(json_data)
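
# For reference, a minimal sketch of the intents.json structure this script
# expects, inferred from how the code accesses it below; the tags, patterns
# and responses here are made-up examples, not the actual file contents:
#
# {"intents": [
#     {"tag": "greeting",
#      "patterns": ["Hi", "How are you?"],
#      "responses": ["Hello!", "Hi there, how can I help?"]}
# ]}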


# In[7]:


words = []
classes = []
documents = []
ignore_words = ['?']
print("Looping through the Intents to Convert them to words, classes, documents and ignore_words.......")
for intent in intents['intents']:
    for pattern in intent['patterns']:
        # Tokenize each word in the sentence
        w = nltk.word_tokenize(pattern)
        # Add to our words list
        words.extend(w)
        # Add to documents in our corpus
        documents.append((w, intent['tag']))
        # Add to our classes list
        if intent['tag'] not in classes:
            classes.append(intent['tag'])
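
# With the hypothetical "greeting" intent sketched above, this loop would
# leave us with something like (illustrative values only):
#   words     -> ['Hi', 'How', 'are', 'you', '?']
#   documents -> [(['Hi'], 'greeting'), (['How', 'are', 'you', '?'], 'greeting')]
#   classes   -> ['greeting']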


# In[8]:


print("Stemming, Lowering and Removing Duplicates.......")
words = [stemmer.stem(w.lower()) for w in words if w not in ignore_words]
words = sorted(list(set(words)))

# Remove duplicates from the class list as well
classes = sorted(list(set(classes)))

print(len(documents), "documents")
print(len(classes), "classes", classes)
print(len(words), "unique stemmed words", words)


# In[9]:


print("Creating the Data for our Model.....")
training = []
print("Creating an Empty List for Output.....")
output_empty = [0] * len(classes)

print("Creating Training Set, Bag of Words for our Model....")
for doc in documents:
    # List of tokenized words for the pattern
    pattern_words = doc[0]
    # Stem each word
    pattern_words = [stemmer.stem(word.lower()) for word in pattern_words]

    # Bag of words: 1 for each vocabulary word present in the pattern, else 0
    bag = [1 if w in pattern_words else 0 for w in words]

    # Output is a '0' for each tag and '1' for the current tag
    output_row = list(output_empty)
    output_row[classes.index(doc[1])] = 1

    # Append the feature vector and output row as a tuple
    training.append((bag, output_row))

print("Shuffling Randomly and Converting into Numpy Array for Faster Processing......")
random.shuffle(training)

# Separate feature vectors and output rows into separate arrays
train_x = np.array([x[0] for x in training])
train_y = np.array([x[1] for x in training])

print("Building Neural Network for Our Chatbot to be Contextual....")
print("Resetting graph data....")
tf.reset_default_graph()
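
# A worked example of one training row (values are illustrative): if the
# stemmed vocabulary is ['ar', 'hi', 'how', 'you'] and the pattern
# "How are you?" stems to ['how', 'ar', 'you'] with tag 'greeting' (first of
# two classes), the pair appended to `training` would be:
#   bag        -> [1, 0, 1, 1]
#   output_row -> [1, 0]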


# In[10]:


# Input layer size matches the vocabulary; output layer size matches the classes
net = tflearn.input_data(shape=[None, len(train_x[0])])
net = tflearn.fully_connected(net, 8)
net = tflearn.fully_connected(net, 8)
net = tflearn.fully_connected(net, len(train_y[0]), activation='softmax')
net = tflearn.regression(net)
print("Training....")


# In[11]:


model = tflearn.DNN(net, tensorboard_dir='tflearn_logs')


# In[12]:


print("Training the Model.......")
model.fit(train_x, train_y, n_epoch=1000, batch_size=8, show_metric=True)
print("Saving the Model.......")
model.save('model.tflearn')


# In[13]:


# Pickle the vocabulary, classes and training data for later reuse
pickle.dump({'words': words, 'classes': classes, 'train_x': train_x, 'train_y': train_y},
            open("training_data", "wb"))
print("Pickle is also Saved..........")


# In[14]:


print("Loading Pickle.....")
# Deserialize the training data (convert the byte stream back into objects)
data = pickle.load(open("training_data", "rb"))
words = data['words']
classes = data['classes']
train_x = data['train_x']
train_y = data['train_y']

with open('intents.json') as json_data:
    intents = json.load(json_data)

print("Loading the Model......")
# Load our saved model
model.load('./model.tflearn')


# In[30]:


def clean_up_sentence(sentence):
    # Tokenize, i.e. break the sentence into its constituent words
    sentence_words = nltk.word_tokenize(sentence)
    # Stemming means reducing each word to its root form
    sentence_words = [stemmer.stem(word.lower()) for word in sentence_words]
    return sentence_words

# Return a bag-of-words array: 0 or 1 for each vocabulary word that exists in the sentence
def bow(sentence, words, show_details=False):
    sentence_words = clean_up_sentence(sentence)
    bag = [0] * len(words)
    for s in sentence_words:
        for i, w in enumerate(words):
            if w == s:
                bag[i] = 1
                if show_details:
                    print("found in bag: %s" % w)
    return np.array(bag)

ERROR_THRESHOLD = 0.25
print("ERROR_THRESHOLD = 0.25")

def classify(sentence):
    # Get the class probabilities from the model
    results = model.predict([bow(sentence, words)])[0]
    # Exclude results below the threshold
    results = [[i, r] for i, r in enumerate(results) if r > ERROR_THRESHOLD]
    # Sort so that the highest-confidence answer comes first
    results.sort(key=lambda x: x[1], reverse=True)
    return_list = []
    for r in results:
        return_list.append((classes[r[0]], r[1]))  # Tuple of (intent, probability)
    return return_list

def response(sentence, userID='123', show_details=False):
    results = classify(sentence)
    while results:
        for i in intents['intents']:
            if i['tag'] == results[0][0]:
                # Return a random response from the list of responses for the matching intent
                return random.choice(i['responses'])
        results.pop(0)
    # If no matching intent was found, return a default response
    return "Sorry, I didn't understand that."
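
# Quick sanity checks (outputs are hypothetical and depend on intents.json
# and the trained weights):
#   classify("Hi there")  ->  e.g. [('greeting', 0.97)]
#   response("Hi there")  ->  a random string from the matching intent's responses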


# In[31]:


import gradio as gr

def chat_response(message):
    return response(message)  # Return the chatbot's reply for the given message

gr.Interface(fn=chat_response, inputs="text", outputs="text").launch()
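
# launch() blocks and serves the UI locally; if a shareable public link is
# wanted, Gradio's launch(share=True) can be used instead (a standard Gradio
# option, not something the original script sets).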