# Source code for botiverse.bots.BasicBot.BasicBot

import numpy as np
import json
from gensim.utils import tokenize
import numpy as np
from botiverse.models import SVM, NeuralNet
from botiverse.preprocessors import GloVe, TF_IDF, TF_IDF_GLOVE, BoW
from nltk.stem.porter import PorterStemmer
stemmer = PorterStemmer()


[docs]class BasicBot:
    '''
    An interface for a basic chatbot model suitable for small datasets such as FAQs. Note that the
    underlying model is not sequential (either an NN or an SVM).
    '''
    def __init__(self, machine='nn', repr='tf-idf'):
        """
        Instantiate a basic chat bot model that uses a classic feedforward neural network.
        Data can be then used to train the chatbot model.
        
        :param name: The chatbot's name.
        :type name: string
        :param machine: The machine learning model to use. Either 'nn' or 'svm', else must be a model object that has appropriate fit and predict methods.
        :type machine: string
        :param repr: The representation to use. Either 'glove', 'tf-idf', or 'tf-idf-glove' or 'bow', else must be a model object that has appropriate transform_list and transform methods.
        :type repr: string
        """
        self.model = None
        self.machine = machine
        self.repr = repr
        
        if repr == 'glove': 
            self.transformer = GloVe()
        elif repr == 'tf-idf':
            self.transformer = TF_IDF()
        elif repr == 'tf-idf-glove':
            self.transformer = TF_IDF_GLOVE()
        elif repr == 'bow':
            self.transformer = BoW()
        elif type(repr) != str:
            # if machine or transform is not a string, then assume it is a model
            self.transformer = repr
        else:
            raise Exception('Representation must either be one of those the basic chatbot support or a custom one that implement the transform API. Found was ' + repr)
            
        self.tf = None
        self.idf = None
        self.classes = None
        
        

    def setup_data(self):
        """
        Internal method to setup the data for training. This method is called automatically when the train method is called.
                
        :meta private:
        """  
        all_words = []
        classes = []
        sentence_list = []                             # sentence_table[i] is a tuple (list of words, class)
        y = []
        for intent in self.raw_data:                    #this is a list of dictionaries. each has a tag (class), list of patterns and list of responses.
            tag = intent['tag']
            classes.append(tag)
            for pattern in intent['patterns']:
                if self.repr == 'tf-idf' or self.repr == 'tf-idf-glove' or self.repr == 'bow':
                    all_words += list(tokenize(pattern, to_lower=True))     
                sentence_list.append(pattern)
                y.append(tag)

        # stem and lower each word
        all_words = [stemmer.stem(word.lower()) for word in all_words if word not in ['?', '!', '.', ',']]
        
        # remove duplicates and sort alphabetically
        all_words = sorted(set(all_words))
        classes = sorted(set(classes))
        
        self.all_words = all_words
        self.classes = classes
        
        X = self.transformer.transform_list(sentence_list, all_words=all_words)

        # convert each class to its index
        for i, tag in enumerate(y):
            y[i] = classes.index(tag)
        y = np.array(y)
        return X, y
    
[docs]    def read_data(self, path):
        """
        Read the data from a JSON file found in `path` for the chatbot to train on later.
        
        :param path: The path to the JSON file
        :type number: string
        """
        with open(path, 'r') as f:
            self.raw_data = json.load(f) 

        self.X, self.y = self.setup_data()
        
[docs]    def train(self, max_epochs=None, early_stop=False, **kwargs):
        """
        Train the chatbot model with previously read data.
        
        :param max_epochs: The maximum number of epochs to train for. If None, then the number of epochs is `30 * len(self.classes)`
        :type max_epochs: int
        :param early_stop: Whether to use early stopping or not. If True, the models stops whenever the validation loss stops decreasing for 100 epochs.
        :type early_stop: bool
        :param kwargs: Any additional arguments to pass to the model's fit method.
        """
        X, y = self.X, self.y
        if self.machine == 'nn':
            self.model = NeuralNet(structure=[X.shape[1], 12, len(self.classes)], activation='sigmoid')
            max_epochs = max_epochs if max_epochs is not None else 30 * len(self.classes)
            if early_stop:
                self.model.fit(X, y, batch_size=1, epochs=max_epochs, λ = 0.02, eval_train=True, val_split=0.2, patience=100)
                self.model.fit(X, y, batch_size=1, epochs=max_epochs, λ = 0.02, eval_train=True, val_split=0.0)
            else:
                self.model.fit(X, y, batch_size=1, epochs=max_epochs, λ = 0.02, eval_train=True, val_split=0.0)
                
        elif self.machine == 'svm':
            self.model = SVM(kernel='linear', C=700)
            self.model.fit(X, y, eval_train=True)
        elif type(self.machine) != str:
                self.machine.fit(X, y, **kwargs)
        else:
            raise Exception('Machine must either be one of those the basic chatbot support or a custom one that implement the fit API. Found was ' + self.machine)


[docs]    def save(self, path):
        '''
        Save the chatbot model to a file. Not supported yet for SVM models.
        
        :param path: The path to the file
        '''
        if self.machine == 'svm':
            print("Could Not Save: SVM model is for experimentation only and does not allow saving yet.")
        else:
            if type(self.machine) != str:
                self.machine.save(path+'.bot')
            else:
                self.model.save(path+'.bot')
    
[docs]    def load(self, load_path, data_path):
        '''
        Load the model from a file. 
        
        :param load_path: The path to the file
        :type load_path: string
        :param data_path: The path to the JSON file containing the data used to train the model to sample responses from.
        :type data_path: string
        '''
        if self.machine == 'svm':
            print("Could Not Load: SVM is for experimentation only and does not allow loading yet.")
        else:
            if type(self.machine) != str:
                self.model = self.machine.load(load_path + '.bot')
            else:
                self.model = NeuralNet.load(load_path + '.bot')
            # following can be optimized.
            with open(data_path, 'r') as f:
                self.raw_data = json.load(f)
                self.classes = sorted(set([intent['tag'] for intent in self.raw_data]))
                
                # compute all words again 
                all_words = []
                for intent in self.raw_data:
                    for pattern in intent['patterns']:
                        all_words += list(tokenize(pattern, to_lower=True))
                all_words = [stemmer.stem(word.lower()) for word in all_words if word not in ['?', '!', '.', ',']]
                self.all_words = sorted(set(all_words))
                # set the transformer's all_words if needed
                if hasattr(self.transformer, 'all_words'):  self.transformer.all_words = self.all_words
                    
                
[docs]    def infer(self, prompt, confidence=None, test=False):
        """
        Infer a suitable response to the given prompt.
        
        :param prompt: The user's prompt
        :type prompt: string
        :param confidence: The minimum confidence (probability) required for the chatbot to respond. If None, then the confidence is `2/len(self.classes)`
        :type confidence: float
        :param test: Whether to return the class of the prompt instead of a response. Helpful to test on unkonwn data.
        :type test: bool
        
        :return: The chatbot's response or the class of the prompt if `test` is True.
        :rtype: string
        """
        if confidence is None: confidence = 2/len(self.classes)
        vector = self.transformer.transform(prompt) 
        # predict the class of the prompt
        tag_idx, tag_prob = self.model.predict(vector)
        tag_idx, tag_prob = tag_idx[0], tag_prob[0]
        tag = self.classes[tag_idx]
        if tag_prob < confidence: return "Sorry, I didn't get that. I'm only capable of answering questions about the following topics: " + ', '.join(self.classes)
        for intent in self.raw_data:
            if tag == intent["tag"]:
                if test: return tag
                return np.random.choice(intent['responses'])