From dc30f1a9a51f2afa3ac4157baea26a8581e997de Mon Sep 17 00:00:00 2001
From: Kumar Apurva <66004696+KUMAR-APURVA@users.noreply.github.com>
Date: Thu, 10 Jun 2021 12:05:16 +0530
Subject: [PATCH 1/4] [Ch4Nb07] Fixed path issues and version problem
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit
1. Added a try/except block to handle both Windows and Colab, and check whether the dataset is already present before downloading it.
2. Fixed the path issues.
3. Upgraded Ktrain version from ‘0.2.2’ to ‘0.26.3’
---
...Sentiment_Classification_IMDB_ktrain.ipynb | 889 ++++++++----------
1 file changed, 415 insertions(+), 474 deletions(-)
diff --git a/Ch4/07_BERT_Sentiment_Classification_IMDB_ktrain.ipynb b/Ch4/07_BERT_Sentiment_Classification_IMDB_ktrain.ipynb
index cbd8c0d..1574dfb 100644
--- a/Ch4/07_BERT_Sentiment_Classification_IMDB_ktrain.ipynb
+++ b/Ch4/07_BERT_Sentiment_Classification_IMDB_ktrain.ipynb
@@ -1,504 +1,445 @@
{
- "nbformat": 4,
- "nbformat_minor": 0,
- "metadata": {
- "colab": {
- "name": "BERT_Sentiment_Classification_IMDB.ipynb",
- "provenance": [],
- "collapsed_sections": []
- },
- "kernelspec": {
- "name": "python3",
- "display_name": "Python 3"
- },
- "accelerator": "GPU"
+ "cells": [
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "colab_type": "text",
+ "id": "ypR4NNY7oyEV"
+ },
+ "source": [
+ "#### We need to install the ktrain library. It's a lightweight wrapper for Keras that helps train neural networks. With only a few lines of code it lets you build models, estimate an optimal learning rate, load and preprocess text and image data from various sources, and much more. More about our approach can be found in [this](https://towardsdatascience.com/bert-text-classification-in-3-lines-of-code-using-keras-264db7e7a358) article."
+ ]
},
- "cells": [
- {
- "cell_type": "markdown",
- "metadata": {
- "id": "ypR4NNY7oyEV",
- "colab_type": "text"
- },
- "source": [
- "#### We need to install the ktrain library. Its a light weight wrapper for keras to help train neural networks. With only a few lines of code it allows you to build models, estimate optimal learning rate, loading and preprocessing text and image data from various sources and much more. More about our approach can be found at [this](https://towardsdatascience.com/bert-text-classification-in-3-lines-of-code-using-keras-264db7e7a358) article."
- ]
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 1000
},
+ "colab_type": "code",
+ "id": "58WB13Jx3rQm",
+ "outputId": "847a6286-f36b-4b32-a791-5ab6d625c701"
+ },
+ "outputs": [
{
- "cell_type": "code",
- "metadata": {
- "id": "58WB13Jx3rQm",
- "colab_type": "code",
- "outputId": "847a6286-f36b-4b32-a791-5ab6d625c701",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 1000
- }
- },
- "source": [
- "!pip3 install ktrain==0.2.2"
- ],
- "execution_count": 1,
- "outputs": [
- {
- "output_type": "stream",
- "text": [
- "Collecting ktrain==0.2.2\n",
- "\u001b[?25l Downloading https://files.pythonhosted.org/packages/83/ce/f8dd172bec1486c02f20cc5099055fb2e8850fc414eb7bc922f29e4e13ec/ktrain-0.2.2.tar.gz (43kB)\n",
- "\r\u001b[K |███████▋ | 10kB 26.3MB/s eta 0:00:01\r\u001b[K |███████████████▎ | 20kB 1.7MB/s eta 0:00:01\r\u001b[K |██████████████████████▉ | 30kB 2.5MB/s eta 0:00:01\r\u001b[K |██████████████████████████████▌ | 40kB 1.7MB/s eta 0:00:01\r\u001b[K |████████████████████████████████| 51kB 1.8MB/s \n",
- "\u001b[?25hRequirement already satisfied: keras>=2.2.4 in /usr/local/lib/python3.6/dist-packages (from ktrain==0.2.2) (2.2.5)\n",
- "Requirement already satisfied: scikit-learn>=0.20.0 in /usr/local/lib/python3.6/dist-packages (from ktrain==0.2.2) (0.22.1)\n",
- "Requirement already satisfied: matplotlib>=3.0.0 in /usr/local/lib/python3.6/dist-packages (from ktrain==0.2.2) (3.1.2)\n",
- "Requirement already satisfied: pandas>=0.24.2 in /usr/local/lib/python3.6/dist-packages (from ktrain==0.2.2) (0.25.3)\n",
- "Requirement already satisfied: fastprogress>=0.1.21 in /usr/local/lib/python3.6/dist-packages (from ktrain==0.2.2) (0.2.2)\n",
- "Collecting keras_bert\n",
- " Downloading https://files.pythonhosted.org/packages/2c/0f/cdc886c1018943ea62d3209bc964413d5aa9d0eb7e493abd8545be679294/keras-bert-0.81.0.tar.gz\n",
- "Requirement already satisfied: requests in /usr/local/lib/python3.6/dist-packages (from ktrain==0.2.2) (2.21.0)\n",
- "Requirement already satisfied: six>=1.9.0 in /usr/local/lib/python3.6/dist-packages (from keras>=2.2.4->ktrain==0.2.2) (1.12.0)\n",
- "Requirement already satisfied: h5py in /usr/local/lib/python3.6/dist-packages (from keras>=2.2.4->ktrain==0.2.2) (2.8.0)\n",
- "Requirement already satisfied: numpy>=1.9.1 in /usr/local/lib/python3.6/dist-packages (from keras>=2.2.4->ktrain==0.2.2) (1.17.5)\n",
- "Requirement already satisfied: keras-applications>=1.0.8 in /usr/local/lib/python3.6/dist-packages (from keras>=2.2.4->ktrain==0.2.2) (1.0.8)\n",
- "Requirement already satisfied: keras-preprocessing>=1.1.0 in /usr/local/lib/python3.6/dist-packages (from keras>=2.2.4->ktrain==0.2.2) (1.1.0)\n",
- "Requirement already satisfied: pyyaml in /usr/local/lib/python3.6/dist-packages (from keras>=2.2.4->ktrain==0.2.2) (3.13)\n",
- "Requirement already satisfied: scipy>=0.14 in /usr/local/lib/python3.6/dist-packages (from keras>=2.2.4->ktrain==0.2.2) (1.4.1)\n",
- "Requirement already satisfied: joblib>=0.11 in /usr/local/lib/python3.6/dist-packages (from scikit-learn>=0.20.0->ktrain==0.2.2) (0.14.1)\n",
- "Requirement already satisfied: kiwisolver>=1.0.1 in /usr/local/lib/python3.6/dist-packages (from matplotlib>=3.0.0->ktrain==0.2.2) (1.1.0)\n",
- "Requirement already satisfied: python-dateutil>=2.1 in /usr/local/lib/python3.6/dist-packages (from matplotlib>=3.0.0->ktrain==0.2.2) (2.6.1)\n",
- "Requirement already satisfied: pyparsing!=2.0.4,!=2.1.2,!=2.1.6,>=2.0.1 in /usr/local/lib/python3.6/dist-packages (from matplotlib>=3.0.0->ktrain==0.2.2) (2.4.6)\n",
- "Requirement already satisfied: cycler>=0.10 in /usr/local/lib/python3.6/dist-packages (from matplotlib>=3.0.0->ktrain==0.2.2) (0.10.0)\n",
- "Requirement already satisfied: pytz>=2017.2 in /usr/local/lib/python3.6/dist-packages (from pandas>=0.24.2->ktrain==0.2.2) (2018.9)\n",
- "Collecting keras-transformer>=0.30.0\n",
- " Downloading https://files.pythonhosted.org/packages/54/0c/fede535ac576c03863c44bf2e0bf051fe21f5e10103631b6b6236ae446f3/keras-transformer-0.32.0.tar.gz\n",
- "Requirement already satisfied: idna<2.9,>=2.5 in /usr/local/lib/python3.6/dist-packages (from requests->ktrain==0.2.2) (2.8)\n",
- "Requirement already satisfied: urllib3<1.25,>=1.21.1 in /usr/local/lib/python3.6/dist-packages (from requests->ktrain==0.2.2) (1.24.3)\n",
- "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.6/dist-packages (from requests->ktrain==0.2.2) (2019.11.28)\n",
- "Requirement already satisfied: chardet<3.1.0,>=3.0.2 in /usr/local/lib/python3.6/dist-packages (from requests->ktrain==0.2.2) (3.0.4)\n",
- "Requirement already satisfied: setuptools in /usr/local/lib/python3.6/dist-packages (from kiwisolver>=1.0.1->matplotlib>=3.0.0->ktrain==0.2.2) (45.1.0)\n",
- "Collecting keras-pos-embd>=0.10.0\n",
- " Downloading https://files.pythonhosted.org/packages/09/70/b63ed8fc660da2bb6ae29b9895401c628da5740c048c190b5d7107cadd02/keras-pos-embd-0.11.0.tar.gz\n",
- "Collecting keras-multi-head>=0.22.0\n",
- " Downloading https://files.pythonhosted.org/packages/40/3e/d0a64bb2ac5217928effe4507c26bbd19b86145d16a1948bc2d4f4c6338a/keras-multi-head-0.22.0.tar.gz\n",
- "Collecting keras-layer-normalization>=0.12.0\n",
- " Downloading https://files.pythonhosted.org/packages/a4/0e/d1078df0494bac9ce1a67954e5380b6e7569668f0f3b50a9531c62c1fc4a/keras-layer-normalization-0.14.0.tar.gz\n",
- "Collecting keras-position-wise-feed-forward>=0.5.0\n",
- " Downloading https://files.pythonhosted.org/packages/e3/59/f0faa1037c033059e7e9e7758e6c23b4d1c0772cd48de14c4b6fd4033ad5/keras-position-wise-feed-forward-0.6.0.tar.gz\n",
- "Collecting keras-embed-sim>=0.7.0\n",
- " Downloading https://files.pythonhosted.org/packages/bc/20/735fd53f6896e2af63af47e212601c1b8a7a80d00b6126c388c9d1233892/keras-embed-sim-0.7.0.tar.gz\n",
- "Collecting keras-self-attention==0.41.0\n",
- " Downloading https://files.pythonhosted.org/packages/1b/1c/01599219bef7266fa43b3316e4f55bcb487734d3bafdc60ffd564f3cfe29/keras-self-attention-0.41.0.tar.gz\n",
- "Building wheels for collected packages: ktrain, keras-bert, keras-transformer, keras-pos-embd, keras-multi-head, keras-layer-normalization, keras-position-wise-feed-forward, keras-embed-sim, keras-self-attention\n",
- " Building wheel for ktrain (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
- " Created wheel for ktrain: filename=ktrain-0.2.2-cp36-none-any.whl size=50418 sha256=30ac3da49ca22b1ec10c57ae08d3bab9756222409cd3463f85ef190fe66dc8d0\n",
- " Stored in directory: /root/.cache/pip/wheels/fa/21/6f/e0452e1564ccab53339b601dbd1f37ed81e34868826200e8f8\n",
- " Building wheel for keras-bert (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
- " Created wheel for keras-bert: filename=keras_bert-0.81.0-cp36-none-any.whl size=37913 sha256=180438bed7964563b41411bcd633f83794ceb0ac2817898291612600cfb39f3a\n",
- " Stored in directory: /root/.cache/pip/wheels/bd/27/da/ffc2d573aa48b87440ec4f98bc7c992e3a2d899edb2d22ef9e\n",
- " Building wheel for keras-transformer (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
- " Created wheel for keras-transformer: filename=keras_transformer-0.32.0-cp36-none-any.whl size=13266 sha256=4f32a5e7c46dec4f5dbeb040523f6c94b46048bb5eab2f85a4ee1c71b9b71206\n",
- " Stored in directory: /root/.cache/pip/wheels/62/f0/ce/82fa5d024d5ef8e263f26a50dcee23820efe245680ce9c922a\n",
- " Building wheel for keras-pos-embd (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
- " Created wheel for keras-pos-embd: filename=keras_pos_embd-0.11.0-cp36-none-any.whl size=7554 sha256=c6c8607ddbc95fc5c3c2412f94d41d2d6780d3b30004543791e9313492b2de49\n",
- " Stored in directory: /root/.cache/pip/wheels/5b/a1/a0/ce6b1d49ba1a9a76f592e70cf297b05c96bc9f418146761032\n",
- " Building wheel for keras-multi-head (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
- " Created wheel for keras-multi-head: filename=keras_multi_head-0.22.0-cp36-none-any.whl size=15371 sha256=05c6dc4ab2d005d29f310419143e25714eb6a7ffb169e008d1c18666019fcf5d\n",
- " Stored in directory: /root/.cache/pip/wheels/bb/df/3f/81b36f41b66e6a9cd69224c70a737de2bb6b2f7feb3272c25e\n",
- " Building wheel for keras-layer-normalization (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
- " Created wheel for keras-layer-normalization: filename=keras_layer_normalization-0.14.0-cp36-none-any.whl size=5268 sha256=affb377c258c1f72bd3be271eb6a578a1be567626b082c7d51c96af3c685707f\n",
- " Stored in directory: /root/.cache/pip/wheels/54/80/22/a638a7d406fd155e507aa33d703e3fa2612b9eb7bb4f4fe667\n",
- " Building wheel for keras-position-wise-feed-forward (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
- " Created wheel for keras-position-wise-feed-forward: filename=keras_position_wise_feed_forward-0.6.0-cp36-none-any.whl size=5623 sha256=794c37b5c74aa2d635f3581d8f1e82e8e4e08f9709c8b08beba747cc84d786a2\n",
- " Stored in directory: /root/.cache/pip/wheels/39/e2/e2/3514fef126a00574b13bc0b9e23891800158df3a3c19c96e3b\n",
- " Building wheel for keras-embed-sim (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
- " Created wheel for keras-embed-sim: filename=keras_embed_sim-0.7.0-cp36-none-any.whl size=4676 sha256=922770c4ee921ab176dd5e405a9a0c30a2abd4bbb9b02b313f81308d1c00cd3f\n",
- " Stored in directory: /root/.cache/pip/wheels/d1/bc/b1/b0c45cee4ca2e6c86586b0218ffafe7f0703c6d07fdf049866\n",
- " Building wheel for keras-self-attention (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
- " Created wheel for keras-self-attention: filename=keras_self_attention-0.41.0-cp36-none-any.whl size=17288 sha256=1ad03d750cc19684d453b79f17fcc64565051904d5c87d91d0c17fb6a9bbced4\n",
- " Stored in directory: /root/.cache/pip/wheels/cc/dc/17/84258b27a04cd38ac91998abe148203720ca696186635db694\n",
- "Successfully built ktrain keras-bert keras-transformer keras-pos-embd keras-multi-head keras-layer-normalization keras-position-wise-feed-forward keras-embed-sim keras-self-attention\n",
- "Installing collected packages: keras-pos-embd, keras-self-attention, keras-multi-head, keras-layer-normalization, keras-position-wise-feed-forward, keras-embed-sim, keras-transformer, keras-bert, ktrain\n",
- "Successfully installed keras-bert-0.81.0 keras-embed-sim-0.7.0 keras-layer-normalization-0.14.0 keras-multi-head-0.22.0 keras-pos-embd-0.11.0 keras-position-wise-feed-forward-0.6.0 keras-self-attention-0.41.0 keras-transformer-0.32.0 ktrain-0.2.2\n"
- ],
- "name": "stdout"
- }
- ]
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Requirement already satisfied: ktrain==0.26.3 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (0.26.3)\n",
+ "Requirement already satisfied: ipython in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (7.16.1)\n",
+ "Requirement already satisfied: keras-bert>=0.86.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (0.86.0)\n",
+ "Requirement already satisfied: joblib in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (1.0.1)\n",
+ "Requirement already satisfied: requests in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (2.25.1)\n",
+ "Collecting seqeval==0.0.19\n",
+ " Using cached seqeval-0.0.19-py3-none-any.whl\n",
+ "Requirement already satisfied: cchardet in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (2.1.7)\n",
+ "Requirement already satisfied: pandas>=1.0.1 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (1.1.5)\n",
+ "Requirement already satisfied: jieba in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (0.42.1)\n",
+ "Requirement already satisfied: sentencepiece in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (0.1.95)\n",
+ "Requirement already satisfied: langdetect in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (1.0.9)\n",
+ "Requirement already satisfied: packaging in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (20.9)\n",
+ "Requirement already satisfied: networkx>=2.3 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (2.5.1)\n",
+ "Requirement already satisfied: syntok in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (1.3.1)\n",
+ "Requirement already satisfied: scikit-learn==0.23.2 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (0.23.2)\n",
+ "Requirement already satisfied: matplotlib>=3.0.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (3.3.4)\n",
+ "Requirement already satisfied: transformers<=4.3.3,>=4.0.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (4.3.3)\n",
+ "Requirement already satisfied: fastprogress>=0.1.21 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (1.0.0)\n",
+ "Requirement already satisfied: whoosh in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ktrain==0.26.3) (2.7.4)\n",
+ "Requirement already satisfied: numpy>=1.13.3 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from scikit-learn==0.23.2->ktrain==0.26.3) (1.19.5)\n",
+ "Requirement already satisfied: scipy>=0.19.1 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from scikit-learn==0.23.2->ktrain==0.26.3) (1.4.1)\n",
+ "Requirement already satisfied: threadpoolctl>=2.0.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from scikit-learn==0.23.2->ktrain==0.26.3) (2.1.0)\n",
+ "Requirement already satisfied: Keras>=2.2.4 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from seqeval==0.0.19->ktrain==0.26.3) (2.4.3)\n",
+ "Requirement already satisfied: pyyaml in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from Keras>=2.2.4->seqeval==0.0.19->ktrain==0.26.3) (5.4.1)\n",
+ "Requirement already satisfied: h5py in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from Keras>=2.2.4->seqeval==0.0.19->ktrain==0.26.3) (2.10.0)\n",
+ "Requirement already satisfied: keras-transformer>=0.38.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from keras-bert>=0.86.0->ktrain==0.26.3) (0.38.0)\n",
+ "Requirement already satisfied: keras-pos-embd>=0.11.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from keras-transformer>=0.38.0->keras-bert>=0.86.0->ktrain==0.26.3) (0.11.0)\n",
+ "Requirement already satisfied: keras-layer-normalization>=0.14.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from keras-transformer>=0.38.0->keras-bert>=0.86.0->ktrain==0.26.3) (0.14.0)\n",
+ "Requirement already satisfied: keras-position-wise-feed-forward>=0.6.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from keras-transformer>=0.38.0->keras-bert>=0.86.0->ktrain==0.26.3) (0.6.0)\n",
+ "Requirement already satisfied: keras-embed-sim>=0.8.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from keras-transformer>=0.38.0->keras-bert>=0.86.0->ktrain==0.26.3) (0.8.0)\n",
+ "Requirement already satisfied: keras-multi-head>=0.27.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from keras-transformer>=0.38.0->keras-bert>=0.86.0->ktrain==0.26.3) (0.27.0)\n",
+ "Requirement already satisfied: keras-self-attention==0.46.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from keras-multi-head>=0.27.0->keras-transformer>=0.38.0->keras-bert>=0.86.0->ktrain==0.26.3) (0.46.0)\n",
+ "Requirement already satisfied: pyparsing!=2.0.4,!=2.1.2,!=2.1.6,>=2.0.3 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from matplotlib>=3.0.0->ktrain==0.26.3) (2.4.7)\n",
+ "Requirement already satisfied: kiwisolver>=1.0.1 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from matplotlib>=3.0.0->ktrain==0.26.3) (1.3.1)\n",
+ "Requirement already satisfied: python-dateutil>=2.1 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from matplotlib>=3.0.0->ktrain==0.26.3) (2.8.1)\n",
+ "Requirement already satisfied: cycler>=0.10 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from matplotlib>=3.0.0->ktrain==0.26.3) (0.10.0)\n",
+ "Requirement already satisfied: pillow>=6.2.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from matplotlib>=3.0.0->ktrain==0.26.3) (8.2.0)\n",
+ "Requirement already satisfied: six in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from cycler>=0.10->matplotlib>=3.0.0->ktrain==0.26.3) (1.15.0)\n",
+ "Requirement already satisfied: decorator<5,>=4.3 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from networkx>=2.3->ktrain==0.26.3) (4.4.2)\n",
+ "Requirement already satisfied: pytz>=2017.2 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from pandas>=1.0.1->ktrain==0.26.3) (2021.1)\n",
+ "Requirement already satisfied: dataclasses in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from transformers<=4.3.3,>=4.0.0->ktrain==0.26.3) (0.8)\n",
+ "Requirement already satisfied: importlib-metadata in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from transformers<=4.3.3,>=4.0.0->ktrain==0.26.3) (4.4.0)\n",
+ "Requirement already satisfied: tokenizers<0.11,>=0.10.1 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from transformers<=4.3.3,>=4.0.0->ktrain==0.26.3) (0.10.3)\n",
+ "Requirement already satisfied: regex!=2019.12.17 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from transformers<=4.3.3,>=4.0.0->ktrain==0.26.3) (2021.4.4)\n",
+ "Requirement already satisfied: tqdm>=4.27 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from transformers<=4.3.3,>=4.0.0->ktrain==0.26.3) (4.61.0)\n",
+ "Requirement already satisfied: filelock in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from transformers<=4.3.3,>=4.0.0->ktrain==0.26.3) (3.0.12)\n",
+ "Requirement already satisfied: sacremoses in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from transformers<=4.3.3,>=4.0.0->ktrain==0.26.3) (0.0.45)\n",
+ "Requirement already satisfied: zipp>=0.5 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from importlib-metadata->transformers<=4.3.3,>=4.0.0->ktrain==0.26.3) (3.4.1)\n",
+ "Requirement already satisfied: typing-extensions>=3.6.4 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from importlib-metadata->transformers<=4.3.3,>=4.0.0->ktrain==0.26.3) (3.7.4.3)\n",
+ "Requirement already satisfied: pygments in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ipython->ktrain==0.26.3) (2.9.0)\n",
+ "Requirement already satisfied: setuptools>=18.5 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ipython->ktrain==0.26.3) (52.0.0.post20210125)\n",
+ "Requirement already satisfied: traitlets>=4.2 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ipython->ktrain==0.26.3) (4.3.3)\n",
+ "Requirement already satisfied: jedi>=0.10 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ipython->ktrain==0.26.3) (0.17.0)\n",
+ "Requirement already satisfied: pickleshare in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ipython->ktrain==0.26.3) (0.7.5)"
+ ]
},
{
- "cell_type": "code",
- "metadata": {
- "id": "KN6N85ah8VXf",
- "colab_type": "code",
- "outputId": "6e97b40b-ea0d-4eb1-9562-8862c525c0f3",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 82
- }
- },
- "source": [
- "#Importing\n",
- "import ktrain\n",
- "from ktrain import text"
- ],
- "execution_count": 2,
- "outputs": [
- {
- "output_type": "stream",
- "text": [
- "Using TensorFlow backend.\n"
- ],
- "name": "stderr"
- },
- {
- "output_type": "display_data",
- "data": {
- "text/html": [
- "
\n",
- "The default version of TensorFlow in Colab will soon switch to TensorFlow 2.x. \n",
- "We recommend you upgrade now \n",
- "or ensure your notebook will continue to use TensorFlow 1.x via the %tensorflow_version 1.x magic:\n",
- "more info.
\n"
- ],
- "text/plain": [
- ""
- ]
- },
- "metadata": {
- "tags": []
- }
- }
- ]
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "WARNING: Ignoring invalid distribution -pype1 (c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages)\n",
+ "WARNING: Ignoring invalid distribution -pype1 (c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages)\n",
+ "WARNING: Ignoring invalid distribution -pype1 (c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages)\n",
+ " WARNING: Ignoring invalid distribution -pype1 (c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages)\n",
+ "WARNING: Ignoring invalid distribution -pype1 (c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages)\n",
+ "WARNING: Ignoring invalid distribution -pype1 (c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages)\n",
+ "WARNING: Ignoring invalid distribution -pype1 (c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages)\n",
+ "WARNING: Ignoring invalid distribution -pype1 (c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages)\n"
+ ]
},
{
- "cell_type": "code",
- "metadata": {
- "id": "Mr1YXudk8Vti",
- "colab_type": "code",
- "outputId": "8b08004e-329e-4eb8-a21e-e4dae409fc3e",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 52
- }
- },
- "source": [
- "#obtain the dataset\n",
- "import tensorflow as tf\n",
- "dataset = tf.keras.utils.get_file(\n",
- " fname=\"aclImdb.tar.gz\", \n",
- " origin=\"http://ai.stanford.edu/~amaas/data/sentiment/aclImdb_v1.tar.gz\", \n",
- " extract=True,\n",
- ")"
- ],
- "execution_count": 3,
- "outputs": [
- {
- "output_type": "stream",
- "text": [
- "Downloading data from http://ai.stanford.edu/~amaas/data/sentiment/aclImdb_v1.tar.gz\n",
- "84131840/84125825 [==============================] - 4s 0us/step\n"
- ],
- "name": "stdout"
- }
- ]
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "\n",
+ "Requirement already satisfied: colorama in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ipython->ktrain==0.26.3) (0.4.4)\n",
+ "Requirement already satisfied: backcall in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ipython->ktrain==0.26.3) (0.2.0)\n",
+ "Requirement already satisfied: prompt-toolkit!=3.0.0,!=3.0.1,<3.1.0,>=2.0.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from ipython->ktrain==0.26.3) (3.0.17)\n",
+ "Requirement already satisfied: parso>=0.7.0 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from jedi>=0.10->ipython->ktrain==0.26.3) (0.8.2)\n",
+ "Requirement already satisfied: wcwidth in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from prompt-toolkit!=3.0.0,!=3.0.1,<3.1.0,>=2.0.0->ipython->ktrain==0.26.3) (0.2.5)\n",
+ "Requirement already satisfied: ipython-genutils in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from traitlets>=4.2->ipython->ktrain==0.26.3) (0.2.0)\n",
+ "Requirement already satisfied: idna<3,>=2.5 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from requests->ktrain==0.26.3) (2.10)\n",
+ "Requirement already satisfied: certifi>=2017.4.17 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from requests->ktrain==0.26.3) (2020.12.5)\n",
+ "Requirement already satisfied: urllib3<1.27,>=1.21.1 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from requests->ktrain==0.26.3) (1.26.5)\n",
+ "Requirement already satisfied: chardet<5,>=3.0.2 in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from requests->ktrain==0.26.3) (4.0.0)\n",
+ "Requirement already satisfied: click in c:\\users\\kumar apurv\\anaconda3\\envs\\ml\\lib\\site-packages (from sacremoses->transformers<=4.3.3,>=4.0.0->ktrain==0.26.3) (7.1.2)\n",
+ "Installing collected packages: seqeval\n",
+ " Attempting uninstall: seqeval\n",
+ " Found existing installation: seqeval 0.0.12\n",
+ " Uninstalling seqeval-0.0.12:\n",
+ " Successfully uninstalled seqeval-0.0.12\n",
+ "Successfully installed seqeval-0.0.19\n"
+ ]
+ }
+ ],
+ "source": [
+ "%pip install ktrain==0.26.3\n",
+ "# NOTE: use TensorFlow 2.4.0 with this ktrain version (install it separately if it is not already present)."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 82
},
- {
- "cell_type": "code",
- "metadata": {
- "id": "2x46reXu9Kru",
- "colab_type": "code",
- "outputId": "f1ca7357-d740-492d-e482-76c8901eb04f",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 52
- }
- },
- "source": [
- "%cd /root/.keras/datasets/aclImdb\n",
- "!ls"
- ],
- "execution_count": 4,
- "outputs": [
- {
- "output_type": "stream",
- "text": [
- "/root/.keras/datasets/aclImdb\n",
- "imdbEr.txt imdb.vocab\tREADME\ttest train\n"
- ],
- "name": "stdout"
- }
- ]
+ "colab_type": "code",
+ "id": "KN6N85ah8VXf",
+ "outputId": "6e97b40b-ea0d-4eb1-9562-8862c525c0f3"
+ },
+ "outputs": [],
+ "source": [
+ "#Importing\n",
+ "import ktrain\n",
+ "from ktrain import text"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 52
},
+ "colab_type": "code",
+ "id": "Mr1YXudk8Vti",
+ "outputId": "8b08004e-329e-4eb8-a21e-e4dae409fc3e"
+ },
+ "outputs": [
{
- "cell_type": "code",
- "metadata": {
- "id": "qnXQ-lcL8d6O",
- "colab_type": "code",
- "outputId": "4a790d12-399d-415f-d643-75e55038ea69",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 35
- }
- },
- "source": [
- "# set path to dataset\n",
- "import os.path\n",
- "dataset = '/root/.keras/datasets/aclImdb'\n",
- "IMDB_DATADIR = os.path.join(os.path.dirname(dataset), 'aclImdb')\n",
- "print(IMDB_DATADIR)"
- ],
- "execution_count": 5,
- "outputs": [
- {
- "output_type": "stream",
- "text": [
- "/root/.keras/datasets/aclImdb\n"
- ],
- "name": "stdout"
- }
- ]
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Downloading data from http://ai.stanford.edu/~amaas/data/sentiment/aclImdb_v1.tar.gz\n",
+ "84131840/84125825 [==============================] - 4s 0us/step\n"
+ ]
+ }
+ ],
+ "source": [
+ "# Obtain the IMDB dataset.\n",
+ "# Reuse a local copy under ./Data/aclImdb when one exists; otherwise download\n",
+ "# the archive and let Keras extract it into its cache directory.\n",
+ "# Either way, IMDB_DATADIR ends up pointing at the extracted aclImdb folder.\n",
+ "import os\n",
+ "\n",
+ "# os.path.join keeps the path portable across Windows, Linux and Colab\n",
+ "# (no hardcoded path separators).\n",
+ "LOCAL_IMDB_DIR = os.path.join(os.getcwd(), \"Data\", \"aclImdb\")\n",
+ "\n",
+ "if os.path.exists(LOCAL_IMDB_DIR):\n",
+ "    # set path to dataset\n",
+ "    IMDB_DATADIR = LOCAL_IMDB_DIR\n",
+ "else:\n",
+ "    # Imported lazily: only needed when the dataset has to be downloaded.\n",
+ "    import tensorflow as tf\n",
+ "\n",
+ "    dataset = tf.keras.utils.get_file(\n",
+ "        fname=\"aclImdb.tar.gz\",\n",
+ "        origin=\"http://ai.stanford.edu/~amaas/data/sentiment/aclImdb_v1.tar.gz\",\n",
+ "        extract=True,\n",
+ "    )\n",
+ "\n",
+ "    # set path to dataset: the archive is extracted next to the downloaded\n",
+ "    # file (the Keras cache directory), not into the current working directory.\n",
+ "    IMDB_DATADIR = os.path.join(os.path.dirname(dataset), \"aclImdb\")"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "colab_type": "text",
+ "id": "ugopbOABrmne"
+ },
+ "source": [
+ "## STEP 1: Preprocessing\n",
+ "#### The `texts_from_folder` function will load the training and validation data from the specified folder and automatically preprocess it according to BERT's requirements. In doing so, the BERT model and vocabulary will be automatically downloaded."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 228
},
+ "colab_type": "code",
+ "id": "jELdxonN9J8v",
+ "outputId": "d32f97a7-e69f-465b-d1e5-bfef9ee204f5"
+ },
+ "outputs": [
{
- "cell_type": "markdown",
- "metadata": {
- "id": "ugopbOABrmne",
- "colab_type": "text"
- },
- "source": [
- "## STEP 1: Preprocessing\n",
- "####The texts_from_folder function will load the training and validation data from the specified folder and automatically preprocess it according to BERT's requirements. In doing so, the BERT model and vocabulary will be automatically downloaded."
- ]
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "downloading pretrained BERT model and vocabulary...\n",
+ "[██████████████████████████████████████████████████]\n",
+ "extracting pretrained BERT model and vocabulary...\n",
+ "done.\n",
+ "\n",
+ "cleanup downloaded zip...\n",
+ "done.\n",
+ "\n",
+ "preprocessing train...\n"
+ ]
},
{
- "cell_type": "code",
- "metadata": {
- "id": "jELdxonN9J8v",
- "colab_type": "code",
- "outputId": "d32f97a7-e69f-465b-d1e5-bfef9ee204f5",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 228
- }
- },
- "source": [
- "\n",
- "\n",
- "(x_train, y_train), (x_test, y_test), preproc = text.texts_from_folder(IMDB_DATADIR, \n",
- " maxlen=500, \n",
- " preprocess_mode='bert',\n",
- " train_test_names=['train', \n",
- " 'test'],\n",
- " classes=['pos', 'neg'])"
+ "data": {
+ "text/html": [
+ "done."
],
- "execution_count": 6,
- "outputs": [
- {
- "output_type": "stream",
- "text": [
- "downloading pretrained BERT model and vocabulary...\n",
- "[██████████████████████████████████████████████████]\n",
- "extracting pretrained BERT model and vocabulary...\n",
- "done.\n",
- "\n",
- "cleanup downloaded zip...\n",
- "done.\n",
- "\n",
- "preprocessing train...\n"
- ],
- "name": "stdout"
- },
- {
- "output_type": "display_data",
- "data": {
- "text/html": [
- "done."
- ],
- "text/plain": [
- ""
- ]
- },
- "metadata": {
- "tags": []
- }
- },
- {
- "output_type": "stream",
- "text": [
- "preprocessing test...\n"
- ],
- "name": "stdout"
- },
- {
- "output_type": "display_data",
- "data": {
- "text/html": [
- "done."
- ],
- "text/plain": [
- ""
- ]
- },
- "metadata": {
- "tags": []
- }
- }
+ "text/plain": [
+ ""
]
+ },
+ "metadata": {
+ "tags": []
+ },
+ "output_type": "display_data"
},
{
- "cell_type": "markdown",
- "metadata": {
- "id": "a0SIaqHcslLZ",
- "colab_type": "text"
- },
- "source": [
- "### STEP 2: Loading a pre trained BERT and wrapping it in a ktrain.learner object"
- ]
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "preprocessing test...\n"
+ ]
},
{
- "cell_type": "code",
- "metadata": {
- "id": "90ftQ6MgAJy4",
- "colab_type": "code",
- "outputId": "a1c715b8-5d54-4405-c5e9-b7bcb042a131",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 606
- }
- },
- "source": [
- "\n",
- "model = text.text_classifier('bert', (x_train, y_train), preproc=preproc)\n",
- "learner = ktrain.get_learner(model,train_data=(x_train, y_train), val_data=(x_test, y_test), batch_size=6)"
+ "data": {
+ "text/html": [
+ "done."
],
- "execution_count": 7,
- "outputs": [
- {
- "output_type": "stream",
- "text": [
- "Is Multi-Label? False\n",
- "maxlen is 500\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:541: The name tf.placeholder is deprecated. Please use tf.compat.v1.placeholder instead.\n",
- "\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:4432: The name tf.random_uniform is deprecated. Please use tf.random.uniform instead.\n",
- "\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:66: The name tf.get_default_graph is deprecated. Please use tf.compat.v1.get_default_graph instead.\n",
- "\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:148: The name tf.placeholder_with_default is deprecated. Please use tf.compat.v1.placeholder_with_default instead.\n",
- "\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:3733: calling dropout (from tensorflow.python.ops.nn_ops) with keep_prob is deprecated and will be removed in a future version.\n",
- "Instructions for updating:\n",
- "Please use `rate` instead of `keep_prob`. Rate should be set to `rate = 1 - keep_prob`.\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:4479: The name tf.truncated_normal is deprecated. Please use tf.random.truncated_normal instead.\n",
- "\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:190: The name tf.get_default_session is deprecated. Please use tf.compat.v1.get_default_session instead.\n",
- "\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:197: The name tf.ConfigProto is deprecated. Please use tf.compat.v1.ConfigProto instead.\n",
- "\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:203: The name tf.Session is deprecated. Please use tf.compat.v1.Session instead.\n",
- "\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:207: The name tf.global_variables is deprecated. Please use tf.compat.v1.global_variables instead.\n",
- "\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:216: The name tf.is_variable_initialized is deprecated. Please use tf.compat.v1.is_variable_initialized instead.\n",
- "\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:223: The name tf.variables_initializer is deprecated. Please use tf.compat.v1.variables_initializer instead.\n",
- "\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/optimizers.py:793: The name tf.train.Optimizer is deprecated. Please use tf.compat.v1.train.Optimizer instead.\n",
- "\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:3576: The name tf.log is deprecated. Please use tf.math.log instead.\n",
- "\n",
- "done.\n"
- ],
- "name": "stdout"
- }
- ]
- },
- {
- "cell_type": "markdown",
- "metadata": {
- "id": "nN6zWQgys0c_",
- "colab_type": "text"
- },
- "source": [
- "### STEP 3: Training and Tuning the model's parameters"
+ "text/plain": [
+ ""
]
+ },
+ "metadata": {
+ "tags": []
+ },
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "(x_train, y_train), (x_test, y_test), preproc = text.texts_from_folder(IMDB_DATADIR, \n",
+ " maxlen=500, \n",
+ " preprocess_mode='bert',\n",
+ " train_test_names=['train', \n",
+ " 'test'],\n",
+ " classes=['pos', 'neg'])"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "colab_type": "text",
+ "id": "a0SIaqHcslLZ"
+ },
+ "source": [
+ "### STEP 2: Loading a pre-trained BERT model and wrapping it in a ktrain.learner object"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 7,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 606
},
+ "colab_type": "code",
+ "id": "90ftQ6MgAJy4",
+ "outputId": "a1c715b8-5d54-4405-c5e9-b7bcb042a131"
+ },
+ "outputs": [
{
- "cell_type": "code",
- "metadata": {
- "id": "Fxdw88YjAfvF",
- "colab_type": "code",
- "outputId": "663b6e29-8bd0-4fed-cbf6-c8cc361b5244",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 392
- }
- },
- "source": [
- "learner.fit_onecycle(2e-5, 4)"
- ],
- "execution_count": 8,
- "outputs": [
- {
- "output_type": "stream",
- "text": [
- "\n",
- "\n",
- "begin training using onecycle policy with max lr of 2e-05...\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/tensorflow_core/python/ops/math_grad.py:1424: where (from tensorflow.python.ops.array_ops) is deprecated and will be removed in a future version.\n",
- "Instructions for updating:\n",
- "Use tf.where in 2.0, which has the same broadcast rule as np.where\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:1033: The name tf.assign_add is deprecated. Please use tf.compat.v1.assign_add instead.\n",
- "\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:1020: The name tf.assign is deprecated. Please use tf.compat.v1.assign instead.\n",
- "\n",
- "Train on 25000 samples, validate on 25000 samples\n",
- "Epoch 1/4\n",
- "25000/25000 [==============================] - 4557s 182ms/step - loss: 0.2551 - acc: 0.8944 - val_loss: 0.1694 - val_acc: 0.9342\n",
- "Epoch 2/4\n",
- "25000/25000 [==============================] - 4545s 182ms/step - loss: 0.1607 - acc: 0.9419 - val_loss: 0.1692 - val_acc: 0.9362\n",
- "Epoch 3/4\n",
- "25000/25000 [==============================] - 4545s 182ms/step - loss: 0.0875 - acc: 0.9706 - val_loss: 0.1860 - val_acc: 0.9378\n",
- "Epoch 4/4\n",
- "25000/25000 [==============================] - 4543s 182ms/step - loss: 0.0242 - acc: 0.9932 - val_loss: 0.2394 - val_acc: 0.9385\n"
- ],
- "name": "stdout"
- },
- {
- "output_type": "execute_result",
- "data": {
- "text/plain": [
- ""
- ]
- },
- "metadata": {
- "tags": []
- },
- "execution_count": 8
- }
- ]
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Is Multi-Label? False\n",
+ "maxlen is 500\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:541: The name tf.placeholder is deprecated. Please use tf.compat.v1.placeholder instead.\n",
+ "\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:4432: The name tf.random_uniform is deprecated. Please use tf.random.uniform instead.\n",
+ "\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:66: The name tf.get_default_graph is deprecated. Please use tf.compat.v1.get_default_graph instead.\n",
+ "\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:148: The name tf.placeholder_with_default is deprecated. Please use tf.compat.v1.placeholder_with_default instead.\n",
+ "\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:3733: calling dropout (from tensorflow.python.ops.nn_ops) with keep_prob is deprecated and will be removed in a future version.\n",
+ "Instructions for updating:\n",
+ "Please use `rate` instead of `keep_prob`. Rate should be set to `rate = 1 - keep_prob`.\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:4479: The name tf.truncated_normal is deprecated. Please use tf.random.truncated_normal instead.\n",
+ "\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:190: The name tf.get_default_session is deprecated. Please use tf.compat.v1.get_default_session instead.\n",
+ "\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:197: The name tf.ConfigProto is deprecated. Please use tf.compat.v1.ConfigProto instead.\n",
+ "\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:203: The name tf.Session is deprecated. Please use tf.compat.v1.Session instead.\n",
+ "\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:207: The name tf.global_variables is deprecated. Please use tf.compat.v1.global_variables instead.\n",
+ "\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:216: The name tf.is_variable_initialized is deprecated. Please use tf.compat.v1.is_variable_initialized instead.\n",
+ "\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:223: The name tf.variables_initializer is deprecated. Please use tf.compat.v1.variables_initializer instead.\n",
+ "\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/optimizers.py:793: The name tf.train.Optimizer is deprecated. Please use tf.compat.v1.train.Optimizer instead.\n",
+ "\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:3576: The name tf.log is deprecated. Please use tf.math.log instead.\n",
+ "\n",
+ "done.\n"
+ ]
+ }
+ ],
+ "source": [
+ "model = text.text_classifier('bert', (x_train, y_train), preproc=preproc)\n",
+ "learner = ktrain.get_learner(model,train_data=(x_train, y_train), val_data=(x_test, y_test), batch_size=6)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "colab_type": "text",
+ "id": "nN6zWQgys0c_"
+ },
+ "source": [
+ "### STEP 3: Training and Tuning the model's parameters"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 8,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 392
},
+ "colab_type": "code",
+ "id": "Fxdw88YjAfvF",
+ "outputId": "663b6e29-8bd0-4fed-cbf6-c8cc361b5244"
+ },
+ "outputs": [
{
- "cell_type": "code",
- "metadata": {
- "id": "ihOn7ztsAnaL",
- "colab_type": "code",
- "colab": {}
- },
- "source": [
- ""
- ],
- "execution_count": 0,
- "outputs": []
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "\n",
+ "\n",
+ "begin training using onecycle policy with max lr of 2e-05...\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/tensorflow_core/python/ops/math_grad.py:1424: where (from tensorflow.python.ops.array_ops) is deprecated and will be removed in a future version.\n",
+ "Instructions for updating:\n",
+ "Use tf.where in 2.0, which has the same broadcast rule as np.where\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:1033: The name tf.assign_add is deprecated. Please use tf.compat.v1.assign_add instead.\n",
+ "\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:1020: The name tf.assign is deprecated. Please use tf.compat.v1.assign instead.\n",
+ "\n",
+ "Train on 25000 samples, validate on 25000 samples\n",
+ "Epoch 1/4\n",
+ "25000/25000 [==============================] - 4557s 182ms/step - loss: 0.2551 - acc: 0.8944 - val_loss: 0.1694 - val_acc: 0.9342\n",
+ "Epoch 2/4\n",
+ "25000/25000 [==============================] - 4545s 182ms/step - loss: 0.1607 - acc: 0.9419 - val_loss: 0.1692 - val_acc: 0.9362\n",
+ "Epoch 3/4\n",
+ "25000/25000 [==============================] - 4545s 182ms/step - loss: 0.0875 - acc: 0.9706 - val_loss: 0.1860 - val_acc: 0.9378\n",
+ "Epoch 4/4\n",
+ "25000/25000 [==============================] - 4543s 182ms/step - loss: 0.0242 - acc: 0.9932 - val_loss: 0.2394 - val_acc: 0.9385\n"
+ ]
},
{
- "cell_type": "code",
- "metadata": {
- "id": "mPVhsfj3TwHf",
- "colab_type": "code",
- "colab": {}
- },
- "source": [
- ""
- ],
- "execution_count": 0,
- "outputs": []
+ "data": {
+ "text/plain": [
+ ""
+ ]
+ },
+ "execution_count": 8,
+ "metadata": {
+ "tags": []
+ },
+ "output_type": "execute_result"
}
- ]
-}
\ No newline at end of file
+ ],
+ "source": [
+ "learner.fit_onecycle(2e-5, 4)"
+ ]
+ }
+ ],
+ "metadata": {
+ "accelerator": "GPU",
+ "colab": {
+ "collapsed_sections": [],
+ "name": "BERT_Sentiment_Classification_IMDB.ipynb",
+ "provenance": []
+ },
+ "kernelspec": {
+ "display_name": "Python 3",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.6.13"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 1
+}
From 15a90ef58c6048032c423501abb4e2641f52342e Mon Sep 17 00:00:00 2001
From: jatinpapreja <47968703+jatinpapreja@users.noreply.github.com>
Date: Thu, 10 Jun 2021 12:35:50 +0530
Subject: [PATCH 2/4] [Ch4Nb09] Fixed some errors and path issues
1. Updated tensorflow from '1.14.0' to '2.4.0'.
2. Replaced 'tf.gfile.GFile' with 'tf.io.gfile.GFile'.
3. Changed 'from keras.utils import to_categorical' to 'from keras.utils.np_utils import to_categorical'.
4. Added try block for windows and colab users and specified the path for downloading files for windows users.
---
Ch4/09_Lime_RNN.ipynb | 1096 +++++++++++++++++++----------------------
1 file changed, 515 insertions(+), 581 deletions(-)
diff --git a/Ch4/09_Lime_RNN.ipynb b/Ch4/09_Lime_RNN.ipynb
index 5b5ab24..b95992a 100644
--- a/Ch4/09_Lime_RNN.ipynb
+++ b/Ch4/09_Lime_RNN.ipynb
@@ -1,606 +1,540 @@
{
- "nbformat": 4,
- "nbformat_minor": 0,
- "metadata": {
+ "cells": [
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "colab_type": "text",
+ "id": "hjoUGDuyTdh5"
+ },
+ "source": [
+ "In this notebook we will demonstrate how to interpret a Deep Learning Model using [LIME](https://github.com/marcotcr/lime) (Local Interpretable Model-agnostic Explanations), a Python package for explaining machine learning classifiers. "
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "metadata": {
"colab": {
- "name": "Lime_RNN.ipynb",
- "provenance": []
- },
- "kernelspec": {
- "name": "python3",
- "display_name": "Python 3"
+ "base_uri": "https://localhost:8080/",
+ "height": 680
},
- "accelerator": "GPU"
+ "colab_type": "code",
+ "id": "qiGdNSat-V2i",
+ "outputId": "0cfc1f68-7585-4454-be5f-96647c677020"
+ },
+ "outputs": [],
+ "source": [
+ "!pip install tensorflow==2.4.0"
+ ]
},
- "cells": [
- {
- "cell_type": "markdown",
- "metadata": {
- "id": "hjoUGDuyTdh5",
- "colab_type": "text"
- },
- "source": [
- "In this notebook we will demonstrate how to interpret a Deep Learning Model using [LIME](https://github.com/marcotcr/lime)(local interpretable model-agnostic explanations), a python package for explaining machine learning classifiers. "
- ]
- },
- {
- "cell_type": "code",
- "metadata": {
- "id": "qiGdNSat-V2i",
- "colab_type": "code",
- "outputId": "0cfc1f68-7585-4454-be5f-96647c677020",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 680
- }
- },
- "source": [
- "!pip install tensorflow==1.14.0"
- ],
- "execution_count": 0,
- "outputs": [
- {
- "output_type": "stream",
- "text": [
- "Collecting tensorflow==1.14.0\n",
- "\u001b[?25l Downloading https://files.pythonhosted.org/packages/de/f0/96fb2e0412ae9692dbf400e5b04432885f677ad6241c088ccc5fe7724d69/tensorflow-1.14.0-cp36-cp36m-manylinux1_x86_64.whl (109.2MB)\n",
- "\u001b[K |████████████████████████████████| 109.2MB 89kB/s \n",
- "\u001b[?25hRequirement already satisfied: protobuf>=3.6.1 in /usr/local/lib/python3.6/dist-packages (from tensorflow==1.14.0) (3.10.0)\n",
- "Requirement already satisfied: gast>=0.2.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow==1.14.0) (0.3.3)\n",
- "Requirement already satisfied: google-pasta>=0.1.6 in /usr/local/lib/python3.6/dist-packages (from tensorflow==1.14.0) (0.2.0)\n",
- "Requirement already satisfied: astor>=0.6.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow==1.14.0) (0.8.1)\n",
- "Requirement already satisfied: numpy<2.0,>=1.14.5 in /usr/local/lib/python3.6/dist-packages (from tensorflow==1.14.0) (1.18.4)\n",
- "Collecting tensorboard<1.15.0,>=1.14.0\n",
- "\u001b[?25l Downloading https://files.pythonhosted.org/packages/91/2d/2ed263449a078cd9c8a9ba50ebd50123adf1f8cfbea1492f9084169b89d9/tensorboard-1.14.0-py3-none-any.whl (3.1MB)\n",
- "\u001b[K |████████████████████████████████| 3.2MB 36.5MB/s \n",
- "\u001b[?25hRequirement already satisfied: absl-py>=0.7.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow==1.14.0) (0.9.0)\n",
- "Requirement already satisfied: grpcio>=1.8.6 in /usr/local/lib/python3.6/dist-packages (from tensorflow==1.14.0) (1.28.1)\n",
- "Requirement already satisfied: six>=1.10.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow==1.14.0) (1.12.0)\n",
- "Requirement already satisfied: termcolor>=1.1.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow==1.14.0) (1.1.0)\n",
- "Requirement already satisfied: wrapt>=1.11.1 in /usr/local/lib/python3.6/dist-packages (from tensorflow==1.14.0) (1.12.1)\n",
- "Requirement already satisfied: wheel>=0.26 in /usr/local/lib/python3.6/dist-packages (from tensorflow==1.14.0) (0.34.2)\n",
- "Collecting tensorflow-estimator<1.15.0rc0,>=1.14.0rc0\n",
- "\u001b[?25l Downloading https://files.pythonhosted.org/packages/3c/d5/21860a5b11caf0678fbc8319341b0ae21a07156911132e0e71bffed0510d/tensorflow_estimator-1.14.0-py2.py3-none-any.whl (488kB)\n",
- "\u001b[K |████████████████████████████████| 491kB 33.6MB/s \n",
- "\u001b[?25hRequirement already satisfied: keras-applications>=1.0.6 in /usr/local/lib/python3.6/dist-packages (from tensorflow==1.14.0) (1.0.8)\n",
- "Requirement already satisfied: keras-preprocessing>=1.0.5 in /usr/local/lib/python3.6/dist-packages (from tensorflow==1.14.0) (1.1.0)\n",
- "Requirement already satisfied: setuptools in /usr/local/lib/python3.6/dist-packages (from protobuf>=3.6.1->tensorflow==1.14.0) (46.1.3)\n",
- "Requirement already satisfied: markdown>=2.6.8 in /usr/local/lib/python3.6/dist-packages (from tensorboard<1.15.0,>=1.14.0->tensorflow==1.14.0) (3.2.1)\n",
- "Requirement already satisfied: werkzeug>=0.11.15 in /usr/local/lib/python3.6/dist-packages (from tensorboard<1.15.0,>=1.14.0->tensorflow==1.14.0) (1.0.1)\n",
- "Requirement already satisfied: h5py in /usr/local/lib/python3.6/dist-packages (from keras-applications>=1.0.6->tensorflow==1.14.0) (2.10.0)\n",
- "Installing collected packages: tensorboard, tensorflow-estimator, tensorflow\n",
- " Found existing installation: tensorboard 2.2.1\n",
- " Uninstalling tensorboard-2.2.1:\n",
- " Successfully uninstalled tensorboard-2.2.1\n",
- " Found existing installation: tensorflow-estimator 2.2.0\n",
- " Uninstalling tensorflow-estimator-2.2.0:\n",
- " Successfully uninstalled tensorflow-estimator-2.2.0\n",
- " Found existing installation: tensorflow 2.2.0rc4\n",
- " Uninstalling tensorflow-2.2.0rc4:\n",
- " Successfully uninstalled tensorflow-2.2.0rc4\n",
- "Successfully installed tensorboard-1.14.0 tensorflow-1.14.0 tensorflow-estimator-1.14.0\n"
- ],
- "name": "stdout"
- }
- ]
- },
- {
- "cell_type": "markdown",
- "metadata": {
- "id": "F5S86uIWZKVO",
- "colab_type": "text"
- },
- "source": [
- "We will be building an LSTM model with an embedding layer trained on the fly. We will be following all the preprocessing steps as in the [DeepNN_Example.ipynb](https://github.com/practical-nlp/practical-nlp/blob/master/Ch4/DeepNN_Example.ipynb) notebook in this repo."
- ]
- },
- {
- "cell_type": "code",
- "metadata": {
- "id": "UsCn1xlo_MMX",
- "colab_type": "code",
- "outputId": "a5f0393a-0812-4fd0-c593-1479a8a6ed76",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 98
- }
- },
- "source": [
- "import tensorflow as tf\n",
- "from tensorflow import keras\n",
- "import os\n",
- "import re\n",
- "import pandas as pd\n",
- "\n",
- "#helper functions to lead the data\n",
- "def load_directory_data(directory):\n",
- " data = {}\n",
- " data[\"sentence\"] = []\n",
- " data[\"sentiment\"] = []\n",
- " for file_path in os.listdir(directory):\n",
- " with tf.gfile.GFile(os.path.join(directory, file_path), \"r\") as f:\n",
- " data[\"sentence\"].append(f.read())\n",
- " data[\"sentiment\"].append(re.match(\"\\d+_(\\d+)\\.txt\", file_path).group(1))\n",
- " return pd.DataFrame.from_dict(data)\n",
- "\n",
- "# Merge positive and negative examples, add a polarity column and shuffle.\n",
- "def load_dataset(directory):\n",
- " pos_df = load_directory_data(os.path.join(directory, \"pos\"))\n",
- " neg_df = load_directory_data(os.path.join(directory, \"neg\"))\n",
- " pos_df[\"polarity\"] = 1\n",
- " neg_df[\"polarity\"] = 0\n",
- " return pd.concat([pos_df, neg_df]).sample(frac=1).reset_index(drop=True)\n",
- "\n",
- "def download_and_load_datasets(force_download=False):\n",
- " dataset = tf.keras.utils.get_file(\n",
- " fname=\"aclImdb.tar.gz\", \n",
- " origin=\"http://ai.stanford.edu/~amaas/data/sentiment/aclImdb_v1.tar.gz\", \n",
- " extract=True)\n",
- " \n",
- " train_df = load_dataset(os.path.join(os.path.dirname(dataset), \n",
- " \"aclImdb\", \"train\"))\n",
- " test_df = load_dataset(os.path.join(os.path.dirname(dataset), \n",
- " \"aclImdb\", \"test\"))\n",
- " \n",
- " return train_df, test_df\n",
- "\n",
- "train,test = download_and_load_datasets()"
- ],
- "execution_count": 0,
- "outputs": [
- {
- "output_type": "display_data",
- "data": {
- "text/html": [
- "
\n",
- "The default version of TensorFlow in Colab will soon switch to TensorFlow 2.x. \n",
- "We recommend you upgrade now \n",
- "or ensure your notebook will continue to use TensorFlow 1.x via the %tensorflow_version 1.x magic:\n",
- "more info.
\n"
- ],
- "text/plain": [
- ""
- ]
- },
- "metadata": {
- "tags": []
- }
- },
- {
- "output_type": "stream",
- "text": [
- "Downloading data from http://ai.stanford.edu/~amaas/data/sentiment/aclImdb_v1.tar.gz\n",
- "84131840/84125825 [==============================] - 8s 0us/step\n"
- ],
- "name": "stdout"
- }
- ]
- },
- {
- "cell_type": "code",
- "metadata": {
- "id": "hEpQWHnF-hOX",
- "colab_type": "code",
- "outputId": "75afbee2-0a05-4028-ed8f-86e50605201e",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 34
- }
- },
- "source": [
- "import warnings\n",
- "warnings.filterwarnings(\"ignore\")\n",
- "\n",
- "import os\n",
- "import sys\n",
- "import numpy as np\n",
- "from keras.preprocessing.text import Tokenizer\n",
- "from keras.preprocessing.sequence import pad_sequences\n",
- "from keras.utils import to_categorical\n",
- "from keras.layers import Dense, Input, GlobalMaxPooling1D\n",
- "from keras.layers import Conv1D, MaxPooling1D, Embedding, LSTM\n",
- "from keras.models import Model, Sequential\n",
- "from keras.initializers import Constant\n",
- "\n",
- "MAX_SEQUENCE_LENGTH = 1000\n",
- "MAX_NUM_WORDS = 20000 \n",
- "EMBEDDING_DIM = 100 \n",
- "VALIDATION_SPLIT = 0.2\n",
- "\n",
- "vocab_size = 20000 # Max number of different word, i.e. model input dimension\n",
- "maxlen = 1000 # Max number of words kept at the end of each text"
- ],
- "execution_count": 0,
- "outputs": [
- {
- "output_type": "stream",
- "text": [
- "Using TensorFlow backend.\n"
- ],
- "name": "stderr"
- }
- ]
- },
- {
- "cell_type": "code",
- "metadata": {
- "id": "830AVGaZBfnf",
- "colab_type": "code",
- "outputId": "c5fdd29a-b8fe-44a1-d81e-ddb0f1c57be0",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 34
- }
- },
- "source": [
- "train.columns"
- ],
- "execution_count": 0,
- "outputs": [
- {
- "output_type": "execute_result",
- "data": {
- "text/plain": [
- "Index(['sentence', 'sentiment', 'polarity'], dtype='object')"
- ]
- },
- "metadata": {
- "tags": []
- },
- "execution_count": 4
- }
- ]
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "colab_type": "text",
+ "id": "F5S86uIWZKVO"
+ },
+ "source": [
+ "We will be building an LSTM model with an embedding layer trained on the fly. We will be following all the preprocessing steps as in the [DeepNN_Example.ipynb](https://github.com/practical-nlp/practical-nlp/blob/master/Ch4/DeepNN_Example.ipynb) notebook in this repo."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 98
},
- {
- "cell_type": "code",
- "metadata": {
- "id": "FJo_FLISBhx6",
- "colab_type": "code",
- "colab": {}
- },
- "source": [
- "train_texts = train['sentence'].values\n",
- "train_labels = train['polarity'].values\n",
- "test_texts = test['sentence'].values\n",
- "# test_labels = test['polarity'].values\n",
- "\n",
- "labels_index = {'pos':1, 'neg':0} "
- ],
- "execution_count": 0,
- "outputs": []
+ "colab_type": "code",
+ "id": "UsCn1xlo_MMX",
+ "outputId": "a5f0393a-0812-4fd0-c593-1479a8a6ed76"
+ },
+ "outputs": [],
+ "source": [
+ "import tensorflow as tf\n",
+ "from tensorflow import keras\n",
+ "import os\n",
+ "import re\n",
+ "import pandas as pd\n",
+ "\n",
+ "# Helper functions to load the data\n",
+ "def load_directory_data(directory):\n",
+ " data = {}\n",
+ " data[\"sentence\"] = []\n",
+ " data[\"sentiment\"] = []\n",
+ " for file_path in os.listdir(directory):\n",
+ " with tf.io.gfile.GFile(os.path.join(directory, file_path), \"r\") as f:\n",
+ " data[\"sentence\"].append(f.read())\n",
+ " data[\"sentiment\"].append(re.match(\"\\d+_(\\d+)\\.txt\", file_path).group(1))\n",
+ " return pd.DataFrame.from_dict(data)\n",
+ "\n",
+ "# Merge positive and negative examples, add a polarity column and shuffle.\n",
+ "def load_dataset(directory):\n",
+ " pos_df = load_directory_data(os.path.join(directory, \"pos\"))\n",
+ " neg_df = load_directory_data(os.path.join(directory, \"neg\"))\n",
+ " pos_df[\"polarity\"] = 1\n",
+ " neg_df[\"polarity\"] = 0\n",
+ " return pd.concat([pos_df, neg_df]).sample(frac=1).reset_index(drop=True)\n",
+ "\n",
+ "def download_and_load_datasets(force_download=False):\n",
+ " dataset = tf.keras.utils.get_file(\n",
+ " fname=\"aclImdb.tar.gz\", \n",
+ " origin=\"http://ai.stanford.edu/~amaas/data/sentiment/aclImdb_v1.tar.gz\", \n",
+ " extract=True)\n",
+ "\n",
+ " train_df = load_dataset(os.path.join(os.path.dirname(dataset), \n",
+ " \"aclImdb\", \"train\"))\n",
+ " test_df = load_dataset(os.path.join(os.path.dirname(dataset), \n",
+ " \"aclImdb\", \"test\"))\n",
+ " \n",
+ " return train_df, test_df"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "try:\n",
+ " from google.colab import files\n",
+ " \n",
+ " if not os.path.exists('aclImdb'):\n",
+ " train,test = download_and_load_datasets()\n",
+ " else:\n",
+ " train = load_dataset('aclImdb/train')\n",
+ " test = load_dataset('aclImdb/test')\n",
+ " \n",
+ "except ModuleNotFoundError:\n",
+ " if not os.path.exists('Data/aclImdb'):\n",
+ " train,test = download_and_load_datasets()\n",
+ " else:\n",
+ " train = load_dataset('Data/aclImdb/train')\n",
+ " test = load_dataset('Data/aclImdb/test')"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 34
},
- {
- "cell_type": "code",
- "metadata": {
- "id": "rZ1G3DH3dDQ4",
- "colab_type": "code",
- "outputId": "8d6a5449-9d67-4ab5-d984-4eb80c971c4b",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 34
- }
- },
- "source": [
- "test.columns\n"
- ],
- "execution_count": 0,
- "outputs": [
- {
- "output_type": "execute_result",
- "data": {
- "text/plain": [
- "Index(['sentence', 'sentiment', 'polarity'], dtype='object')"
- ]
- },
- "metadata": {
- "tags": []
- },
- "execution_count": 37
- }
- ]
+ "colab_type": "code",
+ "id": "hEpQWHnF-hOX",
+ "outputId": "75afbee2-0a05-4028-ed8f-86e50605201e"
+ },
+ "outputs": [],
+ "source": [
+ "import warnings\n",
+ "warnings.filterwarnings(\"ignore\")\n",
+ "\n",
+ "import os\n",
+ "import sys\n",
+ "import numpy as np\n",
+ "from keras.preprocessing.text import Tokenizer\n",
+ "from keras.preprocessing.sequence import pad_sequences\n",
+ "from keras.utils.np_utils import to_categorical\n",
+ "from keras.layers import Dense, Input, GlobalMaxPooling1D\n",
+ "from keras.layers import Conv1D, MaxPooling1D, Embedding, LSTM\n",
+ "from keras.models import Model, Sequential\n",
+ "from keras.initializers import Constant\n",
+ "\n",
+ "MAX_SEQUENCE_LENGTH = 1000\n",
+ "MAX_NUM_WORDS = 20000 \n",
+ "EMBEDDING_DIM = 100 \n",
+ "VALIDATION_SPLIT = 0.2\n",
+ "\n",
+ "vocab_size = 20000 # Max number of distinct words, i.e. model input dimension\n",
+ "maxlen = 1000 # Max number of words kept at the end of each text"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 34
},
+ "colab_type": "code",
+ "id": "830AVGaZBfnf",
+ "outputId": "c5fdd29a-b8fe-44a1-d81e-ddb0f1c57be0"
+ },
+ "outputs": [
{
- "cell_type": "code",
- "metadata": {
- "id": "g8I6QgXldKd0",
- "colab_type": "code",
- "outputId": "e251c62f-451f-48cb-cce1-e46bd5dd9796",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 34
- }
- },
- "source": [
- "test_labels = test['polarity'].values\n",
- "test_labels"
- ],
- "execution_count": 0,
- "outputs": [
- {
- "output_type": "execute_result",
- "data": {
- "text/plain": [
- "array([1, 0, 1, ..., 0, 0, 0])"
- ]
- },
- "metadata": {
- "tags": []
- },
- "execution_count": 42
- }
+ "data": {
+ "text/plain": [
+ "Index(['sentence', 'sentiment', 'polarity'], dtype='object')"
]
+ },
+ "execution_count": 5,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "train.columns"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "metadata": {
+ "colab": {},
+ "colab_type": "code",
+ "id": "FJo_FLISBhx6"
+ },
+ "outputs": [],
+ "source": [
+ "train_texts = train['sentence'].values\n",
+ "train_labels = train['polarity'].values\n",
+ "test_texts = test['sentence'].values\n",
+ "# test_labels = test['polarity'].values\n",
+ "\n",
+ "labels_index = {'pos':1, 'neg':0} "
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 7,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 34
},
+ "colab_type": "code",
+ "id": "rZ1G3DH3dDQ4",
+ "outputId": "8d6a5449-9d67-4ab5-d984-4eb80c971c4b"
+ },
+ "outputs": [
{
- "cell_type": "markdown",
- "metadata": {
- "id": "VfPAZEEKajly",
- "colab_type": "text"
- },
- "source": [
- "We need to design an sklearn pipeline with our model.\n",
- "What is a pipeline? \n",
- "\n",
- "**Transformer** in scikit-learn - some class that have fit and transform method, or fit_transform method.\n",
- "\n",
- "**Predictor** - some class that has fit and predict methods, or fit_predict method.\n",
- "\n",
- "**Pipeline** is just an abstract notion, it's not some existing ml algorithm. Often in ML tasks you need to perform sequence of different transformations (find set of features, generate new features, select only some good features) of raw dataset before applying final estimator. Pipeline gives you a single interface for all 3 steps of transformation and resulting estimator. It encapsulates transformers and predictors inside"
+ "data": {
+ "text/plain": [
+ "Index(['sentence', 'sentiment', 'polarity'], dtype='object')"
]
+ },
+ "execution_count": 7,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "test.columns"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 8,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 34
},
+ "colab_type": "code",
+ "id": "g8I6QgXldKd0",
+ "outputId": "e251c62f-451f-48cb-cce1-e46bd5dd9796"
+ },
+ "outputs": [
{
- "cell_type": "code",
- "metadata": {
- "id": "ibekacAMMTsr",
- "colab_type": "code",
- "colab": {}
- },
- "source": [
- "from keras.preprocessing.text import Tokenizer\n",
- "from keras.preprocessing.sequence import pad_sequences\n",
- "from sklearn.pipeline import TransformerMixin\n",
- "from sklearn.base import BaseEstimator\n",
- "\n",
- "\n",
- "class TextsToSequences(Tokenizer, BaseEstimator, TransformerMixin):\n",
- " \"\"\" Sklearn transformer to convert texts to indices list \n",
- " (e.g. [[\"the cute cat\"], [\"the dog\"]] -> [[1, 2, 3], [1, 4]])\"\"\"\n",
- " def __init__(self, **kwargs):\n",
- " super().__init__(**kwargs)\n",
- " \n",
- " def fit(self, texts, y=None):\n",
- " self.fit_on_texts(texts)\n",
- " return self\n",
- " \n",
- " def transform(self, texts, y=None):\n",
- " return np.array(self.texts_to_sequences(texts))\n",
- " \n",
- "sequencer = TextsToSequences(num_words=vocab_size)\n",
- "\n",
- "\n",
- "\n",
- "\n",
- "class Padder(BaseEstimator, TransformerMixin):\n",
- " \"\"\" Pad and crop uneven lists to the same length. \n",
- " Only the end of lists longernthan the maxlen attribute are\n",
- " kept, and lists shorter than maxlen are left-padded with zeros\n",
- " \n",
- " Attributes\n",
- " ----------\n",
- " maxlen: int\n",
- " sizes of sequences after padding\n",
- " max_index: int\n",
- " maximum index known by the Padder, if a higher index is met during \n",
- " transform it is transformed to a 0\n",
- " \"\"\"\n",
- " def __init__(self, maxlen=500):\n",
- " self.maxlen = maxlen\n",
- " self.max_index = None\n",
- " \n",
- " def fit(self, X, y=None):\n",
- " self.max_index = pad_sequences(X, maxlen=self.maxlen).max()\n",
- " return self\n",
- " \n",
- " def transform(self, X, y=None):\n",
- " X = pad_sequences(X, maxlen=self.maxlen)\n",
- " X[X > self.max_index] = 0\n",
- " return X\n",
- "\n",
- "padder = Padder(maxlen)"
- ],
- "execution_count": 0,
- "outputs": []
- },
- {
- "cell_type": "markdown",
- "metadata": {
- "id": "8mtEN5BjbyKM",
- "colab_type": "text"
- },
- "source": [
- "We will only train for 2 epochs. A better model could be trained with more epochs and early stopping."
+ "data": {
+ "text/plain": [
+ "array([1, 1, 0, ..., 0, 1, 1])"
]
+ },
+ "execution_count": 8,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "test_labels = test['polarity'].values\n",
+ "test_labels"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "colab_type": "text",
+ "id": "VfPAZEEKajly"
+ },
+ "source": [
+ "We need to design an sklearn pipeline with our model.\n",
+ "What is a pipeline? \n",
+ "\n",
+ "**Transformer** in scikit-learn - a class that has fit and transform methods, or a fit_transform method.\n",
+ "\n",
+ "**Predictor** - a class that has fit and predict methods, or a fit_predict method.\n",
+ "\n",
+ "**Pipeline** is just an abstract notion; it is not an ML algorithm in itself. In ML tasks you often need to perform a sequence of different transformations (find a set of features, generate new features, select only the good features) on the raw dataset before applying the final estimator. A pipeline gives you a single interface for all 3 steps of transformation and the resulting estimator. It encapsulates the transformers and the predictor inside a single object."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 0,
+ "metadata": {
+ "colab": {},
+ "colab_type": "code",
+ "id": "ibekacAMMTsr"
+ },
+ "outputs": [],
+ "source": [
+ "from keras.preprocessing.text import Tokenizer\n",
+ "from keras.preprocessing.sequence import pad_sequences\n",
+ "from sklearn.pipeline import TransformerMixin\n",
+ "from sklearn.base import BaseEstimator\n",
+ "\n",
+ "\n",
+ "class TextsToSequences(Tokenizer, BaseEstimator, TransformerMixin):\n",
+ " \"\"\" Sklearn transformer to convert texts to indices list \n",
+ " (e.g. [[\"the cute cat\"], [\"the dog\"]] -> [[1, 2, 3], [1, 4]])\"\"\"\n",
+ " def __init__(self, **kwargs):\n",
+ " super().__init__(**kwargs)\n",
+ " \n",
+ " def fit(self, texts, y=None):\n",
+ " self.fit_on_texts(texts)\n",
+ " return self\n",
+ " \n",
+ " def transform(self, texts, y=None):\n",
+ " return np.array(self.texts_to_sequences(texts))\n",
+ " \n",
+ "sequencer = TextsToSequences(num_words=vocab_size)\n",
+ "\n",
+ "\n",
+ "\n",
+ "\n",
+ "class Padder(BaseEstimator, TransformerMixin):\n",
+ " \"\"\" Pad and crop uneven lists to the same length. \n",
+ " Only the end of lists longer than the maxlen attribute are\n",
+ " kept, and lists shorter than maxlen are left-padded with zeros\n",
+ " \n",
+ " Attributes\n",
+ " ----------\n",
+ " maxlen: int\n",
+ " sizes of sequences after padding\n",
+ " max_index: int\n",
+ " maximum index known by the Padder, if a higher index is met during \n",
+ " transform it is transformed to a 0\n",
+ " \"\"\"\n",
+ " def __init__(self, maxlen=500):\n",
+ " self.maxlen = maxlen\n",
+ " self.max_index = None\n",
+ " \n",
+ " def fit(self, X, y=None):\n",
+ " self.max_index = pad_sequences(X, maxlen=self.maxlen).max()\n",
+ " return self\n",
+ " \n",
+ " def transform(self, X, y=None):\n",
+ " X = pad_sequences(X, maxlen=self.maxlen)\n",
+ " X[X > self.max_index] = 0\n",
+ " return X\n",
+ "\n",
+ "padder = Padder(maxlen)"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "colab_type": "text",
+ "id": "8mtEN5BjbyKM"
+ },
+ "source": [
+ "We will only train for 2 epochs. A better model could be trained with more epochs and early stopping."
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 0,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 86
},
+ "colab_type": "code",
+ "id": "6XvXEYGBMWlW",
+ "outputId": "a546a0c7-169a-4ca9-fb0d-c054250f740a"
+ },
+ "outputs": [
{
- "cell_type": "code",
- "metadata": {
- "id": "6XvXEYGBMWlW",
- "colab_type": "code",
- "outputId": "a546a0c7-169a-4ca9-fb0d-c054250f740a",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 86
- }
- },
- "source": [
- "from keras.models import Sequential\n",
- "from keras.layers import Dense, Embedding, Bidirectional, LSTM\n",
- "from keras.wrappers.scikit_learn import KerasClassifier\n",
- "from sklearn.pipeline import make_pipeline\n",
- "\n",
- "batch_size = 64\n",
- "max_features = vocab_size + 1\n",
- "\n",
- "#Training an LSTM with embedding on the fly\n",
- "def create_model(max_features):\n",
- " \"\"\" Model creation function: returns a compiled LSTM\"\"\"\n",
- "\n",
- "\n",
- " rnnmodel = Sequential()\n",
- " rnnmodel.add(Embedding(MAX_NUM_WORDS, 128))\n",
- " rnnmodel.add(LSTM(128, dropout=0.2, recurrent_dropout=0.2))\n",
- " rnnmodel.add(Dense(1, activation='sigmoid'))\n",
- " rnnmodel.compile(loss='binary_crossentropy',\n",
- " optimizer='adam',\n",
- " metrics=['accuracy'])\n",
- " return rnnmodel\n",
- "\n",
- "\n",
- "# Use Keras Scikit-learn wrapper to instantiate a LSTM with all methods\n",
- "# required by Scikit-learn for the last step of a Pipeline\n",
- "sklearn_lstm = KerasClassifier(build_fn=create_model, epochs=2, batch_size=32, \n",
- " max_features=max_features, verbose=1)\n",
- "\n",
- "# Build the Scikit-learn pipeline\n",
- "pipeline = make_pipeline(sequencer, padder, sklearn_lstm)\n",
- "\n",
- "pipeline.fit(train_texts, train_labels);"
- ],
- "execution_count": 0,
- "outputs": [
- {
- "output_type": "stream",
- "text": [
- "Epoch 1/2\n",
- "25000/25000 [==============================] - 1486s 59ms/step - loss: 0.5025 - acc: 0.7597\n",
- "Epoch 2/2\n",
- "25000/25000 [==============================] - 1475s 59ms/step - loss: 0.3441 - acc: 0.8572\n"
- ],
- "name": "stdout"
- }
- ]
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Epoch 1/2\n",
+ "25000/25000 [==============================] - 1486s 59ms/step - loss: 0.5025 - acc: 0.7597\n",
+ "Epoch 2/2\n",
+ "25000/25000 [==============================] - 1475s 59ms/step - loss: 0.3441 - acc: 0.8572\n"
+ ]
+ }
+ ],
+ "source": [
+ "from keras.models import Sequential\n",
+ "from keras.layers import Dense, Embedding, Bidirectional, LSTM\n",
+ "from keras.wrappers.scikit_learn import KerasClassifier\n",
+ "from sklearn.pipeline import make_pipeline\n",
+ "\n",
+ "batch_size = 64\n",
+ "max_features = vocab_size + 1\n",
+ "\n",
+ "#Training an LSTM with embedding on the fly\n",
+ "def create_model(max_features):\n",
+ " \"\"\" Model creation function: returns a compiled LSTM\"\"\"\n",
+ "\n",
+ "\n",
+ " rnnmodel = Sequential()\n",
+ " rnnmodel.add(Embedding(MAX_NUM_WORDS, 128))\n",
+ " rnnmodel.add(LSTM(128, dropout=0.2, recurrent_dropout=0.2))\n",
+ " rnnmodel.add(Dense(1, activation='sigmoid'))\n",
+ " rnnmodel.compile(loss='binary_crossentropy',\n",
+ " optimizer='adam',\n",
+ " metrics=['accuracy'])\n",
+ " return rnnmodel\n",
+ "\n",
+ "\n",
+ "# Use Keras Scikit-learn wrapper to instantiate a LSTM with all methods\n",
+ "# required by Scikit-learn for the last step of a Pipeline\n",
+ "sklearn_lstm = KerasClassifier(build_fn=create_model, epochs=2, batch_size=32, \n",
+ " max_features=max_features, verbose=1)\n",
+ "\n",
+ "# Build the Scikit-learn pipeline\n",
+ "pipeline = make_pipeline(sequencer, padder, sklearn_lstm)\n",
+ "\n",
+ "pipeline.fit(train_texts, train_labels);"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 0,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 34
},
+ "colab_type": "code",
+ "id": "2KKnIf5BcnQn",
+ "outputId": "bef294a5-b7bb-4b60-812b-91f843b8a04b"
+ },
+ "outputs": [
{
- "cell_type": "code",
- "metadata": {
- "id": "2KKnIf5BcnQn",
- "colab_type": "code",
- "outputId": "bef294a5-b7bb-4b60-812b-91f843b8a04b",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 34
- }
- },
- "source": [
- "print('Test accuracy: {:.2f} %'.format(100*metrics.accuracy_score(y_preds, test_labels)))"
- ],
- "execution_count": 0,
- "outputs": [
- {
- "output_type": "stream",
- "text": [
- "Test accuracy: 83.70 %\n"
- ],
- "name": "stdout"
- }
- ]
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Test accuracy: 83.70 %\n"
+ ]
+ }
+ ],
+ "source": [
+ "print('Test accuracy: {:.2f} %'.format(100*metrics.accuracy_score(y_preds, test_labels)))"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 0,
+ "metadata": {
+ "colab": {
+ "base_uri": "https://localhost:8080/",
+ "height": 477
},
+ "colab_type": "code",
+ "id": "jd9mzgXrZ9ys",
+ "outputId": "9a640266-ef6d-40cc-8d6c-07023424b69c"
+ },
+ "outputs": [
{
- "cell_type": "code",
- "metadata": {
- "id": "jd9mzgXrZ9ys",
- "colab_type": "code",
- "outputId": "9a640266-ef6d-40cc-8d6c-07023424b69c",
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 477
- }
- },
- "source": [
- "\n",
- "\n",
- "# We choose a sample from test set\n",
- "idx = 11\n",
- "text_sample = test_texts[idx]\n",
- "class_names = ['negative', 'positive']\n",
- "\n",
- "print('Sample {}: last 1000 words (only part used by the model)'.format(idx))\n",
- "print('-'*50)\n",
- "print(\" \".join(text_sample.split()[-1000:]))\n",
- "print('-'*50)\n",
- "print('Probability(positive) =', pipeline.predict_proba([text_sample])[0,1])\n",
- "print('True class: %s' % class_names[test_labels[idx]])\n",
- "\n",
- "\n",
- "\n",
- "import matplotlib.pyplot as plt\n",
- "import seaborn as sns\n",
- "%matplotlib inline\n",
- "from collections import OrderedDict\n",
- "from lime.lime_text import LimeTextExplainer\n",
- "\n",
- "explainer = LimeTextExplainer(class_names=class_names)\n",
- "explanation = explainer.explain_instance(text_sample, pipeline.predict_proba, num_features=10)\n",
- "\n",
- "weights = OrderedDict(explanation.as_list())\n",
- "lime_weights = pd.DataFrame({'words': list(weights.keys()), 'weights': list(weights.values())})\n",
- "\n",
- "sns.barplot(x=\"words\", y=\"weights\", data=lime_weights);\n",
- "plt.xticks(rotation=45)\n",
- "plt.title('Sample {} features weights given by LIME'.format(idx));"
- ],
- "execution_count": 0,
- "outputs": [
- {
- "output_type": "stream",
- "text": [
- "Sample 11: last 1000 words (only part used by the model)\n",
- "--------------------------------------------------\n",
- "The film starts out with a narration of the protagonist explaining certain crimes occurring all over the city and then we get to know that the hero is a cop who is either suspended or has probably retired. I did not have the patience or the interest to verify the above before commenting. If there is a stereotype for narrators to have a deep, sleep-inducing voice then, it is high time to put an end to it. I seriously fell asleep and did not bother to shut the movie down either. Am still trying to figure out what the movie was all about and why there were no outdoor shootings. A third rate TV Serial will have more number of sets compared to this crap of a movie and I still pity the actors and producers involved in this huge bullshit of a movie. It ought to have been produced as a normal TV serial or maybe even as a local theater drama instead of putting it out on the big screen. Total waste of time and money. The movie was supposed to be in production for a long time and it would have been better to have left it that way.With redundant sleep inducing dialogs and sets, this is the worst movie I have come across.\n",
- "--------------------------------------------------\n",
- "1/1 [==============================] - 0s 347ms/step\n",
- "Probability(positive) = 0.07630403\n",
- "True class: negative\n",
- "5000/5000 [==============================] - 63s 13ms/step\n"
- ],
- "name": "stdout"
- },
- {
- "output_type": "display_data",
- "data": {
- "image/png": "iVBORw0KGgoAAAANSUhEUgAAAZAAAAEtCAYAAAAm6zZnAAAABHNCSVQICAgIfAhkiAAAAAlwSFlz\nAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4xLjMsIGh0\ndHA6Ly9tYXRwbG90bGliLm9yZy+AADFEAAAgAElEQVR4nO3dedxUZf3/8ddbEM0dAhFBxK9Lamou\nqJklrrgUQqYlbmgaaVG55E/LSjM1Lc20ssK0ULM0M8XcQnNLy7xxNzM0RUAEBNw30M/vj+uaHIe5\nb4bDPQvc7+fjMY97zpkz5/rMmbnP51zLOUcRgZmZ2aJaptkBmJnZkskJxMzMCnECMTOzQpxAzMys\nECcQMzMrxAnEzMwKcQKxBUg6RdJlLRBHX0l3SnpF0jnNjqeVSDpQ0l9qXPZQSX+rd0xVyh0o6VVJ\n3Rpc7u2SjmhkmV2VE0gLkfRxSfdIeknSHEl3S9q62XEtCkljJLVJekvSbype6yHpKknPSApJOy5k\ndaOBF4BVIuK4xYzrN5JOW5x1tJKI+G1EDO2MddVrhxsRz0bEShHxTmevuxEkDcq/0+5VXnvfQVZe\nbmb5spKWzfOibN7tkt7MibX0uK7+n6Y+nEBahKRVgD8DPwF6Af2B7wJvNTOuAp4DTgMubuf1vwEH\nAc/XsK61gX9FC5ztWm0nYlZhLrBn2fSeeV6lMTmxlh7DGhNe53MCaR0bAETE7yLinYh4IyL+EhEP\nA0haV9JfJc2W9IKk30parfTmfFR/vKSHJb0m6aLcBHRjbgK6RVLPvGzpyGq0pOckTZf09fYCk/TR\nXDN6UdJDHdUcIuLqiLgGmF3ltbcj4scR8Tegw6PSXHsZBfy/fJS2q6RlJJ0o6am8Ha6U1KvsPX+Q\n9Hyuwd0p6cN5/mjgwLJ1XZfnh6T1ysss1VIk7ShpqqQTJD0P/DrP/5SkB/O2uEfSZmXvP0HStLy9\nn5C0S5XPtU5+7zJ5+kJJM8tev1TS0fn5qvl7nJ7Xe1qpOaiyWUrS0FzmS5IukHRHZa1C0tmS5kp6\nWtKeed7pwCeAn+Zt81Ml5+aj55clPSJpk3a+p3X0XjPjLZJ+VjoyLz+Cl/Q5SW0V7z1G0vj8fLkc\n37OSZkj6haQPVHwXx+WYpks6rFo8ZdaV9M8c/7Wl34mk6yV9pSKOhyV9eiHrq8WlwCFl04cAl3TC\neluWE0jr+A/wjqRxkvYs7ezLCPg+sCawEbAWcErFMp8BdiMlo2HAjcA3gT6k7/qrFcvvBKwPDAVO\nkLRrZVCS+gPXk2oVvYCvA3+U1KfYx6xNRBwK/Bb4QT5KuwX4CjACGELaDnOBn5W97UbS51kduD+/\nn4gYW7GuWo/41iB95rWB0ZK2INWsvgh8EPglMD7v/D4EjAG2joiVgd2BZ6p8rqeBl4Et8qwdgFcl\nbZSnhwB35Oe/AeYD6+XlhwILNDVJ6g1cBXwjx/UE8LGKxbbN83sDPwAukqSIOAm4i/eOisfkcnYg\n/Y5WBT5LlQOC7HLgn7ncU4CD21nuOuBDktYvm3dAfj/Ambm8zfPn7Q98p2zZNXIs/YHDgZ9V+R8p\ndwjweaAfaRuen+ePI9WAAZD0kbzO6ztYV62uAXaQtFqO7RPAtZ2w3pblBNIiIuJl4ONAABcCsySN\nl9Q3v/5kREyIiLciYhbwI9LOptxPImJGREwj7RTujYgHIuJN4E+8t9Mq+W5EvBYRj5COsEdWCe0g\n4IaIuCEi3o2ICUAbsFfnfPJFciRwUkRMjYi3SDusfZWblyLi4oh4pey1j0hadTHKexc4OW/zN0h9\nMr+MiHtzLXEcqYnxo6Qa1XLAxpKWjYhnIuKpdtZ7BzBE0hp5+qo8vQ6wCvBQ/t73Ao7O39FM4Fxg\n/yrr2wt4LNf+SjvLyibCyRFxYe6PGEfasf
ZtJ755wMrAhoAi4vGImF65kKSBwNbAd3Lt8m/A+Gor\njIjXSTvTkfm96+f1j5ck0rY9JiLmRMQrwBkVn3UecGpEzIuIG4BXgQ+1Ez/ApRHxaES8Bnwb+Gyu\nvY0HNihLZAcDV0TE2x2sq1ZvkhLl5/JjfJ5X6fxcCy09vtcJZTeFE0gLyf+oh0bEAGAT0lH2j+F/\nI5J+n5syXgYuIx1NlptR9vyNKtMrVSw/pez55FxepbWB/cp/8KRE128RP15nWBv4U1kcj5N23H0l\ndZN0plLz1su8d/RfuY0WxaycfMvLP65iW6wFrBkRTwJHkxLXzPxdVduekBLIjqSj/DuB20kHA0OA\nuyLi3VzWssD0srJ+SapdVVqTsu8y9xlNrVjm+bLXX89PK38Ppdf/CvyUVLubKWmsUh9dtXLnlK0P\n3v+bqnQ57x2kHABck9/bB1gBmFj2WW/K80tm5+RY8np78VeJYzJpW/bO3+cVwEFKzYgjSU1PneUS\nUu2no+arr0bEamWPb3di+Q3lBNKiIuLfpCaMUtvzGaTayaYRsQqpZqDFLGatsucDSR3glaaQjubK\nf/ArRsSZi1l2EVOAPStiWT7XuA4AhgO7kpo6BuX3lLZRtY7410k7rpI1Kl6vfM8U4PSK8leIiN8B\nRMTlEfFx0s4/gLPa+Rx3kJo3dszP/wZsz/ubr6aQaje9y8paJSI+XGV904EBpYl8RD+gynLtWWDb\nRMT5EbEVsDGpaen4dsrtJal8G65VZbmSCUAfSZuTdtyl5qsXSAc4Hy77rKtGREcJYmEqf9vzcjmQ\namAHArsAr0fE3xejnEp38V7truFDpxvNCaRFSNowdxIOyNNrkf7J/pEXWZlUbX8p90tU+4deVN+W\ntIJSZ/NhpCOzSpcBwyTtno/yl8+dmlV3ULnDdHmgG1Bavnxo43L5dYAe+fVaE+EvgNMlrZ3X1UfS\n8PzayqQd7mxSUjij4r0zgP+rmPcgcED+XHuwYJNgpQuBIyVtq2RFSZ+UtLKkD0naWdJypGaLN0hN\nYAuIiEn59YOAO3Lz5QxSH9YdeZnpwF+AcyStojSAYF1J1WK8HthU0oi8rb/MgsmwI+/bNpK2zp9x\nWeC1/HkW+CwRMZnUnHmK0hDt7Uh9b1VFxDzgD8APSX1LE/L8d0nb9lxJq+cY+kvafRE+Q6WDJG2c\nk9upwFWl4cQ5YbwLnENttY/l8u+09Gh3v5lrf8OAvfPzpZoTSOt4hdTRea+k10iJ41GgdP7Dd4Et\ngZdIO4yrO6HMO4AngVuBsyNigRPTImIK6cj+m8As0pHx8bT/2/kWaed4ImkH+UaeV/JEntcfuDk/\nX7vGeM8jtSv/RdIrpG20bX7tElJTxTTgX7yXeEsuIvVPvCjpmjzva6R/9hdJR6TX0IGIaAO+QGre\nmUvadofml5cjdQS/QGouWp3Uqd2eO0jNMlPKpkXq/C85BOiRP89cUl/JAk2HEfECsB+pc3w2qdbQ\nRu1DwM8j9SXNlXQ+qR/mwlzm5LzOH7bz3gOB7fIyp5EOQjoq93JSLfEPFU1SJ5C25z9yE+QtdNzH\nsTCXkmrwzwPLs+AAkkuATUkHSAvzKul3Wnrs3NHCEfFYRDzWwSKlEW+lx8QaYmhJ6gJJ0ipIGgQ8\nDSxb8U9sS4F8hDwVODAibmtw2VcA/46IkxtZ7qKSdAgwOjc5WkGugZgtBXIT42q5Ce2bpNpMZS2s\nHuVunZvWlsnNgMNZSE2u2XKz1peAsc2OZUnnBGK2dNgOeIrUhDYMGJGHHtfbGqRRZK+Shg8fFREP\nNKDcQnK/yixSv8/lC1ncFsJNWGZmVohrIGZmVogTiJmZFdKlrjDau3fvGDRoULPDMDNbokycOPGF\niFjg+nddKoEMGjSItra2hS9oZmb/I2lytfluwjIzs0KcQMzMrBAnEDMzK8QJxMzMCnECMTOzQpxA\nzMysEC
cQMzMrxAnEzMwKaeqJhPnyz+eR7l73q8rbpOZLU18CbEW6Yc3nIuIZSbuRbt7TA3gbOD7f\nx3mJ8+ypmzaknIHfeaQh5ZhZ19G0GoikbsDPgD1Jd1AbKWnjisUOB+ZGxHrAubx3j+kXgGERsSkw\nitpuS2lmZp2omU1Y2wBPRsR/I+Jt4Pekm9GUGw6My8+vAnaRpIh4ICKey/MfAz6QaytmZtYgzUwg\n/Un31y6ZmudVXSbfevUl4IMVy3wGuD8iar3/s5mZdYIl+mKKkj5MatYa2sEyo4HRAAMHDmxQZGZm\nS79m1kCmAWuVTQ/I86ouI6k7sCqpMx1JA4A/AYdExFPtFRIRYyNicEQM7tNngasRm5lZQc1MIPcB\n60taR1IPYH9gfMUy40md5AD7An+NiJC0GnA9cGJE3N2wiM3M7H+alkByn8YY4GbgceDKiHhM0qmS\n9s6LXQR8UNKTwLHAiXn+GGA94DuSHsyP1Rv8EczMurSm9oFExA3ADRXzvlP2/E1gvyrvOw04re4B\nmplZu3wmupmZFeIEYmZmhTiBmJlZIUv0eSDWObb/yfYNK+vur3jQnNnSwjUQMzMrxAnEzMwKcROW\ntYQ7dhjSsLKG3HlHw8oyW5q5BmJmZoU4gZiZWSFOIGZmVogTiJmZFeIEYmZmhXgUllmLOf2gfRtW\n1kmXXdWwsmzp4xqImZkV4gRiZmaFOIGYmVkhTiBmZlaIE4iZmRXiUVhm1rJOOeWUlijryj9s07A4\nPrvfP6vO/8hVNzcshof23b2m5VwDMTOzQpxAzMysECcQMzMrxAnEzMwKcQIxM7NCnEDMzKwQJxAz\nMyvECcTMzApxAjEzs0KcQMzMrBAnEDMzK6SpCUTSHpKekPSkpBOrvL6cpCvy6/dKGlT22jfy/Cck\n1XbhFjMz6zRNSyCSugE/A/YENgZGStq4YrHDgbkRsR5wLnBWfu/GwP7Ah4E9gAvy+szMrEGaWQPZ\nBngyIv4bEW8DvweGVywzHBiXn18F7CJJef7vI+KtiHgaeDKvz8zMGkQR0ZyCpX2BPSLiiDx9MLBt\nRIwpW+bRvMzUPP0UsC1wCvCPiLgsz78IuDEirqpSzmhgNMDAgQO3mjx5MgBbHX9J/T5chYk/PKRh\nZdni+elx1zWsrDHnDGtYWUU8fvpfG1bWRift3LCybNFJmhgRgyvnL/Wd6BExNiIGR8TgPn36NDsc\nM7OlRjMTyDRgrbLpAXle1WUkdQdWBWbX+F4zM6ujZiaQ+4D1Ja0jqQepU3x8xTLjgVH5+b7AXyO1\nuY0H9s+jtNYB1geq38bLzMzqomm3tI2I+ZLGADcD3YCLI+IxSacCbRExHrgIuFTSk8AcUpIhL3cl\n8C9gPvDliHinKR/EzKyLauo90SPiBuCGinnfKXv+JrBfO+89HTi9rgGamVm7lvpOdDMzqw8nEDMz\nK8QJxMzMCnECMTOzQpxAzMysECcQMzMrxAnEzMwKcQIxM7NCnEDMzKwQJxAzMyvECcTMzApxAjEz\ns0KcQMzMrJCmXo3XzFqXbzNrC+MaiJmZFeIEYmZmhTiBmJlZIU4gZmZWiBOImZkV4gRiZmaFOIGY\nmVkhPg/ErMyYc4Y1OwSzJYZrIGZmVogTiJmZFeIEYmZmhTiBmJlZIU4gZmZWiBOImZkV4gRiZmaF\nNCWBSOolaYKkSflvz3aWG5WXmSRpVJ63gqTrJf1b0mOSzmxs9GZmBs2rgZwI3BoR6wO35un3kdQL\nOBnYFtgGOLks0ZwdERsCWwDbS9qzMWGbmVlJsxLIcGBcfj4OGFFlmd2BCRExJyLmAhOAPSLi9Yi4\nDSAi3gbuBwY0IGYzMyvTrATSNyKm5+fPA32rLNMfmFI2PTXP+x9JqwHDSLUYMzNroJquhSVpXWBq\nRLwlaUdgM+CSiHixg/fcAqxR5aWTyiciIiRF7SH/b/3dgd8B50fEfztY
bjQwGmDgwIGLWoyZmbWj\n1hrIH4F3JK0HjAXWAi7v6A0RsWtEbFLlcS0wQ1I/gPx3ZpVVTMvllAzI80rGApMi4scLiWNsRAyO\niMF9+vRZ2Oc0M7Ma1ZpA3o2I+cCngZ9ExPFAv8UodzwwKj8fBVxbZZmbgaGSeubO86F5HpJOA1YF\njl6MGMzMbDHUmkDmSRpJ2tn/Oc9bdjHKPRPYTdIkYNc8jaTBkn4FEBFzgO8B9+XHqRExR9IAUjPY\nxsD9kh6UdMRixGJmZgXUej+Qw4AjgdMj4mlJ6wCXFi00ImYDu1SZ3wYcUTZ9MXBxxTJTARUt28zM\nOketCWS3iPhqaSInkTfrFJOZmS0Bam3CGlVl3qGdGIeZmS1hOqyB5H6PA4B1JI0ve2llYE49AzMz\ns9a2sCase4DpQG/gnLL5rwAP1ysoMzNrfR0mkIiYDEwGtmtMOGZmtqSoqQ9E0j75irgvSXpZ0iuS\nXq53cGZm1rpqHYX1A2BYRDxez2DMzGzJUesorBlOHmZmVm5ho7D2yU/bJF0BXAO8VXo9Iq6uY2xm\nZtbCFtaENazs+euk61GVBOAEYmbWRS1sFNZhjQrEzMyWLLXeD+T8KrNfAtry5dnNzKyLqbUTfXlg\nc2BSfmxGuj/H4ZI6vB+HmZktnWodxrsZsH1EvAMg6efAXcDHgUfqFJuZmbWwWmsgPYGVyqZXBHrl\nhPJW9beYmdnSbFFOJHxQ0u2ke3HsAJwhaUXgljrFZmZmLaymBBIRF0m6Adgmz/pmRDyXnx9fl8jM\nzKylddiEJWnD/HdL0j3Qp+THGnmemZl1UQurgRwLjOb9l3IvCWDnTo/IzMyWCAs7kXB0/rtTY8Ix\nM7MlRa2Xc19B0rckjc3T60v6VH1DMzOzVlbrMN5fA28DH8vT04DT6hKRmZktEWpNIOtGxA+AeQAR\n8TppOK+ZmXVRtSaQtyV9gNRxjqR18QmEZmZdWq0nEp4M3ASsJem3wPbAofUKyszMWl+tCWQUcD1w\nFfBf4GsR8ULdojIzs5ZXawK5CPgEsBuwLvCApDsj4ry6RWZmZi2t1kuZ3CbpTmBrYCfgSODDgBOI\nmVkXVesNpW4lXYH376TLuG8dETPrGZiZmbW2WkdhPUw6D2QT0r1BNsmjsgqR1EvSBEmT8t+e7Sw3\nKi8zSdKoKq+Pl/Ro0TjMzKy4mhJIRBwTETsA+wCzSScWvrgY5Z4I3BoR6wO35un3kdSLNPprW9JV\ngE8uTzSS9gFeXYwYzMxsMdR6KZMxkq4AHgCGAxcDey5GucOBcfn5OGBElWV2ByZExJyImAtMAPbI\n8axEutCjz4Y3M2uSWkdhLQ/8CJgYEfM7ody+ETE9P38e6Ftlmf6kS8eXTM3zAL5HukLw650Qi5mZ\nFVDrKKyzF3XFkm4B1qjy0kkV6w5JsQjr3Zx0aZVjJA2qYfnRpEvSM3DgwFqLMTOzhai1BrLIImLX\n9l6TNENSv4iYLqkfUG1E1zRgx7LpAcDtwHbAYEnPkOJfXdLtEbEjVUTEWGAswODBg2tOVGZm1rFa\nR2F1tvGks9vJf6+tsszNwFBJPXPn+VDg5oj4eUSsGRGDgI8D/2kveZiZWf00K4GcCewmaRKwa55G\n0mBJvwKIiDmkvo778uPUPM/MzFpA3ZqwOhIRs4FdqsxvA44om76YNOKrvfU8Qzo3xczMGqxZNRAz\nM1vCOYGYmVkhTiBmZlaIE4iZmRXiBGJmZoU4gZiZWSFOIGZmVogTiJmZFeIEYmZmhTiBmJlZIU4g\nZmZWiBOImZkV4gRiZmaFOIGYmVkhTiBmZlaIE4iZmRXiBGJmZoU4gZiZWSFOIGZmVogTiJmZFeIE\nYmZmhTiBmJlZIU4gZmZWiBOImZkV4gRiZmaFOIGYmVkhTiBmZlaIE4iZmRXiBGJmZoU4gZiZWSFN\nSSCSekmaIGlS/tuzneVG5WUmSRpV
Nr+HpLGS/iPp35I+07jozcwMmlcDORG4NSLWB27N0+8jqRdw\nMrAtsA1wclmiOQmYGREbABsDdzQkajMz+59mJZDhwLj8fBwwosoyuwMTImJORMwFJgB75Nc+D3wf\nICLejYgX6hyvmZlVaFYC6RsR0/Pz54G+VZbpD0wpm54K9Je0Wp7+nqT7Jf1BUrX3AyBptKQ2SW2z\nZs3qlODNzKyOCUTSLZIerfIYXr5cRAQQi7Dq7sAA4J6I2BL4O3B2ewtHxNiIGBwRg/v06VPko5iZ\nWRXd67XiiNi1vdckzZDULyKmS+oHzKyy2DRgx7LpAcDtwGzgdeDqPP8PwOGdEbOZmdWuWU1Y44HS\nqKpRwLVVlrkZGCqpZ+48HwrcnGss1/FectkF+Fd9wzUzs0rNSiBnArtJmgTsmqeRNFjSrwAiYg7w\nPeC+/Dg1zwM4AThF0sPAwcBxDY7fzKzLq1sTVkciYjap5lA5vw04omz6YuDiKstNBnaoZ4xmZtYx\nn4luZmaFOIGYmVkhTiBmZlaIE4iZmRXiBGJmZoU4gZiZWSFOIGZmVogTiJmZFeIEYmZmhTiBmJlZ\nIU4gZmZWiBOImZkV4gRiZmaFOIGYmVkhTiBmZlaIE4iZmRXiBGJmZoU4gZiZWSFOIGZmVogTiJmZ\nFeIEYmZmhTiBmJlZIU4gZmZWiBOImZkV4gRiZmaFOIGYmVkhTiBmZlaIE4iZmRXiBGJmZoU0JYFI\n6iVpgqRJ+W/PdpYblZeZJGlU2fyRkh6R9LCkmyT1blz0ZmYGzauBnAjcGhHrA7fm6feR1As4GdgW\n2AY4WVJPSd2B84CdImIz4GFgTMMiNzMzoHkJZDgwLj8fB4yosszuwISImBMRc4EJwB6A8mNFSQJW\nAZ6rf8hmZlaue5PK7RsR0/Pz54G+VZbpD0wpm54K9I+IeZKOAh4BXgMmAV+uZ7BmZragutVAJN0i\n6dEqj+Hly0VEALEI610WOArYAliT1IT1jQ6WHy2pTVLbrFmzin0YMzNbQN1qIBGxa3uvSZohqV9E\nTJfUD5hZZbFpwI5l0wOA24HN8/qfyuu6kip9KGVxjAXGAgwePPh/iWriDw+p9aOYmVkVzeoDGQ+U\nRlWNAq6tsszNwNDccd4TGJrnTQM2ltQnL7cb8Hid4zUzswrN6gM5E7hS0uHAZOCzAJIGA0dGxBER\nMUfS94D78ntOjYg5ebnvAndKmpfff2ijP4CZWVen1AXRNQwePDja2tqaHYaZ2RJF0sSIGFw532ei\nm5lZIU4gZmZWiBOImZkV4gRiZmaFOIGYmVkhTiBmZlZIlxrGK2kW6byRonoDL3RSOIujFeJohRig\nNeJohRigNeJohRigNeJohRigc+JYOyL6VM7sUglkcUlqqzYWuivG0QoxtEocrRBDq8TRCjG0Shyt\nEEO943ATlpmZFeIEYmZmhTiBLJqxzQ4ga4U4WiEGaI04WiEGaI04WiEGaI04WiEGqGMc7gMxM7NC\nXAMxM7NCnEDMzKwQJxCrmaRm3T+mQ5JU/tfMGsMJxGoiqTfwpKRezY6lio0AIiKcRKzZmv0blNSj\n7HldD/qcQAqS1D3fzx1JG0vq1uyY6ikiXgC+AtyTbzHcdEq6A9dKuhRaM4k0Ix5Jqze6zIUpqylu\nVO8yqsxvyL5OkiKPTJK0gaQVG1FuWfmrAJ+R1EvSJ/Pzuv3+WrJJYgmxM7CJpAHAx4EdgHeaFYyk\nbYEpQLeImFKPMiLiOknzgTZJgyNibj3KWQTLRMR8YH1JT0o6OyK+Xkoi0YQhhqVyJQ0C5gPPRcS7\njYxH0heBzSR9A3ilGduhmrxd9gQukDQiIh7qzPVX7LwPBN4FekTEuIh4tzPLqlY2pM+Yp48F9gBG\nAa/Vs+yyGLpHxMv5oOoe0v5oy3p+/66BFHcnMBQ4DDg9It5sViCSvgb8APgycJ6ktetVVkTcCIwh\n
JZGm1kQi4h0ASXsAfwa+JOn8/FpTaiK53E8CtwPnAf+Q1DfPr/v/m6QvAF8AfhgRLwMfqHeZtZK0\nOfBj4DMR8ZCkfpJW6qztUrbzPpq0DeYD35R0QGesfyG6VSSv/YD9ImK6pDUkrVHPwiX1Af6YJ6cD\nPYGp+W/damBOIMX1Bc4GrgC2kPSxsip6w7arpG2AvSNiCNAHeBt4tp5tn2VJ5O/N7hORtB/wM+AC\nYE9gqKRfQHOSSG6e+QwwMiI+A9xNamJbqR5HweWfL//uPgb8P+BtSV8GbpR0TGeXW9AywFVAv1w7\nuhG4BNisswqQtCqwdUTsCKwPPAFcIaluiTTvvK8u+y66kQ5o9pL0LeAa4HRJG9YrhoiYBYyUtCOp\n9rFBjuGXkjbJteCNJC3XmeU6gRSQ/zG/R/qijgNWJR1xfEjSIcC+DYih9GNdhrQj/yqwFnBoPhIa\nImmlepWfk8gJwC2NTJhVvAv8JiL+ExF3AEOAEZJ+nuNsVLNRN0mrAb8ENgFezeUfAzwJfLcOZS4L\n7JqffwX4KHAbaSf9E1Lt40fAPnkQRFNI2ioflT9B+o0eSboq9jDgeeAji7Huyt9eN2BFSRcCg4HP\n5Zrq5yTV5YKCeee9P7BbPqD6J7AmMBp4iLSPeAWo68FMRLxOqnH8O8+6ALgXOEvSd4FTgc7tk4kI\nPxbhAYwE2oA183Q3Ul/SacCvgWeBDzcgjtXy31WAfwCPl702GrgOWKUBcazUwG2vKvP2Ah4htXWX\n5p0LPE2qJS7wnnrERGrCgDQibAJpwEHvPO9g4LQ6lL183kncnbfBoDx/cOl7AXYhJZWGfU8V22Vb\nUg3xUWBolW31APDxTihvY2C5/PxoYBawQZ4+BHgYGFDnzzwceAZYOU+vkP/unT/n2g3a9nsAk4BV\n8/Ro4Pp67Jca9oNaGh55h/QDUvPNeqQj8PuAX+TX1wLWaEAcRwG3At8G1iU1mfyG1Ob+NeB+YNNm\nb69O/swqe35UThIHkY7qvg88Tqp9HA1cDvRpVEz5H/YSUi1j+7wzu410QPEV4F/AsDrFsAOphnMx\nsGwpkZJqpl/LiWWzJn1nQ4H/AoeSakLXAYfn13YmHR2PKLjuLYCv5udfAh4D/pL/F9YjHfU/BZyf\n/x/qflCXY9kzl9szT48k1UI2afC23yv/T/TK08vVoxxfC6tGuXNyEHAD8HvgQdI/xG3Az4EjIuKZ\nBsSxNWmHeRrpH+dRUoftDODzpBvHXB8R/6p3LM2Q23jPAMaTEvabwPGkpLIBaefxjYh4uEHx7Aac\nSdphfYF09Ll3/p5+QOrI/HlE3FOHsnuTksZ84CxSM8mZkTpu1wIGAnMi4vHOLrvG+I4F5kbEr3PT\nzieAY0nJ5EZgvYj416KOUEXE9VUAAAr2SURBVMvNt7sCXyclh/8DvkhqRt6C1IR0ObA5advMjojF\nuZHcIskjzc4lNSkuD3SPiKmNKr8sjuGkg5otAaIefXBOIAuX+zW2BC6IiP9I6kv6x3g7jwA6A9g1\nIubUOY5dgdVItZyf5tFWJwCzgd9HxGP1LL/ZJB0MHAMcFmkUz2Dgs6Sj7dMjYq6kHhHxdgNjGk3q\nC+tHSuqfjYjJuX9iI+Ac4E/AuIjotOGcuR/uk6Tax+OkGtC4PP0W6Uj8oxHxameVWSDGY0nfzyci\nYl4eiTQWCODsiLirwDpXJx3dPyHp+6QmuqkRsU9+/WDSsPoHgCvr/T/ZQZwjgJOAbRYlOdYhjpXq\n+RtwJ3oHyjroDiEd3c/O07OB+XnncQ4wqgHJ4/OkHcSnSSM6tsxHVacDawP7dvYIi2arMoLqdmAd\n4HCAiGgjjYJbjjRcszswr5Exko4wrwJOJo2Gm5yPQI/JtaAzSE1cPTpYxyKRtD/paHs00AsYkpPT\nEaRaSB/gwEYmj7IRiNtIOljSx4BLSf1BF+b/pdVJyWMKqaZYxK
rATyX9mtS/ch4wMA8iISIuJTUr\nb0gTz8uKiGuAnZqZPHIcdf0NuAZSobw6LWm1iHgxP7+O1Cm1Q57uDmwKvBoRk+oc006k801OiYj/\n5n+Wz5OazdqUzoiPiHi+nnE0UsX3MIY0sukRYCKpGfGsiDgrv745MC3SaJi6xyRpe6A/8Byp7X0s\n6YS9z+fv6ufA0RFxU37fByLijU6KYSVS38JkYCvSiL+9ImK+pHUi4mmlE8rmd0Z5ixjbMFItrI00\nsGRZ0miwA3Osq+R4dyM1Bx8Hiz5STtLZpOR5QkT8PCfsLwK3RcR5eZlVIp0HY/XUyI6dJelB+oH+\ngTQsc1iedw0woYExLEP6J/wx6Z/yc8Cy+bUxpJ3IFs3eVnXeBl8C7gAGAHNIR/SfBqYBpzYhnr1J\nR7jH5biOAj5EGnN/E6k565Ol7y//7ZSRYHlbHJPLfBm4pey1L5D6QerSWdpOPKsBA0ufkdSR/4k8\nvTbwLdJBT2m6J7AjaTjvRotR7nqkkW0PkIbpQkpQ9wIHNfs325UevpRJFflI6ljSkdMuwC6S+kXE\nCEn/lHRNRIxoQCi9I2Jmbkv+BmmEz2RJ90bqA5kHvNSAOJpC6bo+W5LG2O9H2nEPIo2GOxo4U9J5\npI7iulSlJa0AvB3pCH+FHMtuwO7k5qtINZ9P5ZPYekTErFxbeRc651wUpcuTHAp8OiKmKV0qZWNJ\nA4FPkY7AD4iItxa3rBrjWY7UfPqcpN9GxDO5j2Mr4C7S4IEHyedERWra659j3ScWo2M/Ip4kXdjz\nRVJz7ouk7+Jt0pBmaxA3YVXIzRNbAfMiVY9XIA05PAA4OCLekbR21HlUh6QvkXZWM4BnIuL4fDLQ\nqqRLFvytXjvNVpJ3VBsCP46InXJb+4vAicBlEfFKHctehTQ8ehxpHH03UnPVbNK5Fp+PiCeVLl3y\nXEQ8UKc4PgD8jtQ0NpG0U+5PSii3kXae340GD6LI/yuH814z3ibAKcCFEXFVfv1kUmJ7ofRZopOa\n8/L69gB+SLre1OGN3gZdnWsgZfIO40DSTno9SXdH6gj9c+532AJoa0Dy2JN0tu7ngDeAyyWNjYjR\nkn5CGmt+H2kI61ItIt6S9DrQXdKmpKaQm4Ab6pk8ctkvS7qB9F28FRE3SbqLdP7NkTl5DCENSx1Z\nxzjeyHGcSTqyf5x0fsXlpB32vGhgn0epwzwi7pYUpO3zRdKw9vOB8yUNJR14fS0iXij1H3Vm8sgx\n3CTp/vS0vn1gtiAnkEzSxpHGpE8kjfT5J3CMpN8BK5CSSt3Hckv6P1Kz1LVl1fyPSbpL0pakpqwV\nookXb2yCZ0l9DD8iXSJivwYk8W6RLoFxDSlpHZt3nLeT2v7PUDonZW/guIi4v57xkIbpPgA8FRFz\nlC4QuA2pFaGhySMiQtLakmZExD2SXiP1Cc0HLiOd3DgA+GlEPFw+IKIeImJmvdZtHXMTFiBpO9LJ\ngWcAfwUuIrWltpGOrl4mddh26uWnq8RxFOkM0j+SmmiGRMSM/NovSePab61nDK1K6byKNYB3I2Ja\ng8ocAXyHdImKIaRLc59JOrjYnDR8+MVII+Eacrn2PBz2MFIf0MiIeLTeZZaXHemifHuTTt58nNR8\ndTHppMWvk87CHhd1uqWAtZYuXwNRunvXFNKoni+SLu52L+kkrYtIQyZ71LtzMv9THgV8KiKelbQO\n6VLgx5COgLchjbLpkiJiHul7aog8NPgUYP+ImCLp96Tv4IukPocbyhNGA/ujliddQPKzi9MRvSgk\nLR8Rb+bk8TFSv8YnSU15h/HeJX7OJR34dPn9SlfRpU8kzDWPk0jNUwfx3vXzJ5E6BA8gDcVsxMiW\nNUlnkz+bm09OJiWMLUhXKz0oIv7bgDgseYs0imiIpG+TLr3Rm3SS3tfz84aLdMXV3zQwefQDDlK6\n0jCkzz2aNDpuW9JIrC1Jl8
yYDnwhIp5uRGzWfF39SGFKfowjXdX0euDliLha0jvA7bkdvBEmky5D\n/seIeCLPm0m6TMPJDYrB3jOF1IQ5inTflz+SruX0NPBwMztsG1XbkfRBYB/g70BI+khEjM99Qb8g\nXVLmEUm7k/qFeroju2txHwgg6SOkCxSuTLqKa91u/NJBDKuQ2pW7k/pfViW1cx8QdT7T3dqnfG0t\npYsjjgO+0hX6oXKSOIh0Xal/5r8vkGrJE3OTXg9S09VPgKMiXVrGuhAnkEzpIm27kC6BvX804Mq6\nVWLoR+qw3Zs0Euv70aCrylp1krqROswvAM6IiGubHFJDSTqO1Gw3k3S14xmkc1KmAr8iNfn+IiL+\n1LQgrWmcQCpIWjZ32DYzhh4A0cCrylr7JK0IrB7pOlMNGW3VCnLT1DdJfaWzSINLNiAljz/mIbqr\nRsRLXWm72HucQMxsAblGfjUwOp8f9WXSJetnkc7Cf5Z075G6nsxpra1Lj8Iys3bNI/XHlUabjSU1\nZQ0j3WHxCicPcwIxswVExFzgSmBHSZvkZt2rgddJycN9c+YmLDOrTtIA0pUYtiFde21f4MsRcUtT\nA7OW4QRiZu2StDKwHenE2okRcUeTQ7IW4gRiZmaFuA/EzMwKcQIxM7NCnEDMzKwQJxAzMyvECcTM\nzApxAjFrcZJ2lPTnZsdhVskJxKzF5CsAm7U8JxCzTiTpeElfzc/PlfTX/HxnSb+VNFLSI5IelXRW\n2ftelXSOpIeA7STtIenfku4n3dSptNwQSQ/mxwP5RD+zpnACMetcd5HuXAjpqrUrSVo2z/sP6TbF\nO5PuMbK1pBF52RWBeyPiI6Q7IV5IunDhVsAaZev/OulyIpvndb5R349j1j4nELPONRHYKt9h8i3S\n7WAHk3b2L5JukzwrIuYDvwV2yO97h3TbXIANgacjYlK+x8ZlZeu/G/hRruWsltdj1hROIGadKF+1\n9mngUOAeUo1kJ2A94JkO3vpmRLxTw/rPBI4APgDcLanht182K3ECMet8d5Gamu7Mz48EHiDdW3yI\npN65o3wkUO3ihP8GBklaN0+PLL0gad2IeCQiziJdIdcJxJrGCcSs891Funvf3yNiBvAmcFdETAdO\nBG4DHiJd3XaBe6xHxJvAaOD63Ik+s+zlo3MH/MOkmz7dWN+PYtY+X43XzMwKcQ3EzMwKcQIxM7NC\nnEDMzKwQJxAzMyvECcTMzApxAjEzs0KcQMzMrBAnEDMzK+T/A0iz33g7KKJzAAAAAElFTkSuQmCC\n",
- "text/plain": [
- ""
- ]
- },
- "metadata": {
- "tags": []
- }
- }
- ]
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Sample 11: last 1000 words (only part used by the model)\n",
+ "--------------------------------------------------\n",
+ "The film starts out with a narration of the protagonist explaining certain crimes occurring all over the city and then we get to know that the hero is a cop who is either suspended or has probably retired. I did not have the patience or the interest to verify the above before commenting. If there is a stereotype for narrators to have a deep, sleep-inducing voice then, it is high time to put an end to it. I seriously fell asleep and did not bother to shut the movie down either. Am still trying to figure out what the movie was all about and why there were no outdoor shootings. A third rate TV Serial will have more number of sets compared to this crap of a movie and I still pity the actors and producers involved in this huge bullshit of a movie. It ought to have been produced as a normal TV serial or maybe even as a local theater drama instead of putting it out on the big screen. Total waste of time and money. The movie was supposed to be in production for a long time and it would have been better to have left it that way.With redundant sleep inducing dialogs and sets, this is the worst movie I have come across.\n",
+ "--------------------------------------------------\n",
+ "1/1 [==============================] - 0s 347ms/step\n",
+ "Probability(positive) = 0.07630403\n",
+ "True class: negative\n",
+ "5000/5000 [==============================] - 63s 13ms/step\n"
+ ]
},
{
- "cell_type": "markdown",
- "metadata": {
- "id": "3tdpfNvHcaDB",
- "colab_type": "text"
- },
- "source": [
- "We have used the LIME interpretation to provide explanations for a recurrent neural network. Looking at the graph we understand that the sentence is negative and the word \"worst\" affects it the most.\n",
- "\n"
+ "data": {
+ "image/png": "iVBORw0KGgoAAAANSUhEUgAAAZAAAAEtCAYAAAAm6zZnAAAABHNCSVQICAgIfAhkiAAAAAlwSFlz\nAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4xLjMsIGh0\ndHA6Ly9tYXRwbG90bGliLm9yZy+AADFEAAAgAElEQVR4nO3dedxUZf3/8ddbEM0dAhFBxK9Lamou\nqJklrrgUQqYlbmgaaVG55E/LSjM1Lc20ssK0ULM0M8XcQnNLy7xxNzM0RUAEBNw30M/vj+uaHIe5\nb4bDPQvc7+fjMY97zpkz5/rMmbnP51zLOUcRgZmZ2aJaptkBmJnZkskJxMzMCnECMTOzQpxAzMys\nECcQMzMrxAnEzMwKcQKxBUg6RdJlLRBHX0l3SnpF0jnNjqeVSDpQ0l9qXPZQSX+rd0xVyh0o6VVJ\n3Rpc7u2SjmhkmV2VE0gLkfRxSfdIeknSHEl3S9q62XEtCkljJLVJekvSbype6yHpKknPSApJOy5k\ndaOBF4BVIuK4xYzrN5JOW5x1tJKI+G1EDO2MddVrhxsRz0bEShHxTmevuxEkDcq/0+5VXnvfQVZe\nbmb5spKWzfOibN7tkt7MibX0uK7+n6Y+nEBahKRVgD8DPwF6Af2B7wJvNTOuAp4DTgMubuf1vwEH\nAc/XsK61gX9FC5ztWm0nYlZhLrBn2fSeeV6lMTmxlh7DGhNe53MCaR0bAETE7yLinYh4IyL+EhEP\nA0haV9JfJc2W9IKk30parfTmfFR/vKSHJb0m6aLcBHRjbgK6RVLPvGzpyGq0pOckTZf09fYCk/TR\nXDN6UdJDHdUcIuLqiLgGmF3ltbcj4scR8Tegw6PSXHsZBfy/fJS2q6RlJJ0o6am8Ha6U1KvsPX+Q\n9Hyuwd0p6cN5/mjgwLJ1XZfnh6T1ysss1VIk7ShpqqQTJD0P/DrP/5SkB/O2uEfSZmXvP0HStLy9\nn5C0S5XPtU5+7zJ5+kJJM8tev1TS0fn5qvl7nJ7Xe1qpOaiyWUrS0FzmS5IukHRHZa1C0tmS5kp6\nWtKeed7pwCeAn+Zt81Ml5+aj55clPSJpk3a+p3X0XjPjLZJ+VjoyLz+Cl/Q5SW0V7z1G0vj8fLkc\n37OSZkj6haQPVHwXx+WYpks6rFo8ZdaV9M8c/7Wl34mk6yV9pSKOhyV9eiHrq8WlwCFl04cAl3TC\neluWE0jr+A/wjqRxkvYs7ezLCPg+sCawEbAWcErFMp8BdiMlo2HAjcA3gT6k7/qrFcvvBKwPDAVO\nkLRrZVCS+gPXk2oVvYCvA3+U1KfYx6xNRBwK/Bb4QT5KuwX4CjACGELaDnOBn5W97UbS51kduD+/\nn4gYW7GuWo/41iB95rWB0ZK2INWsvgh8EPglMD7v/D4EjAG2joiVgd2BZ6p8rqeBl4Et8qwdgFcl\nbZSnhwB35Oe/AeYD6+XlhwILNDVJ6g1cBXwjx/UE8LGKxbbN83sDPwAukqSIOAm4i/eOisfkcnYg\n/Y5WBT5LlQOC7HLgn7ncU4CD21nuOuBDktYvm3dAfj/Ambm8zfPn7Q98p2zZNXIs/YHDgZ9V+R8p\ndwjweaAfaRuen+ePI9WAAZD0kbzO6ztYV62uAXaQtFqO7RPAtZ2w3pblBNIiIuJl4ONAABcCsySN\nl9Q3v/5kREyIiLciYhbwI9LOptxPImJGREwj7RTujYgHIuJN4E+8t9Mq+W5EvBYRj5COsEdWCe0g\n4IaIuCEi3o2ICUAbsFfnfPJFciRwUkRMjYi3SDusfZWblyLi4oh4pey1j0hadTHKexc4OW/zN0h9\nMr+MiHtzLXEcqYnxo6Qa1XLAxpKWjYhnIuKpdtZ7BzBE0hp5+qo8vQ6wCvBQ/t73Ao7O39FM4Fxg\n/yrr2wt4LNf+SjvLyibCyRFxYe6PGEfasf
ZtJ755wMrAhoAi4vGImF65kKSBwNbAd3Lt8m/A+Gor\njIjXSTvTkfm96+f1j5ck0rY9JiLmRMQrwBkVn3UecGpEzIuIG4BXgQ+1Ez/ApRHxaES8Bnwb+Gyu\nvY0HNihLZAcDV0TE2x2sq1ZvkhLl5/JjfJ5X6fxcCy09vtcJZTeFE0gLyf+oh0bEAGAT0lH2j+F/\nI5J+n5syXgYuIx1NlptR9vyNKtMrVSw/pez55FxepbWB/cp/8KRE128RP15nWBv4U1kcj5N23H0l\ndZN0plLz1su8d/RfuY0WxaycfMvLP65iW6wFrBkRTwJHkxLXzPxdVduekBLIjqSj/DuB20kHA0OA\nuyLi3VzWssD0srJ+SapdVVqTsu8y9xlNrVjm+bLXX89PK38Ppdf/CvyUVLubKWmsUh9dtXLnlK0P\n3v+bqnQ57x2kHABck9/bB1gBmFj2WW/K80tm5+RY8np78VeJYzJpW/bO3+cVwEFKzYgjSU1PneUS\nUu2no+arr0bEamWPb3di+Q3lBNKiIuLfpCaMUtvzGaTayaYRsQqpZqDFLGatsucDSR3glaaQjubK\nf/ArRsSZi1l2EVOAPStiWT7XuA4AhgO7kpo6BuX3lLZRtY7410k7rpI1Kl6vfM8U4PSK8leIiN8B\nRMTlEfFx0s4/gLPa+Rx3kJo3dszP/wZsz/ubr6aQaje9y8paJSI+XGV904EBpYl8RD+gynLtWWDb\nRMT5EbEVsDGpaen4dsrtJal8G65VZbmSCUAfSZuTdtyl5qsXSAc4Hy77rKtGREcJYmEqf9vzcjmQ\namAHArsAr0fE3xejnEp38V7truFDpxvNCaRFSNowdxIOyNNrkf7J/pEXWZlUbX8p90tU+4deVN+W\ntIJSZ/NhpCOzSpcBwyTtno/yl8+dmlV3ULnDdHmgG1Bavnxo43L5dYAe+fVaE+EvgNMlrZ3X1UfS\n8PzayqQd7mxSUjij4r0zgP+rmPcgcED+XHuwYJNgpQuBIyVtq2RFSZ+UtLKkD0naWdJypGaLN0hN\nYAuIiEn59YOAO3Lz5QxSH9YdeZnpwF+AcyStojSAYF1J1WK8HthU0oi8rb/MgsmwI+/bNpK2zp9x\nWeC1/HkW+CwRMZnUnHmK0hDt7Uh9b1VFxDzgD8APSX1LE/L8d0nb9lxJq+cY+kvafRE+Q6WDJG2c\nk9upwFWl4cQ5YbwLnENttY/l8u+09Gh3v5lrf8OAvfPzpZoTSOt4hdTRea+k10iJ41GgdP7Dd4Et\ngZdIO4yrO6HMO4AngVuBsyNigRPTImIK6cj+m8As0pHx8bT/2/kWaed4ImkH+UaeV/JEntcfuDk/\nX7vGeM8jtSv/RdIrpG20bX7tElJTxTTgX7yXeEsuIvVPvCjpmjzva6R/9hdJR6TX0IGIaAO+QGre\nmUvadofml5cjdQS/QGouWp3Uqd2eO0jNMlPKpkXq/C85BOiRP89cUl/JAk2HEfECsB+pc3w2qdbQ\nRu1DwM8j9SXNlXQ+qR/mwlzm5LzOH7bz3gOB7fIyp5EOQjoq93JSLfEPFU1SJ5C25z9yE+QtdNzH\nsTCXkmrwzwPLs+AAkkuATUkHSAvzKul3Wnrs3NHCEfFYRDzWwSKlEW+lx8QaYmhJ6gJJ0ipIGgQ8\nDSxb8U9sS4F8hDwVODAibmtw2VcA/46IkxtZ7qKSdAgwOjc5WkGugZgtBXIT42q5Ce2bpNpMZS2s\nHuVunZvWlsnNgMNZSE2u2XKz1peAsc2OZUnnBGK2dNgOeIrUhDYMGJGHHtfbGqRRZK+Shg8fFREP\nNKDcQnK/yixSv8/lC1ncFsJNWGZmVohrIGZmVogTiJmZFdKlrjDau3fvGDRoULPDMDNbokycOPGF\niFjg+nddKoEMGjSItra2hS9oZmb/I2lytfluwjIzs0KcQMzMrBAnEDMzK8QJxMzMCnECMTOzQpxA\nzMysEC
cQMzMrxAnEzMwKaeqJhPnyz+eR7l73q8rbpOZLU18CbEW6Yc3nIuIZSbuRbt7TA3gbOD7f\nx3mJ8+ypmzaknIHfeaQh5ZhZ19G0GoikbsDPgD1Jd1AbKWnjisUOB+ZGxHrAubx3j+kXgGERsSkw\nitpuS2lmZp2omU1Y2wBPRsR/I+Jt4Pekm9GUGw6My8+vAnaRpIh4ICKey/MfAz6QaytmZtYgzUwg\n/Un31y6ZmudVXSbfevUl4IMVy3wGuD8iar3/s5mZdYIl+mKKkj5MatYa2sEyo4HRAAMHDmxQZGZm\nS79m1kCmAWuVTQ/I86ouI6k7sCqpMx1JA4A/AYdExFPtFRIRYyNicEQM7tNngasRm5lZQc1MIPcB\n60taR1IPYH9gfMUy40md5AD7An+NiJC0GnA9cGJE3N2wiM3M7H+alkByn8YY4GbgceDKiHhM0qmS\n9s6LXQR8UNKTwLHAiXn+GGA94DuSHsyP1Rv8EczMurSm9oFExA3ADRXzvlP2/E1gvyrvOw04re4B\nmplZu3wmupmZFeIEYmZmhTiBmJlZIUv0eSDWObb/yfYNK+vur3jQnNnSwjUQMzMrxAnEzMwKcROW\ntYQ7dhjSsLKG3HlHw8oyW5q5BmJmZoU4gZiZWSFOIGZmVogTiJmZFeIEYmZmhXgUllmLOf2gfRtW\n1kmXXdWwsmzp4xqImZkV4gRiZmaFOIGYmVkhTiBmZlaIE4iZmRXiUVhm1rJOOeWUlijryj9s07A4\nPrvfP6vO/8hVNzcshof23b2m5VwDMTOzQpxAzMysECcQMzMrxAnEzMwKcQIxM7NCnEDMzKwQJxAz\nMyvECcTMzApxAjEzs0KcQMzMrBAnEDMzK6SpCUTSHpKekPSkpBOrvL6cpCvy6/dKGlT22jfy/Cck\n1XbhFjMz6zRNSyCSugE/A/YENgZGStq4YrHDgbkRsR5wLnBWfu/GwP7Ah4E9gAvy+szMrEGaWQPZ\nBngyIv4bEW8DvweGVywzHBiXn18F7CJJef7vI+KtiHgaeDKvz8zMGkQR0ZyCpX2BPSLiiDx9MLBt\nRIwpW+bRvMzUPP0UsC1wCvCPiLgsz78IuDEirqpSzmhgNMDAgQO3mjx5MgBbHX9J/T5chYk/PKRh\nZdni+elx1zWsrDHnDGtYWUU8fvpfG1bWRift3LCybNFJmhgRgyvnL/Wd6BExNiIGR8TgPn36NDsc\nM7OlRjMTyDRgrbLpAXle1WUkdQdWBWbX+F4zM6ujZiaQ+4D1Ja0jqQepU3x8xTLjgVH5+b7AXyO1\nuY0H9s+jtNYB1geq38bLzMzqomm3tI2I+ZLGADcD3YCLI+IxSacCbRExHrgIuFTSk8AcUpIhL3cl\n8C9gPvDliHinKR/EzKyLauo90SPiBuCGinnfKXv+JrBfO+89HTi9rgGamVm7lvpOdDMzqw8nEDMz\nK8QJxMzMCnECMTOzQpxAzMysECcQMzMrxAnEzMwKcQIxM7NCnEDMzKwQJxAzMyvECcTMzApxAjEz\ns0KcQMzMrJCmXo3XzFqXbzNrC+MaiJmZFeIEYmZmhTiBmJlZIU4gZmZWiBOImZkV4gRiZmaFOIGY\nmVkhPg/ErMyYc4Y1OwSzJYZrIGZmVogTiJmZFeIEYmZmhTiBmJlZIU4gZmZWiBOImZkV4gRiZmaF\nNCWBSOolaYKkSflvz3aWG5WXmSRpVJ63gqTrJf1b0mOSzmxs9GZmBs2rgZwI3BoR6wO35un3kdQL\nOBnYFtgGOLks0ZwdERsCWwDbS9qzMWGbmVlJsxLIcGBcfj4OGFFlmd2BCRExJyLmAhOAPSLi9Yi4\nDSAi3gbuBwY0IGYzMyvTrATSNyKm5+fPA32rLNMfmFI2PTXP+x9JqwHDSLUYMzNroJquhSVpXWBq\nRLwlaUdgM+CSiHixg/fcAqxR5aWTyiciIiRF7SH/b/3dgd8B50fEfztY
bjQwGmDgwIGLWoyZmbWj\n1hrIH4F3JK0HjAXWAi7v6A0RsWtEbFLlcS0wQ1I/gPx3ZpVVTMvllAzI80rGApMi4scLiWNsRAyO\niMF9+vRZ2Oc0M7Ma1ZpA3o2I+cCngZ9ExPFAv8UodzwwKj8fBVxbZZmbgaGSeubO86F5HpJOA1YF\njl6MGMzMbDHUmkDmSRpJ2tn/Oc9bdjHKPRPYTdIkYNc8jaTBkn4FEBFzgO8B9+XHqRExR9IAUjPY\nxsD9kh6UdMRixGJmZgXUej+Qw4AjgdMj4mlJ6wCXFi00ImYDu1SZ3wYcUTZ9MXBxxTJTARUt28zM\nOketCWS3iPhqaSInkTfrFJOZmS0Bam3CGlVl3qGdGIeZmS1hOqyB5H6PA4B1JI0ve2llYE49AzMz\ns9a2sCase4DpQG/gnLL5rwAP1ysoMzNrfR0mkIiYDEwGtmtMOGZmtqSoqQ9E0j75irgvSXpZ0iuS\nXq53cGZm1rpqHYX1A2BYRDxez2DMzGzJUesorBlOHmZmVm5ho7D2yU/bJF0BXAO8VXo9Iq6uY2xm\nZtbCFtaENazs+euk61GVBOAEYmbWRS1sFNZhjQrEzMyWLLXeD+T8KrNfAtry5dnNzKyLqbUTfXlg\nc2BSfmxGuj/H4ZI6vB+HmZktnWodxrsZsH1EvAMg6efAXcDHgUfqFJuZmbWwWmsgPYGVyqZXBHrl\nhPJW9beYmdnSbFFOJHxQ0u2ke3HsAJwhaUXgljrFZmZmLaymBBIRF0m6Adgmz/pmRDyXnx9fl8jM\nzKylddiEJWnD/HdL0j3Qp+THGnmemZl1UQurgRwLjOb9l3IvCWDnTo/IzMyWCAs7kXB0/rtTY8Ix\nM7MlRa2Xc19B0rckjc3T60v6VH1DMzOzVlbrMN5fA28DH8vT04DT6hKRmZktEWpNIOtGxA+AeQAR\n8TppOK+ZmXVRtSaQtyV9gNRxjqR18QmEZmZdWq0nEp4M3ASsJem3wPbAofUKyszMWl+tCWQUcD1w\nFfBf4GsR8ULdojIzs5ZXawK5CPgEsBuwLvCApDsj4ry6RWZmZi2t1kuZ3CbpTmBrYCfgSODDgBOI\nmVkXVesNpW4lXYH376TLuG8dETPrGZiZmbW2WkdhPUw6D2QT0r1BNsmjsgqR1EvSBEmT8t+e7Sw3\nKi8zSdKoKq+Pl/Ro0TjMzKy4mhJIRBwTETsA+wCzSScWvrgY5Z4I3BoR6wO35un3kdSLNPprW9JV\ngE8uTzSS9gFeXYwYzMxsMdR6KZMxkq4AHgCGAxcDey5GucOBcfn5OGBElWV2ByZExJyImAtMAPbI\n8axEutCjz4Y3M2uSWkdhLQ/8CJgYEfM7ody+ETE9P38e6Ftlmf6kS8eXTM3zAL5HukLw650Qi5mZ\nFVDrKKyzF3XFkm4B1qjy0kkV6w5JsQjr3Zx0aZVjJA2qYfnRpEvSM3DgwFqLMTOzhai1BrLIImLX\n9l6TNENSv4iYLqkfUG1E1zRgx7LpAcDtwHbAYEnPkOJfXdLtEbEjVUTEWGAswODBg2tOVGZm1rFa\nR2F1tvGks9vJf6+tsszNwFBJPXPn+VDg5oj4eUSsGRGDgI8D/2kveZiZWf00K4GcCewmaRKwa55G\n0mBJvwKIiDmkvo778uPUPM/MzFpA3ZqwOhIRs4FdqsxvA44om76YNOKrvfU8Qzo3xczMGqxZNRAz\nM1vCOYGYmVkhTiBmZlaIE4iZmRXiBGJmZoU4gZiZWSFOIGZmVogTiJmZFeIEYmZmhTiBmJlZIU4g\nZmZWiBOImZkV4gRiZmaFOIGYmVkhTiBmZlaIE4iZmRXiBGJmZoU4gZiZWSFOIGZmVogTiJmZFeIE\nYmZmhTiBmJlZIU4gZmZWiBOImZkV4gRiZmaFOIGYmVkhTiBmZlaIE4iZmRXiBGJmZoU4gZiZWSFN\nSSCSekmaIGlS/tuzneVG5WUmSRpV
Nr+HpLGS/iPp35I+07jozcwMmlcDORG4NSLWB27N0+8jqRdw\nMrAtsA1wclmiOQmYGREbABsDdzQkajMz+59mJZDhwLj8fBwwosoyuwMTImJORMwFJgB75Nc+D3wf\nICLejYgX6hyvmZlVaFYC6RsR0/Pz54G+VZbpD0wpm54K9Je0Wp7+nqT7Jf1BUrX3AyBptKQ2SW2z\nZs3qlODNzKyOCUTSLZIerfIYXr5cRAQQi7Dq7sAA4J6I2BL4O3B2ewtHxNiIGBwRg/v06VPko5iZ\nWRXd67XiiNi1vdckzZDULyKmS+oHzKyy2DRgx7LpAcDtwGzgdeDqPP8PwOGdEbOZmdWuWU1Y44HS\nqKpRwLVVlrkZGCqpZ+48HwrcnGss1/FectkF+Fd9wzUzs0rNSiBnArtJmgTsmqeRNFjSrwAiYg7w\nPeC+/Dg1zwM4AThF0sPAwcBxDY7fzKzLq1sTVkciYjap5lA5vw04omz6YuDiKstNBnaoZ4xmZtYx\nn4luZmaFOIGYmVkhTiBmZlaIE4iZmRXiBGJmZoU4gZiZWSFOIGZmVogTiJmZFeIEYmZmhTiBmJlZ\nIU4gZmZWiBOImZkV4gRiZmaFOIGYmVkhTiBmZlaIE4iZmRXiBGJmZoU4gZiZWSFOIGZmVogTiJmZ\nFeIEYmZmhTiBmJlZIU4gZmZWiBOImZkV4gRiZmaFOIGYmVkhTiBmZlaIE4iZmRXiBGJmZoU0JYFI\n6iVpgqRJ+W/PdpYblZeZJGlU2fyRkh6R9LCkmyT1blz0ZmYGzauBnAjcGhHrA7fm6feR1As4GdgW\n2AY4WVJPSd2B84CdImIz4GFgTMMiNzMzoHkJZDgwLj8fB4yosszuwISImBMRc4EJwB6A8mNFSQJW\nAZ6rf8hmZlaue5PK7RsR0/Pz54G+VZbpD0wpm54K9I+IeZKOAh4BXgMmAV+uZ7BmZragutVAJN0i\n6dEqj+Hly0VEALEI610WOArYAliT1IT1jQ6WHy2pTVLbrFmzin0YMzNbQN1qIBGxa3uvSZohqV9E\nTJfUD5hZZbFpwI5l0wOA24HN8/qfyuu6kip9KGVxjAXGAgwePPh/iWriDw+p9aOYmVkVzeoDGQ+U\nRlWNAq6tsszNwNDccd4TGJrnTQM2ltQnL7cb8Hid4zUzswrN6gM5E7hS0uHAZOCzAJIGA0dGxBER\nMUfS94D78ntOjYg5ebnvAndKmpfff2ijP4CZWVen1AXRNQwePDja2tqaHYaZ2RJF0sSIGFw532ei\nm5lZIU4gZmZWiBOImZkV4gRiZmaFOIGYmVkhTiBmZlZIlxrGK2kW6byRonoDL3RSOIujFeJohRig\nNeJohRigNeJohRigNeJohRigc+JYOyL6VM7sUglkcUlqqzYWuivG0QoxtEocrRBDq8TRCjG0Shyt\nEEO943ATlpmZFeIEYmZmhTiBLJqxzQ4ga4U4WiEGaI04WiEGaI04WiEGaI04WiEGqGMc7gMxM7NC\nXAMxM7NCnEDMzKwQJxCrmaRm3T+mQ5JU/tfMGsMJxGoiqTfwpKRezY6lio0AIiKcRKzZmv0blNSj\n7HldD/qcQAqS1D3fzx1JG0vq1uyY6ikiXgC+AtyTbzHcdEq6A9dKuhRaM4k0Ix5Jqze6zIUpqylu\nVO8yqsxvyL5OkiKPTJK0gaQVG1FuWfmrAJ+R1EvSJ/Pzuv3+WrJJYgmxM7CJpAHAx4EdgHeaFYyk\nbYEpQLeImFKPMiLiOknzgTZJgyNibj3KWQTLRMR8YH1JT0o6OyK+Xkoi0YQhhqVyJQ0C5gPPRcS7\njYxH0heBzSR9A3ilGduhmrxd9gQukDQiIh7qzPVX7LwPBN4FekTEuIh4tzPLqlY2pM+Yp48F9gBG\nAa/Vs+yyGLpHxMv5oOoe0v5oy3p+/66BFHcnMBQ4DDg9It5sViCSvgb8APgycJ6ktetVVkTcCIwh\n
JZGm1kQi4h0ASXsAfwa+JOn8/FpTaiK53E8CtwPnAf+Q1DfPr/v/m6QvAF8AfhgRLwMfqHeZtZK0\nOfBj4DMR8ZCkfpJW6qztUrbzPpq0DeYD35R0QGesfyG6VSSv/YD9ImK6pDUkrVHPwiX1Af6YJ6cD\nPYGp+W/damBOIMX1Bc4GrgC2kPSxsip6w7arpG2AvSNiCNAHeBt4tp5tn2VJ5O/N7hORtB/wM+AC\nYE9gqKRfQHOSSG6e+QwwMiI+A9xNamJbqR5HweWfL//uPgb8P+BtSV8GbpR0TGeXW9AywFVAv1w7\nuhG4BNisswqQtCqwdUTsCKwPPAFcIaluiTTvvK8u+y66kQ5o9pL0LeAa4HRJG9YrhoiYBYyUtCOp\n9rFBjuGXkjbJteCNJC3XmeU6gRSQ/zG/R/qijgNWJR1xfEjSIcC+DYih9GNdhrQj/yqwFnBoPhIa\nImmlepWfk8gJwC2NTJhVvAv8JiL+ExF3AEOAEZJ+nuNsVLNRN0mrAb8ENgFezeUfAzwJfLcOZS4L\n7JqffwX4KHAbaSf9E1Lt40fAPnkQRFNI2ioflT9B+o0eSboq9jDgeeAji7Huyt9eN2BFSRcCg4HP\n5Zrq5yTV5YKCeee9P7BbPqD6J7AmMBp4iLSPeAWo68FMRLxOqnH8O8+6ALgXOEvSd4FTgc7tk4kI\nPxbhAYwE2oA183Q3Ul/SacCvgWeBDzcgjtXy31WAfwCPl702GrgOWKUBcazUwG2vKvP2Ah4htXWX\n5p0LPE2qJS7wnnrERGrCgDQibAJpwEHvPO9g4LQ6lL183kncnbfBoDx/cOl7AXYhJZWGfU8V22Vb\nUg3xUWBolW31APDxTihvY2C5/PxoYBawQZ4+BHgYGFDnzzwceAZYOU+vkP/unT/n2g3a9nsAk4BV\n8/Ro4Pp67Jca9oNaGh55h/QDUvPNeqQj8PuAX+TX1wLWaEAcRwG3At8G1iU1mfyG1Ob+NeB+YNNm\nb69O/swqe35UThIHkY7qvg88Tqp9HA1cDvRpVEz5H/YSUi1j+7wzu410QPEV4F/AsDrFsAOphnMx\nsGwpkZJqpl/LiWWzJn1nQ4H/AoeSakLXAYfn13YmHR2PKLjuLYCv5udfAh4D/pL/F9YjHfU/BZyf\n/x/qflCXY9kzl9szT48k1UI2afC23yv/T/TK08vVoxxfC6tGuXNyEHAD8HvgQdI/xG3Az4EjIuKZ\nBsSxNWmHeRrpH+dRUoftDODzpBvHXB8R/6p3LM2Q23jPAMaTEvabwPGkpLIBaefxjYh4uEHx7Aac\nSdphfYF09Ll3/p5+QOrI/HlE3FOHsnuTksZ84CxSM8mZkTpu1wIGAnMi4vHOLrvG+I4F5kbEr3PT\nzieAY0nJ5EZgvYj416KOUEXE9VUAAAr2SURBVMvNt7sCXyclh/8DvkhqRt6C1IR0ObA5advMjojF\nuZHcIskjzc4lNSkuD3SPiKmNKr8sjuGkg5otAaIefXBOIAuX+zW2BC6IiP9I6kv6x3g7jwA6A9g1\nIubUOY5dgdVItZyf5tFWJwCzgd9HxGP1LL/ZJB0MHAMcFmkUz2Dgs6Sj7dMjYq6kHhHxdgNjGk3q\nC+tHSuqfjYjJuX9iI+Ac4E/AuIjotOGcuR/uk6Tax+OkGtC4PP0W6Uj8oxHxameVWSDGY0nfzyci\nYl4eiTQWCODsiLirwDpXJx3dPyHp+6QmuqkRsU9+/WDSsPoHgCvr/T/ZQZwjgJOAbRYlOdYhjpXq\n+RtwJ3oHyjroDiEd3c/O07OB+XnncQ4wqgHJ4/OkHcSnSSM6tsxHVacDawP7dvYIi2arMoLqdmAd\n4HCAiGgjjYJbjjRcszswr5Exko4wrwJOJo2Gm5yPQI/JtaAzSE1cPTpYxyKRtD/paHs00AsYkpPT\nEaRaSB/gwEYmj7IRiNtIOljSx4BLSf1BF+b/pdVJyWMKqaZYxK
rATyX9mtS/ch4wMA8iISIuJTUr\nb0gTz8uKiGuAnZqZPHIcdf0NuAZSobw6LWm1iHgxP7+O1Cm1Q57uDmwKvBoRk+oc006k801OiYj/\n5n+Wz5OazdqUzoiPiHi+nnE0UsX3MIY0sukRYCKpGfGsiDgrv745MC3SaJi6xyRpe6A/8Byp7X0s\n6YS9z+fv6ufA0RFxU37fByLijU6KYSVS38JkYCvSiL+9ImK+pHUi4mmlE8rmd0Z5ixjbMFItrI00\nsGRZ0miwA3Osq+R4dyM1Bx8Hiz5STtLZpOR5QkT8PCfsLwK3RcR5eZlVIp0HY/XUyI6dJelB+oH+\ngTQsc1iedw0woYExLEP6J/wx6Z/yc8Cy+bUxpJ3IFs3eVnXeBl8C7gAGAHNIR/SfBqYBpzYhnr1J\nR7jH5biOAj5EGnN/E6k565Ol7y//7ZSRYHlbHJPLfBm4pey1L5D6QerSWdpOPKsBA0ufkdSR/4k8\nvTbwLdJBT2m6J7AjaTjvRotR7nqkkW0PkIbpQkpQ9wIHNfs325UevpRJFflI6ljSkdMuwC6S+kXE\nCEn/lHRNRIxoQCi9I2Jmbkv+BmmEz2RJ90bqA5kHvNSAOJpC6bo+W5LG2O9H2nEPIo2GOxo4U9J5\npI7iulSlJa0AvB3pCH+FHMtuwO7k5qtINZ9P5ZPYekTErFxbeRc651wUpcuTHAp8OiKmKV0qZWNJ\nA4FPkY7AD4iItxa3rBrjWY7UfPqcpN9GxDO5j2Mr4C7S4IEHyedERWra659j3ScWo2M/Ip4kXdjz\nRVJz7ouk7+Jt0pBmaxA3YVXIzRNbAfMiVY9XIA05PAA4OCLekbR21HlUh6QvkXZWM4BnIuL4fDLQ\nqqRLFvytXjvNVpJ3VBsCP46InXJb+4vAicBlEfFKHctehTQ8ehxpHH03UnPVbNK5Fp+PiCeVLl3y\nXEQ8UKc4PgD8jtQ0NpG0U+5PSii3kXae340GD6LI/yuH814z3ibAKcCFEXFVfv1kUmJ7ofRZopOa\n8/L69gB+SLre1OGN3gZdnWsgZfIO40DSTno9SXdH6gj9c+532AJoa0Dy2JN0tu7ngDeAyyWNjYjR\nkn5CGmt+H2kI61ItIt6S9DrQXdKmpKaQm4Ab6pk8ctkvS7qB9F28FRE3SbqLdP7NkTl5DCENSx1Z\nxzjeyHGcSTqyf5x0fsXlpB32vGhgn0epwzwi7pYUpO3zRdKw9vOB8yUNJR14fS0iXij1H3Vm8sgx\n3CTp/vS0vn1gtiAnkEzSxpHGpE8kjfT5J3CMpN8BK5CSSt3Hckv6P1Kz1LVl1fyPSbpL0pakpqwV\nookXb2yCZ0l9DD8iXSJivwYk8W6RLoFxDSlpHZt3nLeT2v7PUDonZW/guIi4v57xkIbpPgA8FRFz\nlC4QuA2pFaGhySMiQtLakmZExD2SXiP1Cc0HLiOd3DgA+GlEPFw+IKIeImJmvdZtHXMTFiBpO9LJ\ngWcAfwUuIrWltpGOrl4mddh26uWnq8RxFOkM0j+SmmiGRMSM/NovSePab61nDK1K6byKNYB3I2Ja\ng8ocAXyHdImKIaRLc59JOrjYnDR8+MVII+Eacrn2PBz2MFIf0MiIeLTeZZaXHemifHuTTt58nNR8\ndTHppMWvk87CHhd1uqWAtZYuXwNRunvXFNKoni+SLu52L+kkrYtIQyZ71LtzMv9THgV8KiKelbQO\n6VLgx5COgLchjbLpkiJiHul7aog8NPgUYP+ImCLp96Tv4IukPocbyhNGA/ujliddQPKzi9MRvSgk\nLR8Rb+bk8TFSv8YnSU15h/HeJX7OJR34dPn9SlfRpU8kzDWPk0jNUwfx3vXzJ5E6BA8gDcVsxMiW\nNUlnkz+bm09OJiWMLUhXKz0oIv7bgDgseYs0imiIpG+TLr3Rm3SS3tfz84aLdMXV3zQwefQDDlK6\n0jCkzz2aNDpuW9JIrC1Jl8
yYDnwhIp5uRGzWfF39SGFKfowjXdX0euDliLha0jvA7bkdvBEmky5D\n/seIeCLPm0m6TMPJDYrB3jOF1IQ5inTflz+SruX0NPBwMztsG1XbkfRBYB/g70BI+khEjM99Qb8g\nXVLmEUm7k/qFeroju2txHwgg6SOkCxSuTLqKa91u/NJBDKuQ2pW7k/pfViW1cx8QdT7T3dqnfG0t\npYsjjgO+0hX6oXKSOIh0Xal/5r8vkGrJE3OTXg9S09VPgKMiXVrGuhAnkEzpIm27kC6BvX804Mq6\nVWLoR+qw3Zs0Euv70aCrylp1krqROswvAM6IiGubHFJDSTqO1Gw3k3S14xmkc1KmAr8iNfn+IiL+\n1LQgrWmcQCpIWjZ32DYzhh4A0cCrylr7JK0IrB7pOlMNGW3VCnLT1DdJfaWzSINLNiAljz/mIbqr\nRsRLXWm72HucQMxsAblGfjUwOp8f9WXSJetnkc7Cf5Z075G6nsxpra1Lj8Iys3bNI/XHlUabjSU1\nZQ0j3WHxCicPcwIxswVExFzgSmBHSZvkZt2rgddJycN9c+YmLDOrTtIA0pUYtiFde21f4MsRcUtT\nA7OW4QRiZu2StDKwHenE2okRcUeTQ7IW4gRiZmaFuA/EzMwKcQIxM7NCnEDMzKwQJxAzMyvECcTM\nzApxAjFrcZJ2lPTnZsdhVskJxKzF5CsAm7U8JxCzTiTpeElfzc/PlfTX/HxnSb+VNFLSI5IelXRW\n2ftelXSOpIeA7STtIenfku4n3dSptNwQSQ/mxwP5RD+zpnACMetcd5HuXAjpqrUrSVo2z/sP6TbF\nO5PuMbK1pBF52RWBeyPiI6Q7IV5IunDhVsAaZev/OulyIpvndb5R349j1j4nELPONRHYKt9h8i3S\n7WAHk3b2L5JukzwrIuYDvwV2yO97h3TbXIANgacjYlK+x8ZlZeu/G/hRruWsltdj1hROIGadKF+1\n9mngUOAeUo1kJ2A94JkO3vpmRLxTw/rPBI4APgDcLanht182K3ECMet8d5Gamu7Mz48EHiDdW3yI\npN65o3wkUO3ihP8GBklaN0+PLL0gad2IeCQiziJdIdcJxJrGCcSs891Funvf3yNiBvAmcFdETAdO\nBG4DHiJd3XaBe6xHxJvAaOD63Ik+s+zlo3MH/MOkmz7dWN+PYtY+X43XzMwKcQ3EzMwKcQIxM7NC\nnEDMzKwQJxAzMyvECcTMzApxAjEzs0KcQMzMrBAnEDMzK+T/A0iz33g7KKJzAAAAAElFTkSuQmCC\n",
+ "text/plain": [
+ ""
]
- },
- {
- "cell_type": "code",
- "metadata": {
- "id": "A3JGXJF2aIFJ",
- "colab_type": "code",
- "colab": {}
- },
- "source": [
- ""
- ],
- "execution_count": 0,
- "outputs": []
+ },
+ "metadata": {
+ "tags": []
+ },
+ "output_type": "display_data"
}
- ]
-}
\ No newline at end of file
+ ],
+ "source": [
+ "# We choose a sample from the test set\n",
+ "idx = 11\n",
+ "text_sample = test_texts[idx]\n",
+ "class_names = ['negative', 'positive']\n",
+ "\n",
+ "print('Sample {}: last 1000 words (only part used by the model)'.format(idx))\n",
+ "print('-'*50)\n",
+ "print(\" \".join(text_sample.split()[-1000:]))\n",
+ "print('-'*50)\n",
+ "print('Probability(positive) =', pipeline.predict_proba([text_sample])[0,1])\n",
+ "print('True class: %s' % class_names[test_labels[idx]])\n",
+ "\n",
+ "\n",
+ "\n",
+ "import matplotlib.pyplot as plt\n",
+ "import seaborn as sns\n",
+ "%matplotlib inline\n",
+ "from collections import OrderedDict\n",
+ "from lime.lime_text import LimeTextExplainer\n",
+ "\n",
+ "explainer = LimeTextExplainer(class_names=class_names)\n",
+ "explanation = explainer.explain_instance(text_sample, pipeline.predict_proba, num_features=10)\n",
+ "\n",
+ "weights = OrderedDict(explanation.as_list())\n",
+ "lime_weights = pd.DataFrame({'words': list(weights.keys()), 'weights': list(weights.values())})\n",
+ "\n",
+ "sns.barplot(x=\"words\", y=\"weights\", data=lime_weights);\n",
+ "plt.xticks(rotation=45)\n",
+ "plt.title('Sample {} features weights given by LIME'.format(idx));"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {
+ "colab_type": "text",
+ "id": "3tdpfNvHcaDB"
+ },
+ "source": [
+ "We have used the LIME interpretation to provide explanations for a recurrent neural network. Looking at the graph, we understand that the sentence is negative and that the word \"worst\" affects it the most.\n",
+ "\n"
+ ]
+ }
+ ],
+ "metadata": {
+ "accelerator": "GPU",
+ "colab": {
+ "name": "Lime_RNN.ipynb",
+ "provenance": []
+ },
+ "kernelspec": {
+ "display_name": "Python 3",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.7.4"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 1
+}
From e60001c89b2c9edd183d68944a60924322a825b8 Mon Sep 17 00:00:00 2001
From: jatinpapreja <47968703+jatinpapreja@users.noreply.github.com>
Date: Thu, 10 Jun 2021 12:52:55 +0530
Subject: [PATCH 3/4] [Ch4Nb10] Fixed path issues
1. Specified the version for tensorflow installation.
2. Added try block for windows and colab users and specified the path for downloading files for windows users.
---
Ch4/10_ShapDemo.ipynb | 375 +++++++++++++++---------------------------
1 file changed, 132 insertions(+), 243 deletions(-)
diff --git a/Ch4/10_ShapDemo.ipynb b/Ch4/10_ShapDemo.ipynb
index 93c3e3e..706a8c4 100644
--- a/Ch4/10_ShapDemo.ipynb
+++ b/Ch4/10_ShapDemo.ipynb
@@ -3,7 +3,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "q53fZJ-eqcgX"
},
"source": [
@@ -12,43 +11,20 @@
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 1,
"metadata": {
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 187
- },
- "colab_type": "code",
- "id": "2IH_HuQYqSE9",
- "outputId": "c9c0952b-1a4c-4380-bb1b-16b01dd7291d"
+ "id": "2IH_HuQYqSE9"
},
- "outputs": [
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "Requirement already satisfied: shap in /usr/local/lib/python3.6/dist-packages (0.35.0)\n",
- "Requirement already satisfied: scipy in /usr/local/lib/python3.6/dist-packages (from shap) (1.4.1)\n",
- "Requirement already satisfied: numpy in /usr/local/lib/python3.6/dist-packages (from shap) (1.18.4)\n",
- "Requirement already satisfied: pandas in /usr/local/lib/python3.6/dist-packages (from shap) (1.0.3)\n",
- "Requirement already satisfied: tqdm>4.25.0 in /usr/local/lib/python3.6/dist-packages (from shap) (4.41.1)\n",
- "Requirement already satisfied: scikit-learn in /usr/local/lib/python3.6/dist-packages (from shap) (0.22.2.post1)\n",
- "Requirement already satisfied: pytz>=2017.2 in /usr/local/lib/python3.6/dist-packages (from pandas->shap) (2018.9)\n",
- "Requirement already satisfied: python-dateutil>=2.6.1 in /usr/local/lib/python3.6/dist-packages (from pandas->shap) (2.8.1)\n",
- "Requirement already satisfied: joblib>=0.11 in /usr/local/lib/python3.6/dist-packages (from scikit-learn->shap) (0.14.1)\n",
- "Requirement already satisfied: six>=1.5 in /usr/local/lib/python3.6/dist-packages (from python-dateutil>=2.6.1->pandas->shap) (1.12.0)\n"
- ]
- }
- ],
+ "outputs": [],
"source": [
"#installing shap\n",
- "!pip install shap"
+ "!pip install shap\n",
+ "!pip install tensorflow==1.14.0"
]
},
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "ohVsijBFqmSS"
},
"source": [
@@ -58,27 +34,14 @@
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 2,
"metadata": {
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 71
- },
- "colab_type": "code",
- "id": "TtQ_PdWZqiyE",
- "outputId": "27e840b8-804c-4627-e283-a158ad376d59"
+ "id": "TtQ_PdWZqiyE"
},
- "outputs": [
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "/usr/local/lib/python3.6/dist-packages/sklearn/utils/deprecation.py:144: FutureWarning: The sklearn.feature_extraction.stop_words module is deprecated in version 0.22 and will be removed in version 0.24. The corresponding classes / functions should instead be imported from sklearn.feature_extraction.text. Anything that cannot be imported from sklearn.feature_extraction.text is now part of the private API.\n",
- " warnings.warn(message, FutureWarning)\n"
- ]
- }
- ],
+ "outputs": [],
"source": [
+ "import warnings\n",
+ "warnings.filterwarnings('ignore')\n",
"import numpy as np\n",
"import pandas as pd #to work with csv files\n",
"\n",
@@ -102,21 +65,19 @@
"from sklearn.metrics import accuracy_score\n",
"from sklearn.model_selection import train_test_split\n",
"#import time function from time module to track the training duration\n",
- "from time import time\n",
- "\n"
+ "from time import time"
]
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 3,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 102
},
- "colab_type": "code",
"id": "3h3XkJDhq2-R",
- "outputId": "d0be0712-175e-469d-e313-62199cf9a088"
+ "outputId": "7fe6d5de-7766-41f8-e089-2e55af04c1ae"
},
"outputs": [
{
@@ -168,21 +129,18 @@
" doc = \"\".join([char for char in doc if char not in string.punctuation and not char.isdigit()])\n",
" doc = \" \".join([token for token in doc.split() if token not in stopwords])\n",
" #remove punctuation and numbers\n",
- " return doc\n",
- "\n"
+ " return doc"
]
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 4,
"metadata": {
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 68
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "fLZR3emyq3RO",
- "outputId": "ea870f92-55d9-4a53-f224-0d974595cd80"
+ "outputId": "0e8550ff-ec82-47d2-a515-f38b4a2e21b0"
},
"outputs": [
{
@@ -206,16 +164,13 @@
"#random_state=1 for reproducibility\n",
"X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=1)\n",
"print(X_train.shape, y_train.shape)\n",
- "print(X_test.shape, y_test.shape)\n",
- "\n"
+ "print(X_test.shape, y_test.shape)"
]
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 5,
"metadata": {
- "colab": {},
- "colab_type": "code",
"id": "lGOIy920q5xG"
},
"outputs": [],
@@ -224,20 +179,18 @@
"\n",
"vect = TfidfVectorizer(min_df=5)\n",
"X_train_dtm = vect.fit_transform(X_train)\n",
- "X_test_dtm = vect.transform(X_test)\n"
+ "X_test_dtm = vect.transform(X_test)"
]
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 6,
"metadata": {
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 34
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "cjs6qDTIq7tT",
- "outputId": "3b4551ab-ca45-45a5-f34b-40f97d3ec5af"
+ "outputId": "90d1c5c0-edef-4f2f-f48e-61f7cff4fada"
},
"outputs": [
{
@@ -258,15 +211,13 @@
"y_pred_class = model.predict(X_test_dtm)\n",
"\n",
"#calculate evaluation measures:\n",
- "print(\"Accuracy: \", accuracy_score(y_test, y_pred_class))\n"
+ "print(\"Accuracy: \", accuracy_score(y_test, y_pred_class))"
]
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 7,
"metadata": {
- "colab": {},
- "colab_type": "code",
"id": "AvnDPwzprKUi"
},
"outputs": [],
@@ -279,15 +230,13 @@
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 8,
"metadata": {
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 272
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "pHwr6uFdrcTv",
- "outputId": "14b1a7d8-0764-43ad-a7b1-f66f7e1d0c2a"
+ "outputId": "42f5a6b1-75e6-4dcf-e04c-23e21d0ccd7a"
},
"outputs": [
{
@@ -319,15 +268,14 @@
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 9,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 611
},
- "colab_type": "code",
"id": "dfQPVQ-xrjSN",
- "outputId": "b117d191-ed8f-4352-b506-9220cbd1a3e8"
+ "outputId": "e0def5ef-3bc3-444a-ac46-d65bc1681b3c"
},
"outputs": [
{
@@ -376,7 +324,7 @@
},
{
"data": {
- "image/png": "\n",
+ "image/png": "\n",
"text/plain": [
""
]
@@ -396,7 +344,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "WE0JzAqV1Icg"
},
"source": [
@@ -411,15 +358,14 @@
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 10,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 193
},
- "colab_type": "code",
"id": "f587yWgnrr8r",
- "outputId": "b294b926-7ffc-434c-d017-c7973002236a"
+ "outputId": "52cb0af4-d23b-4739-d1df-da91f4bb71dd"
},
"outputs": [
{
@@ -470,7 +416,7 @@
"data": {
"text/html": [
"\n",
- "
\n",
+ "
\n",
"
\n",
" Visualization omitted, Javascript library not loaded! \n",
" Have you run `initjs()` in this notebook? If this notebook was from another\n",
@@ -480,13 +426,13 @@
"
\n",
" "
],
"text/plain": [
- ""
+ ""
]
},
"execution_count": 10,
@@ -508,7 +454,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "SnKH7AYQ3R0_"
},
"source": [
@@ -522,7 +467,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "dxbf2VQar-nr"
},
"source": [
@@ -531,25 +475,11 @@
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 11,
"metadata": {
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 34
- },
- "colab_type": "code",
- "id": "cMdGM1_9ry6R",
- "outputId": "c89ba309-296c-4816-86cc-b4af89abaa89"
+ "id": "cMdGM1_9ry6R"
},
- "outputs": [
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "Using TensorFlow backend.\n"
- ]
- }
- ],
+ "outputs": [],
"source": [
"from sklearn.preprocessing import LabelEncoder\n",
"\n",
@@ -559,15 +489,16 @@
"import os\n",
"import sys\n",
"import numpy as np\n",
- "from keras.preprocessing.text import Tokenizer\n",
- "from keras.preprocessing.sequence import pad_sequences\n",
- "from keras.utils import to_categorical\n",
- "from keras.layers import Dense, Input, GlobalMaxPooling1D\n",
- "from keras.layers import Conv1D, MaxPooling1D, Embedding, LSTM\n",
- "from keras.models import Model, Sequential\n",
- "from keras.initializers import Constant\n",
- "import tensorflow as tf\n",
"from tensorflow import keras\n",
+ "from tensorflow.keras.preprocessing.text import Tokenizer\n",
+ "from tensorflow.keras.preprocessing.sequence import pad_sequences\n",
+ "from tensorflow.keras.utils import to_categorical\n",
+ "from tensorflow.keras.layers import Dense, Input, GlobalMaxPooling1D\n",
+ "from tensorflow.keras.layers import Conv1D, MaxPooling1D, Embedding, LSTM\n",
+ "from tensorflow.keras.models import Model, Sequential\n",
+ "from tensorflow.keras.initializers import Constant\n",
+ "import tensorflow as tf\n",
+ "\n",
"\n",
"\n",
"MAX_SEQUENCE_LENGTH = 1000\n",
@@ -576,108 +507,78 @@
"VALIDATION_SPLIT = 0.2\n",
"\n",
"vocab_size = 20000 # Max number of different word, i.e. model input dimension\n",
- "maxlen = 1000 # Max number of words kept at the end of each text\n"
+ "maxlen = 1000 # Max number of words kept at the end of each text"
]
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 12,
"metadata": {
- "colab": {
- "base_uri": "https://localhost:8080/",
- "height": 374
- },
- "colab_type": "code",
- "id": "1moJm0VJsM2r",
- "outputId": "d9c23ceb-cf5d-4fcb-e43d-10ebaaab5d2b"
- },
- "outputs": [
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "\u001b[33mWARNING: Skipping tensorflow as it is not installed.\u001b[0m\n",
- "Requirement already satisfied: tensorflow-gpu==1.14.0 in /usr/local/lib/python3.6/dist-packages (1.14.0)\n",
- "Requirement already satisfied: gast>=0.2.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (0.3.3)\n",
- "Requirement already satisfied: keras-applications>=1.0.6 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (1.0.8)\n",
- "Requirement already satisfied: termcolor>=1.1.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (1.1.0)\n",
- "Requirement already satisfied: wrapt>=1.11.1 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (1.12.1)\n",
- "Requirement already satisfied: wheel>=0.26 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (0.34.2)\n",
- "Requirement already satisfied: google-pasta>=0.1.6 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (0.2.0)\n",
- "Requirement already satisfied: astor>=0.6.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (0.8.1)\n",
- "Requirement already satisfied: keras-preprocessing>=1.0.5 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (1.1.0)\n",
- "Requirement already satisfied: grpcio>=1.8.6 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (1.28.1)\n",
- "Requirement already satisfied: tensorflow-estimator<1.15.0rc0,>=1.14.0rc0 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (1.14.0)\n",
- "Requirement already satisfied: absl-py>=0.7.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (0.9.0)\n",
- "Requirement already satisfied: six>=1.10.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (1.12.0)\n",
- "Requirement already satisfied: tensorboard<1.15.0,>=1.14.0 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (1.14.0)\n",
- "Requirement already satisfied: protobuf>=3.6.1 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (3.10.0)\n",
- "Requirement already satisfied: numpy<2.0,>=1.14.5 in /usr/local/lib/python3.6/dist-packages (from tensorflow-gpu==1.14.0) (1.18.4)\n",
- "Requirement already satisfied: h5py in /usr/local/lib/python3.6/dist-packages (from keras-applications>=1.0.6->tensorflow-gpu==1.14.0) (2.10.0)\n",
- "Requirement already satisfied: markdown>=2.6.8 in /usr/local/lib/python3.6/dist-packages (from tensorboard<1.15.0,>=1.14.0->tensorflow-gpu==1.14.0) (3.2.1)\n",
- "Requirement already satisfied: setuptools>=41.0.0 in /usr/local/lib/python3.6/dist-packages (from tensorboard<1.15.0,>=1.14.0->tensorflow-gpu==1.14.0) (46.1.3)\n",
- "Requirement already satisfied: werkzeug>=0.11.15 in /usr/local/lib/python3.6/dist-packages (from tensorboard<1.15.0,>=1.14.0->tensorflow-gpu==1.14.0) (1.0.1)\n"
- ]
- }
- ],
- "source": [
- "%tensorflow_version 2.x\n",
- "!pip uninstall -y tensorflow\n",
- "!pip install tensorflow-gpu==1.14.0"
- ]
- },
- {
- "cell_type": "code",
- "execution_count": 0,
- "metadata": {
- "colab": {},
- "colab_type": "code",
"id": "G8UECSj1sSlt"
},
"outputs": [],
"source": [
- "\n",
- "\n",
"def load_directory_data(directory):\n",
- " data = {}\n",
- " data[\"sentence\"] = []\n",
- " data[\"sentiment\"] = []\n",
- " for file_path in os.listdir(directory):\n",
- " with tf.gfile.GFile(os.path.join(directory, file_path), \"r\") as f:\n",
- " data[\"sentence\"].append(f.read())\n",
- " data[\"sentiment\"].append(re.match(\"\\d+_(\\d+)\\.txt\", file_path).group(1))\n",
- " return pd.DataFrame.from_dict(data)\n",
+ " data = {}\n",
+ " data[\"sentence\"] = []\n",
+ " data[\"sentiment\"] = []\n",
+ " for file_path in os.listdir(directory):\n",
+ " with tf.io.gfile.GFile(os.path.join(directory, file_path), \"r\") as f:\n",
+ " data[\"sentence\"].append(f.read())\n",
+ " data[\"sentiment\"].append(re.match(\"\\d+_(\\d+)\\.txt\", file_path).group(1))\n",
+ " return pd.DataFrame.from_dict(data)\n",
"\n",
"# Merge positive and negative examples, add a polarity column and shuffle.\n",
"def load_dataset(directory):\n",
- " pos_df = load_directory_data(os.path.join(directory, \"pos\"))\n",
- " neg_df = load_directory_data(os.path.join(directory, \"neg\"))\n",
- " pos_df[\"polarity\"] = 1\n",
- " neg_df[\"polarity\"] = 0\n",
- " return pd.concat([pos_df, neg_df]).sample(frac=1).reset_index(drop=True)\n",
+ " pos_df = load_directory_data(os.path.join(directory, \"pos\"))\n",
+ " neg_df = load_directory_data(os.path.join(directory, \"neg\"))\n",
+ " pos_df[\"polarity\"] = 1\n",
+ " neg_df[\"polarity\"] = 0\n",
+ " return pd.concat([pos_df, neg_df]).sample(frac=1).reset_index(drop=True)\n",
"\n",
"def download_and_load_datasets(force_download=False):\n",
- " dataset = tf.keras.utils.get_file(\n",
+ " dataset = tf.keras.utils.get_file(\n",
" fname=\"aclImdb.tar.gz\", \n",
" origin=\"http://ai.stanford.edu/~amaas/data/sentiment/aclImdb_v1.tar.gz\", \n",
" extract=True)\n",
- " \n",
- " train_df = load_dataset(os.path.join(os.path.dirname(dataset), \n",
+ "\n",
+ " train_df = load_dataset(os.path.join(os.path.dirname(dataset), \n",
" \"aclImdb\", \"train\"))\n",
- " test_df = load_dataset(os.path.join(os.path.dirname(dataset), \n",
+ " test_df = load_dataset(os.path.join(os.path.dirname(dataset), \n",
" \"aclImdb\", \"test\"))\n",
- " \n",
- " return train_df, test_df\n",
"\n",
- "train,test = download_and_load_datasets()"
+ " return train_df, test_df"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 13,
+ "metadata": {
+ "id": "yVlCL4IWgrUV"
+ },
+ "outputs": [],
+ "source": [
+ "try:\n",
+ " from google.colab import files\n",
+ " \n",
+ " if not os.path.exists('aclImdb'):\n",
+ " train,test = download_and_load_datasets()\n",
+ " else:\n",
+ " train = load_dataset('aclImdb/train')\n",
+ " test = load_dataset('aclImdb/test')\n",
+ " \n",
+ "except ModuleNotFoundError:\n",
+ " if not os.path.exists('Data/aclImdb'):\n",
+ " train,test = download_and_load_datasets()\n",
+ " else:\n",
+ " train = load_dataset('Data/aclImdb/train')\n",
+ " test = load_dataset('Data/aclImdb/test')"
]
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 14,
"metadata": {
- "colab": {},
- "colab_type": "code",
"id": "fRM5iANksS52"
},
"outputs": [],
@@ -692,15 +593,13 @@
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 15,
"metadata": {
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 51
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "OCdVEEWDtY9q",
- "outputId": "cd121009-3557-4b13-a252-97b868a32ee3"
+ "outputId": "6fc10e64-7703-46f2-847b-2a379e240bb0"
},
"outputs": [
{
@@ -743,21 +642,18 @@
"y_val = trainvalid_labels[-num_validation_samples:]\n",
"\n",
"#This is the data we will use for CNN and RNN training\n",
- "print('Splitting the train data into train and valid is done')\n",
- "\n"
+ "print('Splitting the train data into train and valid is done')"
]
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 16,
"metadata": {
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 275
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "3kbwNXYQtZLO",
- "outputId": "bb19bcca-836d-422f-e903-5e3981b5df53"
+ "outputId": "baaf3374-fdf1-4c36-ff6d-d4f6a5a351bb"
},
"outputs": [
{
@@ -765,19 +661,23 @@
"output_type": "stream",
"text": [
"Defining and training an LSTM model, training embedding layer on the fly\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/tensorflow/python/ops/nn_impl.py:180: add_dispatch_support..wrapper (from tensorflow.python.ops.array_ops) is deprecated and will be removed in a future version.\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/tensorflow/python/keras/initializers.py:119: calling RandomUniform.__init__ (from tensorflow.python.ops.init_ops) with dtype is deprecated and will be removed in a future version.\n",
+ "Instructions for updating:\n",
+ "Call initializer instance with the dtype argument instead of passing it to the constructor\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/tensorflow/python/ops/init_ops.py:1251: calling VarianceScaling.__init__ (from tensorflow.python.ops.init_ops) with dtype is deprecated and will be removed in a future version.\n",
+ "Instructions for updating:\n",
+ "Call initializer instance with the dtype argument instead of passing it to the constructor\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/tensorflow/python/ops/nn_impl.py:180: add_dispatch_support..wrapper (from tensorflow.python.ops.array_ops) is deprecated and will be removed in a future version.\n",
"Instructions for updating:\n",
"Use tf.where in 2.0, which has the same broadcast rule as np.where\n",
"Training the RNN\n",
- "WARNING:tensorflow:From /usr/local/lib/python3.6/dist-packages/keras/backend/tensorflow_backend.py:422: The name tf.global_variables is deprecated. Please use tf.compat.v1.global_variables instead.\n",
- "\n",
"Train on 20000 samples, validate on 5000 samples\n",
"Epoch 1/2\n",
- "20000/20000 [==============================] - 580s 29ms/step - loss: 0.5170 - accuracy: 0.7466 - val_loss: 0.6257 - val_accuracy: 0.6769\n",
+ "20000/20000 [==============================] - 1497s 75ms/sample - loss: 0.4971 - acc: 0.7658 - val_loss: 0.5015 - val_acc: 0.8095\n",
"Epoch 2/2\n",
- "20000/20000 [==============================] - 571s 29ms/step - loss: 0.3721 - accuracy: 0.8408 - val_loss: 0.4292 - val_accuracy: 0.8138\n",
- "25000/25000 [==============================] - 134s 5ms/step\n",
- "Test accuracy with RNN: 0.8116400241851807\n"
+ "20000/20000 [==============================] - 1482s 74ms/sample - loss: 0.3532 - acc: 0.8561 - val_loss: 0.4566 - val_acc: 0.7831\n",
+ "25000/25000 [==============================] - 193s 8ms/sample - loss: 0.4721 - acc: 0.7787\n",
+ "Test accuracy with RNN: 0.77874\n"
]
}
],
@@ -803,20 +703,19 @@
" validation_data=(x_val, y_val))\n",
"score, acc = rnnmodel.evaluate(test_data, test_labels,\n",
" batch_size=32)\n",
- "print('Test accuracy with RNN:', acc)\n"
+ "print('Test accuracy with RNN:', acc)"
]
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 18,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
- "height": 77
+ "height": 131
},
- "colab_type": "code",
"id": "aJWmc_qguQbj",
- "outputId": "fd809bae-d9c0-4950-8c9f-0f1f1fb0f0f8"
+ "outputId": "84ba7325-6ec6-4d15-c26e-206a49a0d798"
},
"outputs": [
{
@@ -867,15 +766,18 @@
"name": "stdout",
"output_type": "stream",
"text": [
- "Downloading data from https://s3.amazonaws.com/text-datasets/imdb_word_index.json\n",
+ "WARNING:tensorflow:From /usr/local/lib/python3.7/dist-packages/shap/explainers/tf_utils.py:28: The name tf.keras.backend.get_session is deprecated. Please use tf.compat.v1.keras.backend.get_session instead.\n",
+ "\n",
+ "Downloading data from https://storage.googleapis.com/tensorflow/tf-keras-datasets/imdb_word_index.json\n",
"1646592/1641221 [==============================] - 0s 0us/step\n"
]
}
],
"source": [
- "from keras.datasets import imdb\n",
+ "from tensorflow.keras.datasets import imdb\n",
"import shap\n",
"shap.initjs()\n",
+ "\n",
"# we use the first 100 training examples as our background dataset to integrate over\n",
"explainer = shap.DeepExplainer(rnnmodel, x_train[:20])\n",
"\n",
@@ -888,20 +790,19 @@
"num2word = {}\n",
"for w in words.keys():\n",
" num2word[words[w]] = w\n",
- "x_val_words = np.stack([np.array(list(map(lambda x: num2word.get(x, \"NONE\"), x_val[i]))) for i in range(10)])\n"
+ "x_val_words = np.stack([np.array(list(map(lambda x: num2word.get(x, \"NONE\"), x_val[i]))) for i in range(10)])"
]
},
{
"cell_type": "code",
- "execution_count": 0,
+ "execution_count": 19,
"metadata": {
"colab": {
"base_uri": "https://localhost:8080/",
"height": 193
},
- "colab_type": "code",
"id": "VLup1ak_unKe",
- "outputId": "80995a62-04b5-4730-c4ed-9dfda5e64f3b"
+ "outputId": "068f4ef5-9655-4e72-b8d2-7aa876036954"
},
"outputs": [
{
@@ -952,7 +853,7 @@
"data": {
"text/html": [
"\n",
- "
\n",
+ "
\n",
"
\n",
" Visualization omitted, Javascript library not loaded! \n",
" Have you run `initjs()` in this notebook? If this notebook was from another\n",
@@ -962,16 +863,16 @@
"