From 7b9b4235f471c9180f0029629022ddf228c49735 Mon Sep 17 00:00:00 2001
From: Kumar Apurva <66004696+KUMAR-APURVA@users.noreply.github.com>
Date: Sun, 27 Jun 2021 12:25:46 +0530
Subject: [PATCH 1/2] [Ch2Nb06] Added dependencies and fixed some errors
1. Added pip install wget command.
2. Added pip install textblob command.
3. Fixed some errors.
---
Ch2/06_Snorkel.ipynb | 863 ++++++++++++++++++++-----------------------
1 file changed, 392 insertions(+), 471 deletions(-)
diff --git a/Ch2/06_Snorkel.ipynb b/Ch2/06_Snorkel.ipynb
index 2c6da6a..7e8645a 100644
--- a/Ch2/06_Snorkel.ipynb
+++ b/Ch2/06_Snorkel.ipynb
@@ -3,7 +3,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "kBRUuq_poB7u"
},
"source": [
@@ -23,138 +22,178 @@
"start_time": "2021-04-03T11:07:43.179631Z"
},
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 940
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "1TqgrfwYNlbQ",
- "outputId": "b0584485-e593-4768-f0aa-a6c84fe74244",
- "scrolled": true
+ "outputId": "6dec4d9a-a86a-4be6-cbb2-5038f174ff25",
+ "scrolled": false
},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
- "Requirement already satisfied: snorkel==0.9.6 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (0.9.6)\n",
- "Requirement already satisfied: munkres>=1.0.6 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from snorkel==0.9.6) (1.1.4)\n",
- "Requirement already satisfied: scipy<2.0.0,>=1.2.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from snorkel==0.9.6) (1.5.4)\n",
- "Requirement already satisfied: tensorboard<2.0.0,>=1.14.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from snorkel==0.9.6) (1.15.0)\n",
- "Requirement already satisfied: tqdm<5.0.0,>=4.33.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from snorkel==0.9.6) (4.59.0)\n",
- "Requirement already satisfied: torch<2.0.0,>=1.2.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from snorkel==0.9.6) (1.8.1)\n",
- "Requirement already satisfied: pandas<2.0.0,>=0.25.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from snorkel==0.9.6) (1.1.5)\n",
- "Requirement already satisfied: scikit-learn<0.22.0,>=0.20.2 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from snorkel==0.9.6) (0.21.3)\n",
- "Requirement already satisfied: networkx<2.4,>=2.2 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from snorkel==0.9.6) (2.3)\n",
- "Requirement already satisfied: numpy<2.0.0,>=1.16.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from snorkel==0.9.6) (1.19.5)\n",
- "Requirement already satisfied: decorator>=4.3.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from networkx<2.4,>=2.2->snorkel==0.9.6) (4.4.2)\n",
- "Requirement already satisfied: python-dateutil>=2.7.3 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from pandas<2.0.0,>=0.25.0->snorkel==0.9.6) (2.8.1)\n",
- "Requirement already satisfied: pytz>=2017.2 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from pandas<2.0.0,>=0.25.0->snorkel==0.9.6) (2021.1)\n",
- "Requirement already satisfied: six>=1.5 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from python-dateutil>=2.7.3->pandas<2.0.0,>=0.25.0->snorkel==0.9.6) (1.15.0)\n",
- "Requirement already satisfied: joblib>=0.11 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from scikit-learn<0.22.0,>=0.20.2->snorkel==0.9.6) (1.0.1)\n",
- "Requirement already satisfied: werkzeug>=0.11.15 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (1.0.1)\n",
- "Requirement already satisfied: setuptools>=41.0.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (54.1.2)\n",
- "Requirement already satisfied: grpcio>=1.6.3 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (1.36.1)\n",
- "Requirement already satisfied: markdown>=2.6.8 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (3.3.4)\n",
- "Requirement already satisfied: wheel>=0.26 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (0.36.2)\n",
- "Requirement already satisfied: protobuf>=3.6.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (3.15.6)\n",
- "Requirement already satisfied: absl-py>=0.4 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (0.12.0)\n",
- "Requirement already satisfied: importlib-metadata in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from markdown>=2.6.8->tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (3.10.0)\n",
- "Requirement already satisfied: typing-extensions in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from torch<2.0.0,>=1.2.0->snorkel==0.9.6) (3.7.4.3)\n",
- "Requirement already satisfied: dataclasses in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from torch<2.0.0,>=1.2.0->snorkel==0.9.6) (0.8)\n",
- "Requirement already satisfied: zipp>=0.5 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from importlib-metadata->markdown>=2.6.8->tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (3.4.1)\n",
- "Requirement already satisfied: treedlib==0.1.3 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (0.1.3)\n",
- "Requirement already satisfied: lxml in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from treedlib==0.1.3) (4.6.3)\n",
- "Requirement already satisfied: numbskull==0.1.1 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (0.1.1)\n",
- "Requirement already satisfied: future in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from numbskull==0.1.1) (0.18.2)\n",
- "Requirement already satisfied: tensorflow==1.15 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (1.15.0)\n",
- "Requirement already satisfied: wrapt>=1.11.1 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (1.12.1)\n",
- "Requirement already satisfied: termcolor>=1.1.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (1.1.0)\n",
- "Requirement already satisfied: astor>=0.6.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (0.8.1)\n",
- "Requirement already satisfied: keras-applications>=1.0.8 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (1.0.8)\n",
- "Requirement already satisfied: absl-py>=0.7.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (0.12.0)\n",
- "Requirement already satisfied: six>=1.10.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (1.15.0)\n",
- "Requirement already satisfied: tensorboard<1.16.0,>=1.15.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (1.15.0)\n",
- "Requirement already satisfied: tensorflow-estimator==1.15.1 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (1.15.1)\n",
- "Requirement already satisfied: protobuf>=3.6.1 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (3.15.6)\n",
- "Requirement already satisfied: grpcio>=1.8.6 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (1.36.1)\n",
- "Requirement already satisfied: wheel>=0.26 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (0.36.2)\n",
- "Requirement already satisfied: gast==0.2.2 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (0.2.2)\n",
- "Requirement already satisfied: keras-preprocessing>=1.0.5 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (1.1.2)\n",
- "Requirement already satisfied: numpy<2.0,>=1.16.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (1.19.5)\n",
- "Requirement already satisfied: opt-einsum>=2.3.2 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (3.3.0)\n",
- "Requirement already satisfied: google-pasta>=0.1.6 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorflow==1.15) (0.2.0)\n",
- "Requirement already satisfied: h5py in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from keras-applications>=1.0.8->tensorflow==1.15) (3.1.0)\n",
- "Requirement already satisfied: werkzeug>=0.11.15 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard<1.16.0,>=1.15.0->tensorflow==1.15) (1.0.1)\n",
- "Requirement already satisfied: markdown>=2.6.8 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard<1.16.0,>=1.15.0->tensorflow==1.15) (3.3.4)\n",
- "Requirement already satisfied: setuptools>=41.0.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard<1.16.0,>=1.15.0->tensorflow==1.15) (54.1.2)\n",
- "Requirement already satisfied: importlib-metadata in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from markdown>=2.6.8->tensorboard<1.16.0,>=1.15.0->tensorflow==1.15) (3.10.0)\n",
- "Requirement already satisfied: cached-property in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from h5py->keras-applications>=1.0.8->tensorflow==1.15) (1.5.2)\n",
- "Requirement already satisfied: typing-extensions>=3.6.4 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from importlib-metadata->markdown>=2.6.8->tensorboard<1.16.0,>=1.15.0->tensorflow==1.15) (3.7.4.3)\n",
- "Requirement already satisfied: zipp>=0.5 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from importlib-metadata->markdown>=2.6.8->tensorboard<1.16.0,>=1.15.0->tensorflow==1.15) (3.4.1)\n",
- "Requirement already satisfied: tensorboard==1.15 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (1.15.0)\n",
- "Requirement already satisfied: absl-py>=0.4 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard==1.15) (0.12.0)\n",
- "Requirement already satisfied: protobuf>=3.6.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard==1.15) (3.15.6)\n",
- "Requirement already satisfied: setuptools>=41.0.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard==1.15) (54.1.2)\n",
- "Requirement already satisfied: six>=1.10.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard==1.15) (1.15.0)\n",
- "Requirement already satisfied: werkzeug>=0.11.15 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard==1.15) (1.0.1)\n",
- "Requirement already satisfied: markdown>=2.6.8 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard==1.15) (3.3.4)\n",
- "Requirement already satisfied: grpcio>=1.6.3 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard==1.15) (1.36.1)\n",
- "Requirement already satisfied: wheel>=0.26 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard==1.15) (0.36.2)\n",
- "Requirement already satisfied: numpy>=1.12.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from tensorboard==1.15) (1.19.5)\n",
- "Requirement already satisfied: importlib-metadata in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from markdown>=2.6.8->tensorboard==1.15) (3.10.0)\n",
- "Requirement already satisfied: zipp>=0.5 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from importlib-metadata->markdown>=2.6.8->tensorboard==1.15) (3.4.1)\n",
- "Requirement already satisfied: typing-extensions>=3.6.4 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from importlib-metadata->markdown>=2.6.8->tensorboard==1.15) (3.7.4.3)\n"
- ]
- },
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "Collecting en-core-web-sm==3.0.0\n",
- " Downloading https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-3.0.0/en_core_web_sm-3.0.0-py3-none-any.whl (13.7 MB)\n",
- "Requirement already satisfied: spacy<3.1.0,>=3.0.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from en-core-web-sm==3.0.0) (3.0.5)\n",
- "Requirement already satisfied: setuptools in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (54.1.2)\n",
- "Requirement already satisfied: numpy>=1.15.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (1.19.5)\n",
- "Requirement already satisfied: requests<3.0.0,>=2.13.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (2.25.1)\n",
- "Requirement already satisfied: importlib-metadata>=0.20 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (3.10.0)\n",
- "Requirement already satisfied: typer<0.4.0,>=0.3.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (0.3.2)\n",
- "Requirement already satisfied: srsly<3.0.0,>=2.4.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (2.4.0)\n",
- "Requirement already satisfied: blis<0.8.0,>=0.4.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (0.7.4)\n",
- "Requirement already satisfied: tqdm<5.0.0,>=4.38.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (4.59.0)\n",
- "Requirement already satisfied: pydantic<1.8.0,>=1.7.1 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (1.7.3)\n",
- "Requirement already satisfied: murmurhash<1.1.0,>=0.28.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (1.0.5)\n",
- "Requirement already satisfied: wasabi<1.1.0,>=0.8.1 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (0.8.2)\n",
- "Requirement already satisfied: typing-extensions<4.0.0.0,>=3.7.4 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (3.7.4.3)\n",
- "Requirement already satisfied: packaging>=20.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (20.9)\n",
- "Requirement already satisfied: cymem<2.1.0,>=2.0.2 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (2.0.5)\n",
- "Requirement already satisfied: pathy>=0.3.5 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (0.4.0)\n",
- "Requirement already satisfied: spacy-legacy<3.1.0,>=3.0.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (3.0.1)\n",
- "Requirement already satisfied: jinja2 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (2.11.3)\n",
- "Requirement already satisfied: preshed<3.1.0,>=3.0.2 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (3.0.5)\n",
- "Requirement already satisfied: thinc<8.1.0,>=8.0.2 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (8.0.2)\n",
- "Requirement already satisfied: catalogue<2.1.0,>=2.0.1 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (2.0.1)\n",
- "Requirement already satisfied: zipp>=0.5 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from importlib-metadata>=0.20->spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (3.4.1)\n",
- "Requirement already satisfied: pyparsing>=2.0.2 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from packaging>=20.0->spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (2.4.7)\n",
- "Requirement already satisfied: smart-open<4.0.0,>=2.2.0 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from pathy>=0.3.5->spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (3.0.0)\n",
- "Requirement already satisfied: dataclasses<1.0,>=0.6 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from pathy>=0.3.5->spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (0.8)\n",
- "Requirement already satisfied: idna<3,>=2.5 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from requests<3.0.0,>=2.13.0->spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (2.10)\n",
- "Requirement already satisfied: urllib3<1.27,>=1.21.1 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from requests<3.0.0,>=2.13.0->spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (1.26.4)\n",
- "Requirement already satisfied: chardet<5,>=3.0.2 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from requests<3.0.0,>=2.13.0->spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (4.0.0)\n",
- "Requirement already satisfied: certifi>=2017.4.17 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from requests<3.0.0,>=2.13.0->spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (2020.12.5)\n",
- "Requirement already satisfied: contextvars<3,>=2.4 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from thinc<8.1.0,>=8.0.2->spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (2.4)\n",
- "Requirement already satisfied: immutables>=0.9 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from contextvars<3,>=2.4->thinc<8.1.0,>=8.0.2->spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (0.15)\n",
- "Requirement already satisfied: click<7.2.0,>=7.1.1 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from typer<0.4.0,>=0.3.0->spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (7.1.2)\n",
- "Requirement already satisfied: MarkupSafe>=0.23 in c:\\users\\karti\\envs\\pnlp\\lib\\site-packages (from jinja2->spacy<3.1.0,>=3.0.0->en-core-web-sm==3.0.0) (1.1.1)\n",
- "[+] Download and installation successful\n",
- "You can now load the package via spacy.load('en_core_web_sm')\n"
- ]
- },
- {
- "name": "stderr",
- "output_type": "stream",
- "text": [
- "2021-04-03 16:37:49.144386: W tensorflow/stream_executor/platform/default/dso_loader.cc:55] Could not load dynamic library 'cudart64_100.dll'; dlerror: cudart64_100.dll not found\n",
- "2021-04-03 16:37:49.144410: I tensorflow/stream_executor/cuda/cudart_stub.cc:29] Ignore above cudart dlerror if you do not have a GPU set up on your machine.\n"
+ "Collecting snorkel==0.9.6\n",
+ "\u001b[?25l Downloading https://files.pythonhosted.org/packages/4e/6a/e33babd8b4fb34867b695b5ab6b02c9106ec9de05ed4a02b2b9417eb3ae7/snorkel-0.9.6-py3-none-any.whl (144kB)\n",
+ "\u001b[K |████████████████████████████████| 153kB 30.6MB/s \n",
+ "\u001b[?25hRequirement already satisfied: tqdm<5.0.0,>=4.33.0 in /usr/local/lib/python3.7/dist-packages (from snorkel==0.9.6) (4.41.1)\n",
+ "Requirement already satisfied: scipy<2.0.0,>=1.2.0 in /usr/local/lib/python3.7/dist-packages (from snorkel==0.9.6) (1.4.1)\n",
+ "Collecting tensorboard<2.0.0,>=1.14.0\n",
+ "\u001b[?25l Downloading https://files.pythonhosted.org/packages/1e/e9/d3d747a97f7188f48aa5eda486907f3b345cd409f0a0850468ba867db246/tensorboard-1.15.0-py3-none-any.whl (3.8MB)\n",
+ "\u001b[K |████████████████████████████████| 3.8MB 29.7MB/s \n",
+ "\u001b[?25hCollecting munkres>=1.0.6\n",
+ " Downloading https://files.pythonhosted.org/packages/90/ab/0301c945a704218bc9435f0e3c88884f6b19ef234d8899fb47ce1ccfd0c9/munkres-1.1.4-py2.py3-none-any.whl\n",
+ "Collecting networkx<2.4,>=2.2\n",
+ "\u001b[?25l Downloading https://files.pythonhosted.org/packages/85/08/f20aef11d4c343b557e5de6b9548761811eb16e438cee3d32b1c66c8566b/networkx-2.3.zip (1.7MB)\n",
+ "\u001b[K |████████████████████████████████| 1.8MB 33.9MB/s \n",
+ "\u001b[?25hCollecting scikit-learn<0.22.0,>=0.20.2\n",
+ "\u001b[?25l Downloading https://files.pythonhosted.org/packages/9f/c5/e5267eb84994e9a92a2c6a6ee768514f255d036f3c8378acfa694e9f2c99/scikit_learn-0.21.3-cp37-cp37m-manylinux1_x86_64.whl (6.7MB)\n",
+ "\u001b[K |████████████████████████████████| 6.7MB 25.6MB/s \n",
+ "\u001b[?25hRequirement already satisfied: torch<2.0.0,>=1.2.0 in /usr/local/lib/python3.7/dist-packages (from snorkel==0.9.6) (1.9.0+cu102)\n",
+ "Requirement already satisfied: pandas<2.0.0,>=0.25.0 in /usr/local/lib/python3.7/dist-packages (from snorkel==0.9.6) (1.1.5)\n",
+ "Requirement already satisfied: numpy<2.0.0,>=1.16.0 in /usr/local/lib/python3.7/dist-packages (from snorkel==0.9.6) (1.19.5)\n",
+ "Requirement already satisfied: markdown>=2.6.8 in /usr/local/lib/python3.7/dist-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (3.3.4)\n",
+ "Requirement already satisfied: absl-py>=0.4 in /usr/local/lib/python3.7/dist-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (0.12.0)\n",
+ "Requirement already satisfied: wheel>=0.26; python_version >= \"3\" in /usr/local/lib/python3.7/dist-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (0.36.2)\n",
+ "Requirement already satisfied: six>=1.10.0 in /usr/local/lib/python3.7/dist-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (1.15.0)\n",
+ "Requirement already satisfied: setuptools>=41.0.0 in /usr/local/lib/python3.7/dist-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (57.0.0)\n",
+ "Requirement already satisfied: grpcio>=1.6.3 in /usr/local/lib/python3.7/dist-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (1.34.1)\n",
+ "Requirement already satisfied: werkzeug>=0.11.15 in /usr/local/lib/python3.7/dist-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (1.0.1)\n",
+ "Requirement already satisfied: protobuf>=3.6.0 in /usr/local/lib/python3.7/dist-packages (from tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (3.12.4)\n",
+ "Requirement already satisfied: decorator>=4.3.0 in /usr/local/lib/python3.7/dist-packages (from networkx<2.4,>=2.2->snorkel==0.9.6) (4.4.2)\n",
+ "Requirement already satisfied: joblib>=0.11 in /usr/local/lib/python3.7/dist-packages (from scikit-learn<0.22.0,>=0.20.2->snorkel==0.9.6) (1.0.1)\n",
+ "Requirement already satisfied: typing-extensions in /usr/local/lib/python3.7/dist-packages (from torch<2.0.0,>=1.2.0->snorkel==0.9.6) (3.7.4.3)\n",
+ "Requirement already satisfied: python-dateutil>=2.7.3 in /usr/local/lib/python3.7/dist-packages (from pandas<2.0.0,>=0.25.0->snorkel==0.9.6) (2.8.1)\n",
+ "Requirement already satisfied: pytz>=2017.2 in /usr/local/lib/python3.7/dist-packages (from pandas<2.0.0,>=0.25.0->snorkel==0.9.6) (2018.9)\n",
+ "Requirement already satisfied: importlib-metadata; python_version < \"3.8\" in /usr/local/lib/python3.7/dist-packages (from markdown>=2.6.8->tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (4.5.0)\n",
+ "Requirement already satisfied: zipp>=0.5 in /usr/local/lib/python3.7/dist-packages (from importlib-metadata; python_version < \"3.8\"->markdown>=2.6.8->tensorboard<2.0.0,>=1.14.0->snorkel==0.9.6) (3.4.1)\n",
+ "Building wheels for collected packages: networkx\n",
+ " Building wheel for networkx (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
+ " Created wheel for networkx: filename=networkx-2.3-py2.py3-none-any.whl size=1556427 sha256=fe9bd053c6e9c3cf9d5a0e106e6d244b52e73825d565d18c2eb34ee2663b4f55\n",
+ " Stored in directory: /root/.cache/pip/wheels/de/63/64/3699be2a9d0ccdb37c7f16329acf3863fd76eda58c39c737af\n",
+ "Successfully built networkx\n",
+ "\u001b[31mERROR: tensorflow 2.5.0 has requirement tensorboard~=2.5, but you'll have tensorboard 1.15.0 which is incompatible.\u001b[0m\n",
+ "\u001b[31mERROR: albumentations 0.1.12 has requirement imgaug<0.2.7,>=0.2.5, but you'll have imgaug 0.2.9 which is incompatible.\u001b[0m\n",
+ "Installing collected packages: tensorboard, munkres, networkx, scikit-learn, snorkel\n",
+ " Found existing installation: tensorboard 2.5.0\n",
+ " Uninstalling tensorboard-2.5.0:\n",
+ " Successfully uninstalled tensorboard-2.5.0\n",
+ " Found existing installation: networkx 2.5.1\n",
+ " Uninstalling networkx-2.5.1:\n",
+ " Successfully uninstalled networkx-2.5.1\n",
+ " Found existing installation: scikit-learn 0.22.2.post1\n",
+ " Uninstalling scikit-learn-0.22.2.post1:\n",
+ " Successfully uninstalled scikit-learn-0.22.2.post1\n",
+ "Successfully installed munkres-1.1.4 networkx-2.3 scikit-learn-0.21.3 snorkel-0.9.6 tensorboard-1.15.0\n",
+ "Collecting treedlib==0.1.3\n",
+ " Downloading https://files.pythonhosted.org/packages/2c/44/d0880af1f8f14e4b6c71da161648cac8ff8231965383f11b65540f751fa7/treedlib-0.1.3-py3-none-any.whl\n",
+ "Requirement already satisfied: lxml in /usr/local/lib/python3.7/dist-packages (from treedlib==0.1.3) (4.2.6)\n",
+ "Installing collected packages: treedlib\n",
+ "Successfully installed treedlib-0.1.3\n",
+ "Collecting numbskull==0.1.1\n",
+ " Downloading https://files.pythonhosted.org/packages/c8/56/03f98485dec32d15522a59d35d87107a46375288a7a4ee1fffde7ff8fff2/numbskull-0.1.1-py3-none-any.whl\n",
+ "Requirement already satisfied: future in /usr/local/lib/python3.7/dist-packages (from numbskull==0.1.1) (0.16.0)\n",
+ "Installing collected packages: numbskull\n",
+ "Successfully installed numbskull-0.1.1\n",
+ "Collecting tensorflow==1.15\n",
+ "\u001b[?25l Downloading https://files.pythonhosted.org/packages/92/2b/e3af15221da9ff323521565fa3324b0d7c7c5b1d7a8ca66984c8d59cb0ce/tensorflow-1.15.0-cp37-cp37m-manylinux2010_x86_64.whl (412.3MB)\n",
+ "\u001b[K |████████████████████████████████| 412.3MB 29kB/s \n",
+ "\u001b[?25hRequirement already satisfied: tensorboard<1.16.0,>=1.15.0 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15) (1.15.0)\n",
+ "Requirement already satisfied: google-pasta>=0.1.6 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15) (0.2.0)\n",
+ "Requirement already satisfied: astor>=0.6.0 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15) (0.8.1)\n",
+ "Requirement already satisfied: absl-py>=0.7.0 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15) (0.12.0)\n",
+ "Requirement already satisfied: keras-preprocessing>=1.0.5 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15) (1.1.2)\n",
+ "Requirement already satisfied: opt-einsum>=2.3.2 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15) (3.3.0)\n",
+ "Collecting tensorflow-estimator==1.15.1\n",
+ "\u001b[?25l Downloading https://files.pythonhosted.org/packages/de/62/2ee9cd74c9fa2fa450877847ba560b260f5d0fb70ee0595203082dafcc9d/tensorflow_estimator-1.15.1-py2.py3-none-any.whl (503kB)\n",
+ "\u001b[K |████████████████████████████████| 512kB 42.4MB/s \n",
+ "\u001b[?25hRequirement already satisfied: termcolor>=1.1.0 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15) (1.1.0)\n",
+ "Collecting keras-applications>=1.0.8\n",
+ "\u001b[?25l Downloading https://files.pythonhosted.org/packages/71/e3/19762fdfc62877ae9102edf6342d71b28fbfd9dea3d2f96a882ce099b03f/Keras_Applications-1.0.8-py3-none-any.whl (50kB)\n",
+ "\u001b[K |████████████████████████████████| 51kB 7.0MB/s \n",
+ "\u001b[?25hRequirement already satisfied: numpy<2.0,>=1.16.0 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15) (1.19.5)\n",
+ "Requirement already satisfied: six>=1.10.0 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15) (1.15.0)\n",
+ "Requirement already satisfied: wrapt>=1.11.1 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15) (1.12.1)\n",
+ "Collecting gast==0.2.2\n",
+ " Downloading https://files.pythonhosted.org/packages/4e/35/11749bf99b2d4e3cceb4d55ca22590b0d7c2c62b9de38ac4a4a7f4687421/gast-0.2.2.tar.gz\n",
+ "Requirement already satisfied: protobuf>=3.6.1 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15) (3.12.4)\n",
+ "Requirement already satisfied: grpcio>=1.8.6 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15) (1.34.1)\n",
+ "Requirement already satisfied: wheel>=0.26 in /usr/local/lib/python3.7/dist-packages (from tensorflow==1.15) (0.36.2)\n",
+ "Requirement already satisfied: setuptools>=41.0.0 in /usr/local/lib/python3.7/dist-packages (from tensorboard<1.16.0,>=1.15.0->tensorflow==1.15) (57.0.0)\n",
+ "Requirement already satisfied: markdown>=2.6.8 in /usr/local/lib/python3.7/dist-packages (from tensorboard<1.16.0,>=1.15.0->tensorflow==1.15) (3.3.4)\n",
+ "Requirement already satisfied: werkzeug>=0.11.15 in /usr/local/lib/python3.7/dist-packages (from tensorboard<1.16.0,>=1.15.0->tensorflow==1.15) (1.0.1)\n",
+ "Requirement already satisfied: h5py in /usr/local/lib/python3.7/dist-packages (from keras-applications>=1.0.8->tensorflow==1.15) (3.1.0)\n",
+ "Requirement already satisfied: importlib-metadata; python_version < \"3.8\" in /usr/local/lib/python3.7/dist-packages (from markdown>=2.6.8->tensorboard<1.16.0,>=1.15.0->tensorflow==1.15) (4.5.0)\n",
+ "Requirement already satisfied: cached-property; python_version < \"3.8\" in /usr/local/lib/python3.7/dist-packages (from h5py->keras-applications>=1.0.8->tensorflow==1.15) (1.5.2)\n",
+ "Requirement already satisfied: zipp>=0.5 in /usr/local/lib/python3.7/dist-packages (from importlib-metadata; python_version < \"3.8\"->markdown>=2.6.8->tensorboard<1.16.0,>=1.15.0->tensorflow==1.15) (3.4.1)\n",
+ "Requirement already satisfied: typing-extensions>=3.6.4; python_version < \"3.8\" in /usr/local/lib/python3.7/dist-packages (from importlib-metadata; python_version < \"3.8\"->markdown>=2.6.8->tensorboard<1.16.0,>=1.15.0->tensorflow==1.15) (3.7.4.3)\n",
+ "Building wheels for collected packages: gast\n",
+ " Building wheel for gast (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
+ " Created wheel for gast: filename=gast-0.2.2-cp37-none-any.whl size=7557 sha256=b9b362dc4c0d1e05be50daaf72075a04f18eb1de2cb83ad4cf5ec6942c4c099d\n",
+ " Stored in directory: /root/.cache/pip/wheels/5c/2e/7e/a1d4d4fcebe6c381f378ce7743a3ced3699feb89bcfbdadadd\n",
+ "Successfully built gast\n",
+ "\u001b[31mERROR: tensorflow-probability 0.12.1 has requirement gast>=0.3.2, but you'll have gast 0.2.2 which is incompatible.\u001b[0m\n",
+ "\u001b[31mERROR: kapre 0.3.5 has requirement tensorflow>=2.0.0, but you'll have tensorflow 1.15.0 which is incompatible.\u001b[0m\n",
+ "Installing collected packages: tensorflow-estimator, keras-applications, gast, tensorflow\n",
+ " Found existing installation: tensorflow-estimator 2.5.0\n",
+ " Uninstalling tensorflow-estimator-2.5.0:\n",
+ " Successfully uninstalled tensorflow-estimator-2.5.0\n",
+ " Found existing installation: gast 0.4.0\n",
+ " Uninstalling gast-0.4.0:\n",
+ " Successfully uninstalled gast-0.4.0\n",
+ " Found existing installation: tensorflow 2.5.0\n",
+ " Uninstalling tensorflow-2.5.0:\n",
+ " Successfully uninstalled tensorflow-2.5.0\n",
+ "Successfully installed gast-0.2.2 keras-applications-1.0.8 tensorflow-1.15.0 tensorflow-estimator-1.15.1\n",
+ "Requirement already satisfied: tensorboard==1.15 in /usr/local/lib/python3.7/dist-packages (1.15.0)\n",
+ "Requirement already satisfied: absl-py>=0.4 in /usr/local/lib/python3.7/dist-packages (from tensorboard==1.15) (0.12.0)\n",
+ "Requirement already satisfied: markdown>=2.6.8 in /usr/local/lib/python3.7/dist-packages (from tensorboard==1.15) (3.3.4)\n",
+ "Requirement already satisfied: wheel>=0.26; python_version >= \"3\" in /usr/local/lib/python3.7/dist-packages (from tensorboard==1.15) (0.36.2)\n",
+ "Requirement already satisfied: setuptools>=41.0.0 in /usr/local/lib/python3.7/dist-packages (from tensorboard==1.15) (57.0.0)\n",
+ "Requirement already satisfied: six>=1.10.0 in /usr/local/lib/python3.7/dist-packages (from tensorboard==1.15) (1.15.0)\n",
+ "Requirement already satisfied: werkzeug>=0.11.15 in /usr/local/lib/python3.7/dist-packages (from tensorboard==1.15) (1.0.1)\n",
+ "Requirement already satisfied: protobuf>=3.6.0 in /usr/local/lib/python3.7/dist-packages (from tensorboard==1.15) (3.12.4)\n",
+ "Requirement already satisfied: grpcio>=1.6.3 in /usr/local/lib/python3.7/dist-packages (from tensorboard==1.15) (1.34.1)\n",
+ "Requirement already satisfied: numpy>=1.12.0 in /usr/local/lib/python3.7/dist-packages (from tensorboard==1.15) (1.19.5)\n",
+ "Requirement already satisfied: importlib-metadata; python_version < \"3.8\" in /usr/local/lib/python3.7/dist-packages (from markdown>=2.6.8->tensorboard==1.15) (4.5.0)\n",
+ "Requirement already satisfied: typing-extensions>=3.6.4; python_version < \"3.8\" in /usr/local/lib/python3.7/dist-packages (from importlib-metadata; python_version < \"3.8\"->markdown>=2.6.8->tensorboard==1.15) (3.7.4.3)\n",
+ "Requirement already satisfied: zipp>=0.5 in /usr/local/lib/python3.7/dist-packages (from importlib-metadata; python_version < \"3.8\"->markdown>=2.6.8->tensorboard==1.15) (3.4.1)\n",
+ "Collecting wget\n",
+ " Downloading https://files.pythonhosted.org/packages/47/6a/62e288da7bcda82b935ff0c6cfe542970f04e29c756b0e147251b2fb251f/wget-3.2.zip\n",
+ "Building wheels for collected packages: wget\n",
+ " Building wheel for wget (setup.py) ... \u001b[?25l\u001b[?25hdone\n",
+ " Created wheel for wget: filename=wget-3.2-cp37-none-any.whl size=9675 sha256=0ee752c74ee35d6038de394ff408eb5e7a9dfe00e1e53a8cd5940483007dc86a\n",
+ " Stored in directory: /root/.cache/pip/wheels/40/15/30/7d8f7cea2902b4db79e3fea550d7d7b85ecb27ef992b618f3f\n",
+ "Successfully built wget\n",
+ "Installing collected packages: wget\n",
+ "Successfully installed wget-3.2\n",
+ "Requirement already satisfied: textblob in /usr/local/lib/python3.7/dist-packages (0.15.3)\n",
+ "Requirement already satisfied: nltk>=3.1 in /usr/local/lib/python3.7/dist-packages (from textblob) (3.2.5)\n",
+ "Requirement already satisfied: six in /usr/local/lib/python3.7/dist-packages (from nltk>=3.1->textblob) (1.15.0)\n",
+ "Requirement already satisfied: en_core_web_sm==2.2.5 from https://github.com/explosion/spacy-models/releases/download/en_core_web_sm-2.2.5/en_core_web_sm-2.2.5.tar.gz#egg=en_core_web_sm==2.2.5 in /usr/local/lib/python3.7/dist-packages (2.2.5)\n",
+ "Requirement already satisfied: spacy>=2.2.2 in /usr/local/lib/python3.7/dist-packages (from en_core_web_sm==2.2.5) (2.2.4)\n",
+ "Requirement already satisfied: wasabi<1.1.0,>=0.4.0 in /usr/local/lib/python3.7/dist-packages (from spacy>=2.2.2->en_core_web_sm==2.2.5) (0.8.2)\n",
+ "Requirement already satisfied: setuptools in /usr/local/lib/python3.7/dist-packages (from spacy>=2.2.2->en_core_web_sm==2.2.5) (57.0.0)\n",
+ "Requirement already satisfied: requests<3.0.0,>=2.13.0 in /usr/local/lib/python3.7/dist-packages (from spacy>=2.2.2->en_core_web_sm==2.2.5) (2.23.0)\n",
+ "Requirement already satisfied: blis<0.5.0,>=0.4.0 in /usr/local/lib/python3.7/dist-packages (from spacy>=2.2.2->en_core_web_sm==2.2.5) (0.4.1)\n",
+ "Requirement already satisfied: preshed<3.1.0,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from spacy>=2.2.2->en_core_web_sm==2.2.5) (3.0.5)\n",
+ "Requirement already satisfied: plac<1.2.0,>=0.9.6 in /usr/local/lib/python3.7/dist-packages (from spacy>=2.2.2->en_core_web_sm==2.2.5) (1.1.3)\n",
+ "Requirement already satisfied: numpy>=1.15.0 in /usr/local/lib/python3.7/dist-packages (from spacy>=2.2.2->en_core_web_sm==2.2.5) (1.19.5)\n",
+ "Requirement already satisfied: murmurhash<1.1.0,>=0.28.0 in /usr/local/lib/python3.7/dist-packages (from spacy>=2.2.2->en_core_web_sm==2.2.5) (1.0.5)\n",
+ "Requirement already satisfied: srsly<1.1.0,>=1.0.2 in /usr/local/lib/python3.7/dist-packages (from spacy>=2.2.2->en_core_web_sm==2.2.5) (1.0.5)\n",
+ "Requirement already satisfied: cymem<2.1.0,>=2.0.2 in /usr/local/lib/python3.7/dist-packages (from spacy>=2.2.2->en_core_web_sm==2.2.5) (2.0.5)\n",
+ "Requirement already satisfied: tqdm<5.0.0,>=4.38.0 in /usr/local/lib/python3.7/dist-packages (from spacy>=2.2.2->en_core_web_sm==2.2.5) (4.41.1)\n",
+ "Requirement already satisfied: thinc==7.4.0 in /usr/local/lib/python3.7/dist-packages (from spacy>=2.2.2->en_core_web_sm==2.2.5) (7.4.0)\n",
+ "Requirement already satisfied: catalogue<1.1.0,>=0.0.7 in /usr/local/lib/python3.7/dist-packages (from spacy>=2.2.2->en_core_web_sm==2.2.5) (1.0.0)\n",
+ "Requirement already satisfied: chardet<4,>=3.0.2 in /usr/local/lib/python3.7/dist-packages (from requests<3.0.0,>=2.13.0->spacy>=2.2.2->en_core_web_sm==2.2.5) (3.0.4)\n",
+ "Requirement already satisfied: idna<3,>=2.5 in /usr/local/lib/python3.7/dist-packages (from requests<3.0.0,>=2.13.0->spacy>=2.2.2->en_core_web_sm==2.2.5) (2.10)\n",
+ "Requirement already satisfied: certifi>=2017.4.17 in /usr/local/lib/python3.7/dist-packages (from requests<3.0.0,>=2.13.0->spacy>=2.2.2->en_core_web_sm==2.2.5) (2021.5.30)\n",
+ "Requirement already satisfied: urllib3!=1.25.0,!=1.25.1,<1.26,>=1.21.1 in /usr/local/lib/python3.7/dist-packages (from requests<3.0.0,>=2.13.0->spacy>=2.2.2->en_core_web_sm==2.2.5) (1.24.3)\n",
+ "Requirement already satisfied: importlib-metadata>=0.20; python_version < \"3.8\" in /usr/local/lib/python3.7/dist-packages (from catalogue<1.1.0,>=0.0.7->spacy>=2.2.2->en_core_web_sm==2.2.5) (4.5.0)\n",
+ "Requirement already satisfied: zipp>=0.5 in /usr/local/lib/python3.7/dist-packages (from importlib-metadata>=0.20; python_version < \"3.8\"->catalogue<1.1.0,>=0.0.7->spacy>=2.2.2->en_core_web_sm==2.2.5) (3.4.1)\n",
+ "Requirement already satisfied: typing-extensions>=3.6.4; python_version < \"3.8\" in /usr/local/lib/python3.7/dist-packages (from importlib-metadata>=0.20; python_version < \"3.8\"->catalogue<1.1.0,>=0.0.7->spacy>=2.2.2->en_core_web_sm==2.2.5) (3.7.4.3)\n",
+ "\u001b[38;5;2m✔ Download and installation successful\u001b[0m\n",
+ "You can now load the model via spacy.load('en_core_web_sm')\n"
]
}
],
@@ -164,6 +203,8 @@
"!pip install numbskull==0.1.1\n",
"!pip install tensorflow==1.15\n",
"!pip install tensorboard==1.15\n",
+ "!pip install wget\n",
+ "!pip install textblob\n",
"!python -m spacy download en_core_web_sm"
]
},
@@ -174,7 +215,8 @@
"ExecuteTime": {
"end_time": "2021-04-03T11:08:02.765409Z",
"start_time": "2021-04-03T11:08:02.750395Z"
- }
+ },
+ "id": "1_TfLGPSr3OQ"
},
"outputs": [],
"source": [
@@ -185,7 +227,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "fYsYe4tOomEM"
},
"source": [
@@ -200,28 +241,28 @@
"ExecuteTime": {
"end_time": "2021-04-03T11:08:04.193561Z",
"start_time": "2021-04-03T11:08:02.766409Z"
- }
+ },
+ "colab": {
+ "base_uri": "https://localhost:8080/"
+ },
+ "id": "1hO0ncklr3OR",
+ "outputId": "d92aa059-86fb-4395-cbaf-2fc9198f2825"
},
"outputs": [
- {
- "name": "stdout",
- "output_type": "stream",
- "text": [
- "100% [............................................................................] 163567 / 163567"
- ]
- },
{
"data": {
"text/plain": [
- "['Youtube01-Psy.csv',\n",
+ "['Youtube05-Shakira.csv',\n",
" 'Youtube02-KatyPerry.csv',\n",
" 'Youtube03-LMFAO.csv',\n",
- " 'Youtube04-Eminem.csv',\n",
- " 'Youtube05-Shakira.csv']"
+ " 'Youtube01-Psy.csv',\n",
+ " 'Youtube04-Eminem.csv']"
]
},
"execution_count": 3,
- "metadata": {},
+ "metadata": {
+ "tags": []
+ },
"output_type": "execute_result"
}
],
@@ -251,7 +292,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "H2msvroyoZ5W"
},
"source": [
@@ -267,19 +307,23 @@
"start_time": "2021-04-03T11:08:04.194562Z"
},
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 139
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "F2MGdPXm7IvY",
- "outputId": "2e2079af-2b09-4006-cb64-7e4a374071c9"
+ "outputId": "e19dd48c-20ee-4f49-92d5-b3e123feb1b9"
},
"outputs": [
{
- "name": "stderr",
+ "name": "stdout",
"output_type": "stream",
"text": [
- "Cloning into 'snorkel-tutorials'...\n"
+ "Cloning into 'snorkel-tutorials'...\n",
+ "remote: Enumerating objects: 1124, done.\u001b[K\n",
+ "remote: Counting objects: 100% (65/65), done.\u001b[K\n",
+ "remote: Compressing objects: 100% (56/56), done.\u001b[K\n",
+ "remote: Total 1124 (delta 28), reused 15 (delta 8), pack-reused 1059\u001b[K\n",
+ "Receiving objects: 100% (1124/1124), 3.53 MiB | 19.66 MiB/s, done.\n",
+ "Resolving deltas: 100% (743/743), done.\n"
]
}
],
@@ -302,7 +346,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "XM6JWmh6oxtv"
},
"source": [
@@ -317,8 +360,6 @@
"end_time": "2021-04-03T11:08:10.334905Z",
"start_time": "2021-04-03T11:08:06.478745Z"
},
- "colab": {},
- "colab_type": "code",
"id": "h-vgmzc7B0PM",
"scrolled": true
},
@@ -365,7 +406,8 @@
"ExecuteTime": {
"end_time": "2021-04-03T11:08:10.350918Z",
"start_time": "2021-04-03T11:08:10.335905Z"
- }
+ },
+ "id": "0Lp8IEfZr3OT"
},
"outputs": [],
"source": [
@@ -412,11 +454,10 @@
},
"colab": {
"base_uri": "https://localhost:8080/",
- "height": 448
+ "height": 407
},
- "colab_type": "code",
"id": "PQ_a_pkV3tdR",
- "outputId": "037e36ad-5c7e-4ea6-9daf-2ee959847dd7",
+ "outputId": "01776a69-84fd-407d-c4f2-4c804321329e",
"scrolled": false
},
"outputs": [
@@ -501,22 +542,19 @@
""
],
"text/plain": [
- " author date \\\n",
- "0 Alessandro leite 2014-11-05T22:21:36 \n",
- "1 Salim Tayara 2014-11-02T14:33:30 \n",
- "2 Phuc Ly 2014-01-20T15:27:47 \n",
- "3 DropShotSk8r 2014-01-19T04:27:18 \n",
- "4 css403 2014-11-07T14:25:48 \n",
+ " author date ... label video\n",
+ "0 Alessandro leite 2014-11-05T22:21:36 ... -1.0 1\n",
+ "1 Salim Tayara 2014-11-02T14:33:30 ... -1.0 1\n",
+ "2 Phuc Ly 2014-01-20T15:27:47 ... -1.0 1\n",
+ "3 DropShotSk8r 2014-01-19T04:27:18 ... -1.0 1\n",
+ "4 css403 2014-11-07T14:25:48 ... -1.0 1\n",
"\n",
- " text label video \n",
- "0 pls http://www10.vakinha.com.br/VaquinhaE.aspx... -1.0 1 \n",
- "1 if your like drones, plz subscribe to Kamal Ta... -1.0 1 \n",
- "2 go here to check the views :3 -1.0 1 \n",
- "3 Came here to check the views, goodbye. -1.0 1 \n",
- "4 i am 2,126,492,636 viewer :D -1.0 1 "
+ "[5 rows x 5 columns]"
]
},
- "metadata": {},
+ "metadata": {
+ "tags": []
+ },
"output_type": "display_data"
},
{
@@ -600,23 +638,20 @@
""
],
"text/plain": [
- " author date \\\n",
- "27 حلم الشباب 2015-05-25T23:42:49.533000 \n",
- "194 MOHAMED THASLEEM 2015-05-24T07:03:59.488000 \n",
- "277 AlabaGames 2015-05-22T00:31:43.922000 \n",
- "132 Manish Ray 2015-05-23T08:55:07.512000 \n",
- "163 Sudheer Yadav 2015-05-28T10:28:25.133000 \n",
+ " author date ... label video\n",
+ "27 حلم الشباب 2015-05-25T23:42:49.533000 ... 1 5\n",
+ "194 MOHAMED THASLEEM 2015-05-24T07:03:59.488000 ... 0 5\n",
+ "277 AlabaGames 2015-05-22T00:31:43.922000 ... 1 5\n",
+ "132 Manish Ray 2015-05-23T08:55:07.512000 ... 0 5\n",
+ "163 Sudheer Yadav 2015-05-28T10:28:25.133000 ... 1 5\n",
"\n",
- " text label video \n",
- "27 Check out this video on YouTube: 1 5 \n",
- "194 super music 0 5 \n",
- "277 Subscribe my channel I RECORDING FIFA 15 GOAL... 1 5 \n",
- "132 This song is so beauty 0 5 \n",
- "163 SEE SOME MORE SONG OPEN GOOGLE AND TYPE Shakir... 1 5 "
+ "[5 rows x 5 columns]"
]
},
"execution_count": 7,
- "metadata": {},
+ "metadata": {
+ "tags": []
+ },
"output_type": "execute_result"
}
],
@@ -637,34 +672,33 @@
"start_time": "2021-04-03T11:08:10.448007Z"
},
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 34
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "sYk70EPO4sk3",
- "outputId": "db2db996-7faa-453d-c3d7-0e1049dc8d81"
+ "outputId": "cedead41-f044-48e7-fce0-9a3e5c80e645"
},
"outputs": [
{
"data": {
"text/plain": [
- "array([1, 0, 1, 0, 1], dtype=int64)"
+ "array([1, 0, 1, 0, 1, 0, 1, 0, 1, 1])"
]
},
"execution_count": 8,
- "metadata": {},
+ "metadata": {
+ "tags": []
+ },
"output_type": "execute_result"
}
],
"source": [
"Y_test = df_test.label.values\n",
- "Y_test[:5]"
+ "Y_test[:10]"
]
},
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "YSxLJ9P2ptsG"
},
"source": [
@@ -684,8 +718,6 @@
"end_time": "2021-04-03T11:08:10.478036Z",
"start_time": "2021-04-03T11:08:10.464021Z"
},
- "colab": {},
- "colab_type": "code",
"id": "BUPjY_nKbJEM"
},
"outputs": [],
@@ -698,7 +730,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "AA94SzMiqJQq"
},
"source": [
@@ -716,11 +747,10 @@
},
"colab": {
"base_uri": "https://localhost:8080/",
- "height": 677
+ "height": 639
},
- "colab_type": "code",
"id": "fz2VcSoNbMi2",
- "outputId": "67aa06eb-5117-485d-a042-f6086c7983ff"
+ "outputId": "fafc6a04-e14b-4f19-b8ff-937272c5e6d6"
},
"outputs": [
{
@@ -875,53 +905,35 @@
""
],
"text/plain": [
- " author \\\n",
- "240 Lucas Trigo \n",
- "211 Blaze Rod \n",
- "228 MasterRobotTV \n",
- "207 Franklin Music \n",
- "153 lebanonwarior1 \n",
- "8 yenis maría Rodríguez \n",
- "62 RapStarz Coleman \n",
- "54 Jd Hurst \n",
- "353 jefflynnejp \n",
- "406 eliška žáková \n",
- "375 Chris Bieber \n",
- "270 Angela Alor \n",
- "44 BlueYetiPlayz -Call Of Duty and More \n",
- "295 the34104 \n",
- "223 Truc Ng \n",
- "144 Nina Mackie \n",
- "340 DanteBTV \n",
- "19 Paul Garza \n",
- "185 Bo Lanciné MAGASSOUBA \n",
- "73 MrValentinique \n",
+ " author ... video\n",
+ "240 Lucas Trigo ... 1\n",
+ "211 Blaze Rod ... 3\n",
+ "228 MasterRobotTV ... 1\n",
+ "207 Franklin Music ... 3\n",
+ "153 lebanonwarior1 ... 1\n",
+ "8 yenis maría Rodríguez ... 3\n",
+ "62 RapStarz Coleman ... 4\n",
+ "54 Jd Hurst ... 3\n",
+ "353 jefflynnejp ... 3\n",
+ "406 eliška žáková ... 3\n",
+ "375 Chris Bieber ... 4\n",
+ "270 Angela Alor ... 3\n",
+ "44 BlueYetiPlayz -Call Of Duty and More ... 1\n",
+ "295 the34104 ... 4\n",
+ "223 Truc Ng ... 2\n",
+ "144 Nina Mackie ... 3\n",
+ "340 DanteBTV ... 4\n",
+ "19 Paul Garza ... 3\n",
+ "185 Bo Lanciné MAGASSOUBA ... 4\n",
+ "73 MrValentinique ... 1\n",
"\n",
- " text video \n",
- "240 WHATS UP EVERYONE!? :-) I Trying To Showcase M... 1 \n",
- "211 when i see this back in 2015 i ask myself how ... 3 \n",
- "228 http://www.twitch.tv/zxlightsoutxz 1 \n",
- "207 Very Nice ! 3 \n",
- "153 Song name?? 1 \n",
- "8 2015 LIKEEE 3 \n",
- "62 Subscribe To Mê Please Guys 4 \n",
- "54 Check out this video on YouTube: 3 \n",
- "353 Check out this video on YouTube: 3 \n",
- "406 CUTE :) 3 \n",
- "375 Love the way you lie II is nicer in my opinion... 4 \n",
- "270 HOW DO YOU PUT A PICTURE FOR YOUR IMAGE THINGI... 3 \n",
- "44 subscribe to me for call of duty vids and give... 1 \n",
- "295 check out eminem latest track survival if u didnt 4 \n",
- "223 https://www.facebook.com/myfunnyriddles 2 \n",
- "144 Take a look at this video on YouTub
You 3 \n",
- "340 Check Out The New Hot Video By Dante B Called ... 4 \n",
- "19 Check out this video on YouTube: 3 \n",
- "185 WE GO FOR 1,000,000,000 FOR EMINEM 4 \n",
- "73 https://www.facebook.com/eeccon/posts/73394924... 1 "
+ "[20 rows x 3 columns]"
]
},
"execution_count": 10,
- "metadata": {},
+ "metadata": {
+ "tags": []
+ },
"output_type": "execute_result"
}
],
@@ -932,7 +944,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "8Pin_a-epBXr"
},
"source": [
@@ -947,8 +958,6 @@
"end_time": "2021-04-03T11:08:10.510064Z",
"start_time": "2021-04-03T11:08:10.496052Z"
},
- "colab": {},
- "colab_type": "code",
"id": "mpSoy45Mblnr"
},
"outputs": [],
@@ -962,7 +971,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "NcVpGTOpqbSr"
},
"source": [
@@ -978,8 +986,6 @@
"end_time": "2021-04-03T11:08:10.526079Z",
"start_time": "2021-04-03T11:08:10.511065Z"
},
- "colab": {},
- "colab_type": "code",
"id": "OI9-aAYAbs1e"
},
"outputs": [],
@@ -994,17 +1000,16 @@
"\n",
"@labeling_function()\n",
"def my_channel(x):\n",
- " return SPAM if \"my channel\" in x.text.lower() else ABSTAIN\n",
+ " return SPAM if \"my channel\" in x.text.lower() else ABSTAIN\n",
"\n",
"@labeling_function()\n",
"def if_subscribe(x):\n",
- " return SPAM if \"subscribe\" in x.text.lower() else ABSTAIN"
+ " return SPAM if \"subscribe\" in x.text.lower() else ABSTAIN"
]
},
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "VmBAWflGqzCL"
},
"source": [
@@ -1022,19 +1027,17 @@
"start_time": "2021-04-03T11:08:10.527080Z"
},
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 34
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "Ab5nnlrzcUBY",
- "outputId": "6352eddb-c673-4fef-e100-b2d74c984710"
+ "outputId": "955fade7-040c-4e4e-8be1-791e89dd8e1f"
},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
- "100%|███████████████████████████████████████████████████████████████████████████| 1586/1586 [00:00<00:00, 23649.62it/s]\n"
+ "100%|██████████| 1586/1586 [00:00<00:00, 13520.09it/s]\n"
]
}
],
@@ -1054,12 +1057,10 @@
"start_time": "2021-04-03T11:08:10.607070Z"
},
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 139
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "iEQOljcHcZh1",
- "outputId": "03b69925-a749-4da0-b43b-093dd99a5dcc"
+ "outputId": "d4415c36-a388-4d5b-b023-ffd4c2a64074"
},
"outputs": [
{
@@ -1075,7 +1076,9 @@
]
},
"execution_count": 14,
- "metadata": {},
+ "metadata": {
+ "tags": []
+ },
"output_type": "execute_result"
}
],
@@ -1086,7 +1089,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "l6vJmvsgrl9O"
},
"source": [
@@ -1102,12 +1104,10 @@
"start_time": "2021-04-03T11:08:10.622084Z"
},
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 104
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "LZS3HRs1c7BB",
- "outputId": "5e14598b-c60d-40a5-960e-5cbac8c28e6f"
+ "outputId": "8fed2489-93ff-42bc-fdb7-0903b09e5054"
},
"outputs": [
{
@@ -1134,7 +1134,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "I_Lflxdir08t"
},
"source": [
@@ -1156,11 +1155,10 @@
},
"colab": {
"base_uri": "https://localhost:8080/",
- "height": 206
+ "height": 195
},
- "colab_type": "code",
"id": "Hb63fpwQdqin",
- "outputId": "3687be18-3e39-429d-a179-4dbacf8de494"
+ "outputId": "eb38910a-f638-4cb3-e9f7-6974d475fe27"
},
"outputs": [
{
@@ -1246,7 +1244,9 @@
]
},
"execution_count": 16,
- "metadata": {},
+ "metadata": {
+ "tags": []
+ },
"output_type": "execute_result"
}
],
@@ -1257,7 +1257,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "lMAK17fqtOAK"
},
"source": [
@@ -1274,11 +1273,10 @@
},
"colab": {
"base_uri": "https://localhost:8080/",
- "height": 363
+ "height": 343
},
- "colab_type": "code",
"id": "QHSdjvyVd2QB",
- "outputId": "8024e6a5-f1d9-49bd-c063-ea5bd52f48ee"
+ "outputId": "ad70a3fa-f30b-40f1-a880-dd0872027b95"
},
"outputs": [
{
@@ -1395,33 +1393,25 @@
""
],
"text/plain": [
- " author date \\\n",
- "34 TA Stealth 2015-03-11T01:25:46.234000 \n",
- "288 ItsJoey Dash 2014-07-22T10:02:25.925000 \n",
- "36 Victor Gamer 2015-04-13T02:00:20.152000 \n",
- "263 Backup Plus 2014-11-03T17:39:07 \n",
- "386 ItsJoey Dash 2014-07-22T10:04:05.755000 \n",
- "404 M.E.S NaN \n",
- "341 superfacoo NaN \n",
- "229 Terry-Lee Mackenney NaN \n",
- "157 TopMusicWorld HD 2014-10-19T23:27:50 \n",
- "48 Kiddy Kidso 2014-01-19T16:49:52 \n",
+ " author date ... label video\n",
+ "34 TA Stealth 2015-03-11T01:25:46.234000 ... -1.0 3\n",
+ "288 ItsJoey Dash 2014-07-22T10:02:25.925000 ... -1.0 3\n",
+ "36 Victor Gamer 2015-04-13T02:00:20.152000 ... -1.0 3\n",
+ "263 Backup Plus 2014-11-03T17:39:07 ... -1.0 1\n",
+ "386 ItsJoey Dash 2014-07-22T10:04:05.755000 ... -1.0 3\n",
+ "404 M.E.S NaN ... -1.0 4\n",
+ "341 superfacoo NaN ... -1.0 4\n",
+ "229 Terry-Lee Mackenney NaN ... -1.0 4\n",
+ "157 TopMusicWorld HD 2014-10-19T23:27:50 ... -1.0 2\n",
+ "48 Kiddy Kidso 2014-01-19T16:49:52 ... -1.0 1\n",
"\n",
- " text label video \n",
- "34 Cool Video LMFAOVEVO! You should check out my ... -1.0 3 \n",
- "288 EVERYONE PLEASE GO SUBSCRIBE TO MY CHANNEL OR ... -1.0 3 \n",
- "36 View 851.247.920
Best youtube Vide... -1.0 3 \n",
- "263 Suscribe My Channel Please XD lol -1.0 1 \n",
- "386 EVERYONE PLEASE SUBSCRIBE TO MY CHANNEL OR CAN... -1.0 3 \n",
- "404 hey its M.E.S here I'm a young up and comi... -1.0 4 \n",
- "341 Hey? Everyone Please take a moment to read thi... -1.0 4 \n",
- "229 Hi Guys im an Upcoming Rapper if you could che... -1.0 4 \n",
- "157 Please Subscribe In My Channel → -1.0 2 \n",
- "48 Check my channel please! And listen to the bes... -1.0 1 "
+ "[10 rows x 5 columns]"
]
},
"execution_count": 17,
- "metadata": {},
+ "metadata": {
+ "tags": []
+ },
"output_type": "execute_result"
}
],
@@ -1434,7 +1424,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "brmOFPoMtefG"
},
"source": [
@@ -1451,11 +1440,10 @@
},
"colab": {
"base_uri": "https://localhost:8080/",
- "height": 363
+ "height": 343
},
- "colab_type": "code",
"id": "SCup4XPReLeE",
- "outputId": "ebce9e4c-011b-4f81-8e57-78c257ddd4a1"
+ "outputId": "252e4980-07a7-4d68-d700-2e91920949f0"
},
"outputs": [
{
@@ -1572,33 +1560,25 @@
""
],
"text/plain": [
- " author date \\\n",
- "230 LBEProductions 2014-11-12T01:40:22 \n",
- "287 DERRICK HANFORD 2014-12-05T22:52:29.316000 \n",
- "113 Carlos Thegamer 2013-12-01T01:20:21 \n",
- "301 Ractive NaN \n",
- "246 Patrik Gybka 2015-05-05T09:32:04.687000 \n",
- "8 Youyou A. 2014-10-21T15:20:49 \n",
- "333 FreexGaming 2014-10-18T08:12:26 \n",
- "161 MarianMusicChannel 2014-08-24T03:57:52 \n",
- "171 MR magic man 2014-09-25T10:42:47 \n",
- "10 Dany PK NaN \n",
+ " author date ... label video\n",
+ "230 LBEProductions 2014-11-12T01:40:22 ... -1.0 1\n",
+ "287 DERRICK HANFORD 2014-12-05T22:52:29.316000 ... -1.0 3\n",
+ "113 Carlos Thegamer 2013-12-01T01:20:21 ... -1.0 1\n",
+ "301 Ractive NaN ... -1.0 4\n",
+ "246 Patrik Gybka 2015-05-05T09:32:04.687000 ... -1.0 3\n",
+ "8 Youyou A. 2014-10-21T15:20:49 ... -1.0 2\n",
+ "333 FreexGaming 2014-10-18T08:12:26 ... -1.0 2\n",
+ "161 MarianMusicChannel 2014-08-24T03:57:52 ... -1.0 2\n",
+ "171 MR magic man 2014-09-25T10:42:47 ... -1.0 2\n",
+ "10 Dany PK NaN ... -1.0 4\n",
"\n",
- " text label video \n",
- "230 Hey guys can you check my channel out plz. I d... -1.0 1 \n",
- "287 White people are going extinct for more inform... -1.0 3 \n",
- "113 subscribe to my channel people :D -1.0 1 \n",
- "301 i been working so hard for the past 60 days to... -1.0 4 \n",
- "246 SUBSCRIBE MY CHANNEL PLEASE LOL PRO PLAYS) -1.0 3 \n",
- "8 I make guitar covers, please have a look at my... -1.0 2 \n",
- "333 want to win borderlands the pre-sequel? check ... -1.0 2 \n",
- "161 Hello! I'm Marian, I'm a singer from Venezuela... -1.0 2 \n",
- "171 Please look at my channel -1.0 2 \n",
- "10 SUBSCRIBE TO MY CHANNEL X PLEASE!. SPARE -1.0 4 "
+ "[10 rows x 5 columns]"
]
},
"execution_count": 18,
- "metadata": {},
+ "metadata": {
+ "tags": []
+ },
"output_type": "execute_result"
}
],
@@ -1613,7 +1593,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "oHmTYt8btmcb"
},
"source": [
@@ -1630,8 +1609,6 @@
"end_time": "2021-04-03T11:08:10.701156Z",
"start_time": "2021-04-03T11:08:10.686143Z"
},
- "colab": {},
- "colab_type": "code",
"id": "DumNxb_PiEeN"
},
"outputs": [],
@@ -1651,19 +1628,17 @@
"start_time": "2021-04-03T11:08:10.702157Z"
},
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 34
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "fkgLHcPgkkQV",
- "outputId": "95e329d7-f31b-47fc-9052-daf1b9b11ebe"
+ "outputId": "23fb4f98-84b3-4798-9b39-eb7dd65a7c9f"
},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
- "100%|███████████████████████████████████████████████████████████████████████████| 1586/1586 [00:00<00:00, 35212.86it/s]\n"
+ "100%|██████████| 1586/1586 [00:00<00:00, 22789.90it/s]\n"
]
}
],
@@ -1684,11 +1659,10 @@
},
"colab": {
"base_uri": "https://localhost:8080/",
- "height": 143
+ "height": 136
},
- "colab_type": "code",
"id": "854a-lHSkpB3",
- "outputId": "a7b30b81-4880-40cd-d520-2f55e24bb6fd"
+ "outputId": "f1a69983-1858-447f-c1e6-0d57e99b81ec"
},
"outputs": [
{
@@ -1756,7 +1730,9 @@
]
},
"execution_count": 21,
- "metadata": {},
+ "metadata": {
+ "tags": []
+ },
"output_type": "execute_result"
}
],
@@ -1774,11 +1750,10 @@
},
"colab": {
"base_uri": "https://localhost:8080/",
- "height": 363
+ "height": 343
},
- "colab_type": "code",
"id": "HaQZ-7PolblW",
- "outputId": "a06d2efa-ed06-4f37-ddea-9d6334f916af"
+ "outputId": "92212dd8-bc90-4495-a325-393e56f5997e"
},
"outputs": [
{
@@ -1895,33 +1870,25 @@
""
],
"text/plain": [
- " author date \\\n",
- "112 ArioseRose 2014-11-13T15:20:31 \n",
- "273 Artady 2014-08-11T16:27:55 \n",
- "190 Warrdrew 2014-11-07T07:46:57 \n",
- "146 Bob Kanowski 2013-11-28T12:33:27 \n",
- "139 MFkin PRXPHETZ 2014-01-20T09:08:39 \n",
- "191 RezAIIDay 2014-11-05T22:50:58 \n",
- "16 zhichao wang 2013-11-29T02:13:56 \n",
- "162 Owen Lai 2013-12-01T04:51:52 \n",
- "239 Cony 2013-11-28T16:01:47 \n",
- "322 Minecraft-Viasat 2014-11-03T14:38:53 \n",
+ " author date ... label video\n",
+ "112 ArioseRose 2014-11-13T15:20:31 ... -1.0 1\n",
+ "273 Artady 2014-08-11T16:27:55 ... -1.0 2\n",
+ "190 Warrdrew 2014-11-07T07:46:57 ... -1.0 1\n",
+ "146 Bob Kanowski 2013-11-28T12:33:27 ... -1.0 1\n",
+ "139 MFkin PRXPHETZ 2014-01-20T09:08:39 ... -1.0 1\n",
+ "191 RezAIIDay 2014-11-05T22:50:58 ... -1.0 2\n",
+ "16 zhichao wang 2013-11-29T02:13:56 ... -1.0 1\n",
+ "162 Owen Lai 2013-12-01T04:51:52 ... -1.0 1\n",
+ "239 Cony 2013-11-28T16:01:47 ... -1.0 1\n",
+ "322 Minecraft-Viasat 2014-11-03T14:38:53 ... -1.0 1\n",
"\n",
- " text label video \n",
- "112 Don't mind me, I'm just checking what the view... -1.0 1 \n",
- "273 https://soundcloud.com/artady please check my ... -1.0 2 \n",
- "190 I'm here to check the views.. holy shit -1.0 1 \n",
- "146 i turned it on mute as soon is i came on i jus... -1.0 1 \n",
- "139 if you like raw talent, raw lyrics, straight r... -1.0 1 \n",
- "191 Such a good song ans Katy sounds great over th... -1.0 2 \n",
- "16 i think about 100 millions of the views come f... -1.0 1 \n",
- "162 just checking the views -1.0 1 \n",
- "239 You should check my channel for Funny VIDEOS!! -1.0 1 \n",
- "322 Check my channel -1.0 1 "
+ "[10 rows x 5 columns]"
]
},
"execution_count": 22,
- "metadata": {},
+ "metadata": {
+ "tags": []
+ },
"output_type": "execute_result"
}
],
@@ -1933,7 +1900,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "646laecIt2y4"
},
"source": [
@@ -1948,8 +1914,6 @@
"end_time": "2021-04-03T11:08:10.812635Z",
"start_time": "2021-04-03T11:08:10.798620Z"
},
- "colab": {},
- "colab_type": "code",
"id": "oBMqQuBUmRz1"
},
"outputs": [],
@@ -1970,8 +1934,6 @@
"end_time": "2021-04-03T11:08:10.828649Z",
"start_time": "2021-04-03T11:08:10.814636Z"
},
- "colab": {},
- "colab_type": "code",
"id": "u97Ql5_W6MNf"
},
"outputs": [],
@@ -1994,19 +1956,17 @@
"start_time": "2021-04-03T11:08:10.829650Z"
},
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 34
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "2pJl0yod-qMe",
- "outputId": "2b45ce28-6592-4472-e559-141454da5f2b"
+ "outputId": "b927d1cb-a39b-4119-c492-53fabc9e212a"
},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
- "100%|████████████████████████████████████████████████████████████████████████████| 1586/1586 [00:01<00:00, 1445.44it/s]\n"
+ "100%|██████████| 1586/1586 [00:01<00:00, 1088.23it/s]\n"
]
}
],
@@ -2027,11 +1987,10 @@
},
"colab": {
"base_uri": "https://localhost:8080/",
- "height": 112
+ "height": 106
},
- "colab_type": "code",
"id": "q5NVqhPr--EO",
- "outputId": "f1e6133e-25e4-4713-a9d5-9e95829669ff"
+ "outputId": "246bdc68-3388-4842-967a-860bd55bee33"
},
"outputs": [
{
@@ -2090,7 +2049,9 @@
]
},
"execution_count": 26,
- "metadata": {},
+ "metadata": {
+ "tags": []
+ },
"output_type": "execute_result"
}
],
@@ -2101,7 +2062,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "UZxFsE-vH47d"
},
"source": [
@@ -2113,7 +2073,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "QuOJYTmNgjK5"
},
"source": [
@@ -2128,13 +2087,10 @@
"end_time": "2021-04-03T11:08:11.976404Z",
"start_time": "2021-04-03T11:08:11.961384Z"
},
- "colab": {},
- "colab_type": "code",
"id": "MZNRemLj_Bx2"
},
"outputs": [],
"source": [
- "\n",
"def keyword_lookup(x, keywords, label):\n",
" if any(word in x.text.lower() for word in keywords):\n",
" return label\n",
@@ -2168,7 +2124,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "ZxDDetHLhp59"
},
"source": [
@@ -2187,8 +2142,6 @@
"end_time": "2021-04-03T11:08:11.992370Z",
"start_time": "2021-04-03T11:08:11.977405Z"
},
- "colab": {},
- "colab_type": "code",
"id": "ZeNvjhdkhUSK"
},
"outputs": [],
@@ -2202,7 +2155,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "I3GOjwZtiwfw"
},
"source": [
@@ -2217,8 +2169,6 @@
"end_time": "2021-04-03T11:08:17.522364Z",
"start_time": "2021-04-03T11:08:11.993372Z"
},
- "colab": {},
- "colab_type": "code",
"id": "TZ2p4AW1iegt"
},
"outputs": [],
@@ -2244,8 +2194,6 @@
"end_time": "2021-04-03T11:08:22.239568Z",
"start_time": "2021-04-03T11:08:17.523293Z"
},
- "colab": {},
- "colab_type": "code",
"id": "Ya5diNfSlRA1"
},
"outputs": [],
@@ -2264,7 +2212,6 @@
{
"cell_type": "markdown",
"metadata": {
- "colab_type": "text",
"id": "yOL67OFB2N5b"
},
"source": [
@@ -2281,8 +2228,6 @@
"end_time": "2021-04-03T11:08:22.255584Z",
"start_time": "2021-04-03T11:08:22.240569Z"
},
- "colab": {},
- "colab_type": "code",
"id": "HOFzxDkSlpiL"
},
"outputs": [],
@@ -2310,20 +2255,18 @@
"start_time": "2021-04-03T11:08:22.256584Z"
},
"colab": {
- "base_uri": "https://localhost:8080/",
- "height": 52
+ "base_uri": "https://localhost:8080/"
},
- "colab_type": "code",
"id": "W_y7ZTD43Ttp",
- "outputId": "dd9ebd36-1528-49a6-bd23-0c7989d0d451"
+ "outputId": "8078dab7-62b8-4f60-ca71-de098f47def3"
},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
- "100%|█████████████████████████████████████████████████████████████████████████████| 1586/1586 [00:07<00:00, 198.89it/s]\n",
- "100%|███████████████████████████████████████████████████████████████████████████████| 250/250 [00:01<00:00, 157.09it/s]\n"
+ "100%|██████████| 1586/1586 [00:17<00:00, 91.32it/s]\n",
+ "100%|██████████| 250/250 [00:03<00:00, 78.62it/s]\n"
]
}
],
@@ -2343,11 +2286,10 @@
},
"colab": {
"base_uri": "https://localhost:8080/",
- "height": 363
+ "height": 343
},
- "colab_type": "code",
"id": "FXEDv6Nk3a9r",
- "outputId": "9a57832c-bab1-4ab0-a468-7548cacf1c70"
+ "outputId": "46d590c2-49df-4e43-c0c2-37e4c950bc2c"
},
"outputs": [
{
@@ -2384,7 +2326,7 @@
"