Skip to content

Commit

Permalink
edit baseline notebook
Browse files (browse the repository at this point in the history)
  • Loading branch information
oshaikh13 committed Oct 4, 2020
1 parent af4d161 commit 7e30963
Showing 1 changed file with 5 additions and 26 deletions.
31 changes: 5 additions & 26 deletions baselines.ipynb
Expand Up @@ -206,7 +206,7 @@
"metadata": {},
"outputs": [],
"source": [
"class ToxicDataset(Dataset):\n",
"class PersuasionDataset(Dataset):\n",
" \n",
" def __init__(self, tokenizer: AutoTokenizer, dataframe: pd.DataFrame, lazy: bool = False):\n",
" self.tokenizer = tokenizer\n",
Expand Down Expand Up @@ -252,9 +252,9 @@
" y = torch.stack(y)\n",
" return x.cuda(), y.cuda(), index\n",
"\n",
"train_dataset = ToxicDataset(tokenizer, train_df, lazy=True)\n",
"dev_dataset = ToxicDataset(tokenizer, val_df, lazy=True)\n",
"test_dataset = ToxicDataset(tokenizer, test_df, lazy=True)\n",
"train_dataset = PersuasionDataset(tokenizer, train_df, lazy=True)\n",
"dev_dataset = PersuasionDataset(tokenizer, val_df, lazy=True)\n",
"test_dataset = PersuasionDataset(tokenizer, test_df, lazy=True)\n",
"collate_fn = partial(collate_fn)\n",
"BATCH_SIZE = 8\n",
"train_sampler = RandomSampler(train_dataset)\n",
Expand Down Expand Up @@ -489,35 +489,14 @@
" evaluate(model, test_iterator, test_df)"
]
},
{
"cell_type": "code",
"execution_count": 31,
"metadata": {},
"outputs": [],
"source": [
"# from transformers import BertTokenizer, DistillBertModel, AdamW, get_linear_schedule_with_warmup, DistillBertPreTrainedModel\n",
"from sklearn.metrics import roc_auc_score, f1_score, precision_score, recall_score, accuracy_score\n",
"from tqdm import tqdm\n",
"from pathlib import Path\n",
"import logging\n",
"import pickle\n",
"import random\n",
"from nltk.tokenize import sent_tokenize, word_tokenize\n",
"import itertools\n",
"import random\n",
"random.seed(0)\n",
"np.random.seed(0)\n",
"import json"
]
},
{
"cell_type": "code",
"execution_count": 29,
"metadata": {},
"outputs": [],
"source": [
"from sklearn.dummy import DummyClassifier\n",
"from sklearn.feature_extraction.text import TfidfVectorizer\n"
"from sklearn.feature_extraction.text import TfidfVectorizer"
]
},
{
Expand Down

0 comments on commit 7e30963

Please sign in to comment.