In [1]:
from sklearn.model_selection import train_test_split
import pandas as pd
import tensorflow as tf
import tensorflow_hub as hub
from datetime import datetime
from tensorflow import keras
import os
import re
import bert
from bert import run_classifier
from bert import optimization
from bert import tokenization

W0415 11:11:08.187197 15268 __init__.py:56] Some hub symbols are not available because TensorFlow version is less than 1.14


In [2]:
# Load all files from a directory in a DataFrame.
def load_directory_data(directory):
    data = {}
    data["sentence"] = []
    data["sentiment"] = []
    for file_path in os.listdir(directory):
        with tf.gfile.GFile(os.path.join(directory, file_path), "r") as f:
            data["sentence"].append(f.read())
            data["sentiment"].append(
                re.match("\d+_(\d+)\.txt", file_path).group(1))
    return pd.DataFrame.from_dict(data)


# Merge positive and negative examples, add a polarity column and shuffle.
def load_dataset(directory):
    pos_df = load_directory_data(os.path.join(directory, "pos"))
    neg_df = load_directory_data(os.path.join(directory, "neg"))
    pos_df["polarity"] = 1
    neg_df["polarity"] = 0
    return pd.concat([pos_df, neg_df]).sample(frac=1).reset_index(drop=True)


# Download and process the dataset files.
def download_and_load_datasets(force_download=False):
    dataset = tf.keras.utils.get_file(
        fname="aclImdb.tar.gz",
        origin="http://ai.stanford.edu/~amaas/data/sentiment/aclImdb_v1.tar.gz",
        extract=True)
    print(dataset)
    print(os.path.dirname(dataset))

    train_df = load_dataset(
        os.path.join(os.path.dirname(dataset), "aclImdb", "train"))
    test_df = load_dataset(
        os.path.join(os.path.dirname(dataset), "aclImdb", "test"))

    return train_df, test_df

In [3]:
# Reduce logging output.
train, test = download_and_load_datasets()

C:\Users\wangfabei\.keras\datasets\aclImdb.tar.gz
C:\Users\wangfabei\.keras\datasets


In [4]:
train.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 25000 entries, 0 to 24999
Data columns (total 3 columns):
sentence     25000 non-null object
sentiment    25000 non-null object
polarity     25000 non-null int64
dtypes: int64(1), object(2)
memory usage: 586.0+ KB


In [5]:
test.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 25000 entries, 0 to 24999
Data columns (total 3 columns):
sentence     25000 non-null object
sentiment    25000 non-null object
polarity     25000 non-null int64
dtypes: int64(1), object(2)
memory usage: 586.0+ KB


In [6]:
test.describe()

Unnamed: 0,polarity
count,25000.0
mean,0.5
std,0.50001
min,0.0
25%,0.0
50%,0.5
75%,1.0
max,1.0


In [7]:
train = train.sample(5000)
test = test.sample(5000)

In [8]:
train.head(10)

Unnamed: 0,sentence,sentiment,polarity
23021,For Urban Cowboy John Travolta plays one of th...,7,1
20208,Michael Jackson would have claimed a spot for ...,4,0
4553,"I love Westerns. I could watch them all day. ""...",1,0
1509,"William Powell is Philo Vance in ""The Kennel M...",7,1
9446,I thought it was an extremely clever film. I w...,9,1
2297,"Band Camp was awful, The Naked Mile was a litt...",3,0
6707,I'm a Belgian and grew up in the sixties. Most...,9,1
10785,"Tea Leoni plays Nora Wilde, a serious photogra...",8,1
8098,A movie you start watching as a late night cab...,8,1
7567,"It is no wonder this movie won 4 prices, it is...",10,1


In [26]:
train.columns

Index(['sentence', 'sentiment', 'polarity'], dtype='object')

In [9]:
DATA_COLUMN = 'sentence'
LABEL_COLUMN = 'polarity'
# label_list is the list of labels, i.e. True, False or 0, 1 or 'dog', 'cat'
label_list = [0, 1]

In [10]:
train_InputExamples = train.apply(lambda x: bert.run_classifier.InputExample(guid=None, # Globally unique ID for bookkeeping, unused in this example
                                                                   text_a = x[DATA_COLUMN], 
                                                                   text_b = None, 
                                                                   label = x[LABEL_COLUMN]), axis = 1)

test_InputExamples = test.apply(lambda x: bert.run_classifier.InputExample(guid=None, 
                                                                   text_a = x[DATA_COLUMN], 
                                                                   text_b = None, 
                                                                   label = x[LABEL_COLUMN]), axis = 1)

In [12]:
type(train_InputExamples)

pandas.core.series.Series

In [17]:
# This is a path to an uncased (all lowercase) version of BERT
BERT_MODEL_HUB = "https://tfhub.dev/google/bert_uncased_L-12_H-768_A-12/1"

def create_tokenizer_from_hub_module():
    """Get the vocab file and casing info from the Hub module."""
    with tf.Graph().as_default():
        bert_module = hub.Module(BERT_MODEL_HUB)
        tokenization_info = bert_module(signature="tokenization_info",
                                        as_dict=True)
        with tf.Session() as sess:
            vocab_file, do_lower_case = sess.run([
                tokenization_info["vocab_file"],
                tokenization_info["do_lower_case"]
            ])

    return bert.tokenization.FullTokenizer(vocab_file=vocab_file,
                                           do_lower_case=do_lower_case),vocab_file,do_lower_case

In [18]:
tokenizer,vocab_file ,do_lower_case= create_tokenizer_from_hub_module()

INFO:tensorflow:Saver not created because there are no variables in the graph to restore


I0415 14:06:47.934486 15268 saver.py:1483] Saver not created because there are no variables in the graph to restore


In [19]:
tokenizer.tokenize("This here's an example of using the BERT tokenizer")

['this',
 'here',
 "'",
 's',
 'an',
 'example',
 'of',
 'using',
 'the',
 'bert',
 'token',
 '##izer']

In [21]:
# vocab_file
do_lower_case

True

In [23]:
tokenizer.vocab

OrderedDict([('[PAD]', 0),
             ('[unused0]', 1),
             ('[unused1]', 2),
             ('[unused2]', 3),
             ('[unused3]', 4),
             ('[unused4]', 5),
             ('[unused5]', 6),
             ('[unused6]', 7),
             ('[unused7]', 8),
             ('[unused8]', 9),
             ('[unused9]', 10),
             ('[unused10]', 11),
             ('[unused11]', 12),
             ('[unused12]', 13),
             ('[unused13]', 14),
             ('[unused14]', 15),
             ('[unused15]', 16),
             ('[unused16]', 17),
             ('[unused17]', 18),
             ('[unused18]', 19),
             ('[unused19]', 20),
             ('[unused20]', 21),
             ('[unused21]', 22),
             ('[unused22]', 23),
             ('[unused23]', 24),
             ('[unused24]', 25),
             ('[unused25]', 26),
             ('[unused26]', 27),
             ('[unused27]', 28),
             ('[unused28]', 29),
             ('[unused29]', 30),
  

In [24]:
MAX_SEQ_LENGTH = 128
# Convert our train and test features to InputFeatures that BERT understands.
train_features = bert.run_classifier.convert_examples_to_features(train_InputExamples, label_list, MAX_SEQ_LENGTH, tokenizer)
test_features = bert.run_classifier.convert_examples_to_features(test_InputExamples, label_list, MAX_SEQ_LENGTH, tokenizer)

INFO:tensorflow:Writing example 0 of 5000


I0415 18:07:23.992919 15268 run_classifier.py:774] Writing example 0 of 5000


INFO:tensorflow:*** Example ***


I0415 18:07:24.000881 15268 run_classifier.py:461] *** Example ***


INFO:tensorflow:guid: None


I0415 18:07:24.002881 15268 run_classifier.py:462] guid: None


INFO:tensorflow:tokens: [CLS] for urban cowboy john tr ##av ##olt ##a plays one of the stronger alpha males ever portrayed on the big screen . he ' s a decent enough young kid who leaves his parent ' s homestead and strikes out for the big city of dallas where his uncle barry corbin has promised to find him work in the pet ##ro ##chemical industry . in 1980 that was beginning to boom and texas was definitely a growing place in the usa . < br / > < br / > tr ##av ##olt ##a does a good job in making we the audience care about his character who when you come right down to it is a sex ##ist pig . he meets and marries debra [SEP]


I0415 18:07:24.003881 15268 run_classifier.py:464] tokens: [CLS] for urban cowboy john tr ##av ##olt ##a plays one of the stronger alpha males ever portrayed on the big screen . he ' s a decent enough young kid who leaves his parent ' s homestead and strikes out for the big city of dallas where his uncle barry corbin has promised to find him work in the pet ##ro ##chemical industry . in 1980 that was beginning to boom and texas was definitely a growing place in the usa . < br / > < br / > tr ##av ##olt ##a does a good job in making we the audience care about his character who when you come right down to it is a sex ##ist pig . he meets and marries debra [SEP]


INFO:tensorflow:input_ids: 101 2005 3923 11762 2198 19817 11431 27914 2050 3248 2028 1997 1996 6428 6541 3767 2412 6791 2006 1996 2502 3898 1012 2002 1005 1055 1037 11519 2438 2402 4845 2040 3727 2010 6687 1005 1055 14473 1998 9326 2041 2005 1996 2502 2103 1997 5759 2073 2010 4470 6287 24003 2038 5763 2000 2424 2032 2147 1999 1996 9004 3217 15869 3068 1012 1999 3150 2008 2001 2927 2000 8797 1998 3146 2001 5791 1037 3652 2173 1999 1996 3915 1012 1026 7987 1013 1028 1026 7987 1013 1028 19817 11431 27914 2050 2515 1037 2204 3105 1999 2437 2057 1996 4378 2729 2055 2010 2839 2040 2043 2017 2272 2157 2091 2000 2009 2003 1037 3348 2923 10369 1012 2002 6010 1998 19941 28762 102


I0415 18:07:24.004882 15268 run_classifier.py:465] input_ids: 101 2005 3923 11762 2198 19817 11431 27914 2050 3248 2028 1997 1996 6428 6541 3767 2412 6791 2006 1996 2502 3898 1012 2002 1005 1055 1037 11519 2438 2402 4845 2040 3727 2010 6687 1005 1055 14473 1998 9326 2041 2005 1996 2502 2103 1997 5759 2073 2010 4470 6287 24003 2038 5763 2000 2424 2032 2147 1999 1996 9004 3217 15869 3068 1012 1999 3150 2008 2001 2927 2000 8797 1998 3146 2001 5791 1037 3652 2173 1999 1996 3915 1012 1026 7987 1013 1028 1026 7987 1013 1028 19817 11431 27914 2050 2515 1037 2204 3105 1999 2437 2057 1996 4378 2729 2055 2010 2839 2040 2043 2017 2272 2157 2091 2000 2009 2003 1037 3348 2923 10369 1012 2002 6010 1998 19941 28762 102


INFO:tensorflow:input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


I0415 18:07:24.005889 15268 run_classifier.py:466] input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


INFO:tensorflow:segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


I0415 18:07:24.006881 15268 run_classifier.py:467] segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


INFO:tensorflow:label: 1 (id = 1)


I0415 18:07:24.008881 15268 run_classifier.py:468] label: 1 (id = 1)


INFO:tensorflow:*** Example ***


I0415 18:07:24.012885 15268 run_classifier.py:461] *** Example ***


INFO:tensorflow:guid: None


I0415 18:07:24.014879 15268 run_classifier.py:462] guid: None


INFO:tensorflow:tokens: [CLS] michael jackson would have claimed a spot for the top - billed character in the golden child , and because he loves kids . that didn ' t work ( and why should it ? ) , so instead we have eddie murphy out to save the world by rescuing " kid mid ##as " . i would strongly suggest all future script ##writer ##s to please thoroughly study the actor ' s ina ##ne dialogue in this qui ##rky fantasy - adventure - comedy that ' s a step closer to is ##hta ##r . whatever murphy says or does can be best liked , but don ' t get me wrong about his exquisite comical talent ; he doesn ' t belong in this [SEP]


I0415 18:07:24.015878 15268 run_classifier.py:464] tokens: [CLS] michael jackson would have claimed a spot for the top - billed character in the golden child , and because he loves kids . that didn ' t work ( and why should it ? ) , so instead we have eddie murphy out to save the world by rescuing " kid mid ##as " . i would strongly suggest all future script ##writer ##s to please thoroughly study the actor ' s ina ##ne dialogue in this qui ##rky fantasy - adventure - comedy that ' s a step closer to is ##hta ##r . whatever murphy says or does can be best liked , but don ' t get me wrong about his exquisite comical talent ; he doesn ' t belong in this [SEP]


INFO:tensorflow:input_ids: 101 2745 4027 2052 2031 3555 1037 3962 2005 1996 2327 1011 14843 2839 1999 1996 3585 2775 1010 1998 2138 2002 7459 4268 1012 2008 2134 1005 1056 2147 1006 1998 2339 2323 2009 1029 1007 1010 2061 2612 2057 2031 5752 7104 2041 2000 3828 1996 2088 2011 23659 1000 4845 3054 3022 1000 1012 1045 2052 6118 6592 2035 2925 5896 15994 2015 2000 3531 12246 2817 1996 3364 1005 1055 27118 2638 7982 1999 2023 21864 15952 5913 1011 6172 1011 4038 2008 1005 1055 1037 3357 3553 2000 2003 22893 2099 1012 3649 7104 2758 2030 2515 2064 2022 2190 4669 1010 2021 2123 1005 1056 2131 2033 3308 2055 2010 19401 29257 5848 1025 2002 2987 1005 1056 7141 1999 2023 102


I0415 18:07:24.016878 15268 run_classifier.py:465] input_ids: 101 2745 4027 2052 2031 3555 1037 3962 2005 1996 2327 1011 14843 2839 1999 1996 3585 2775 1010 1998 2138 2002 7459 4268 1012 2008 2134 1005 1056 2147 1006 1998 2339 2323 2009 1029 1007 1010 2061 2612 2057 2031 5752 7104 2041 2000 3828 1996 2088 2011 23659 1000 4845 3054 3022 1000 1012 1045 2052 6118 6592 2035 2925 5896 15994 2015 2000 3531 12246 2817 1996 3364 1005 1055 27118 2638 7982 1999 2023 21864 15952 5913 1011 6172 1011 4038 2008 1005 1055 1037 3357 3553 2000 2003 22893 2099 1012 3649 7104 2758 2030 2515 2064 2022 2190 4669 1010 2021 2123 1005 1056 2131 2033 3308 2055 2010 19401 29257 5848 1025 2002 2987 1005 1056 7141 1999 2023 102


INFO:tensorflow:input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


I0415 18:07:24.018895 15268 run_classifier.py:466] input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


INFO:tensorflow:segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


I0415 18:07:24.019885 15268 run_classifier.py:467] segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


INFO:tensorflow:label: 0 (id = 0)


I0415 18:07:24.020892 15268 run_classifier.py:468] label: 0 (id = 0)


INFO:tensorflow:*** Example ***


I0415 18:07:24.026875 15268 run_classifier.py:461] *** Example ***


INFO:tensorflow:guid: None


I0415 18:07:24.027875 15268 run_classifier.py:462] guid: None


INFO:tensorflow:tokens: [CLS] i love western ##s . i could watch them all day . " the good , the bad , and the ugly " is my all time favorite . i watched " silver ##ado " for probably the 8th time just the other day because it was being featured on cm ##t . however , this movie , shi ##loh falls is without a doubt the worst western i have ever watched . the acting was terrible all around . they explain nothing at the end of the mysterious compass looking thing . the only good part i can think of is the good - looking can ##tina girl . the very noticeable long pauses between the dial ##og seemed intentional just to make up time [SEP]


I0415 18:07:24.029875 15268 run_classifier.py:464] tokens: [CLS] i love western ##s . i could watch them all day . " the good , the bad , and the ugly " is my all time favorite . i watched " silver ##ado " for probably the 8th time just the other day because it was being featured on cm ##t . however , this movie , shi ##loh falls is without a doubt the worst western i have ever watched . the acting was terrible all around . they explain nothing at the end of the mysterious compass looking thing . the only good part i can think of is the good - looking can ##tina girl . the very noticeable long pauses between the dial ##og seemed intentional just to make up time [SEP]


INFO:tensorflow:input_ids: 101 1045 2293 2530 2015 1012 1045 2071 3422 2068 2035 2154 1012 1000 1996 2204 1010 1996 2919 1010 1998 1996 9200 1000 2003 2026 2035 2051 5440 1012 1045 3427 1000 3165 9365 1000 2005 2763 1996 5893 2051 2074 1996 2060 2154 2138 2009 2001 2108 2956 2006 4642 2102 1012 2174 1010 2023 3185 1010 11895 24729 4212 2003 2302 1037 4797 1996 5409 2530 1045 2031 2412 3427 1012 1996 3772 2001 6659 2035 2105 1012 2027 4863 2498 2012 1996 2203 1997 1996 8075 16681 2559 2518 1012 1996 2069 2204 2112 1045 2064 2228 1997 2003 1996 2204 1011 2559 2064 13770 2611 1012 1996 2200 17725 2146 19623 2090 1996 13764 8649 2790 21249 2074 2000 2191 2039 2051 102


I0415 18:07:24.030874 15268 run_classifier.py:465] input_ids: 101 1045 2293 2530 2015 1012 1045 2071 3422 2068 2035 2154 1012 1000 1996 2204 1010 1996 2919 1010 1998 1996 9200 1000 2003 2026 2035 2051 5440 1012 1045 3427 1000 3165 9365 1000 2005 2763 1996 5893 2051 2074 1996 2060 2154 2138 2009 2001 2108 2956 2006 4642 2102 1012 2174 1010 2023 3185 1010 11895 24729 4212 2003 2302 1037 4797 1996 5409 2530 1045 2031 2412 3427 1012 1996 3772 2001 6659 2035 2105 1012 2027 4863 2498 2012 1996 2203 1997 1996 8075 16681 2559 2518 1012 1996 2069 2204 2112 1045 2064 2228 1997 2003 1996 2204 1011 2559 2064 13770 2611 1012 1996 2200 17725 2146 19623 2090 1996 13764 8649 2790 21249 2074 2000 2191 2039 2051 102


INFO:tensorflow:input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


I0415 18:07:24.031885 15268 run_classifier.py:466] input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


INFO:tensorflow:segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


I0415 18:07:24.033876 15268 run_classifier.py:467] segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


INFO:tensorflow:label: 0 (id = 0)


I0415 18:07:24.034872 15268 run_classifier.py:468] label: 0 (id = 0)


INFO:tensorflow:*** Example ***


I0415 18:07:24.040876 15268 run_classifier.py:461] *** Example ***


INFO:tensorflow:guid: None


I0415 18:07:24.041870 15268 run_classifier.py:462] guid: None


INFO:tensorflow:tokens: [CLS] william powell is phil ##o vance in " the ken ##nel murder case , " a 1933 film also starring mary astor , paul ca ##vana ##gh , eugene palette , helen vin ##son and ralph morgan . a dog show in which phil ##o has entered his scottish terri ##er captain serves as the background for a locked room mystery with too many suspects . the mystery is very clever and the den ##oue ##ment both complicated and interesting . since the talk ##ies are still quite young , the camera work is a little static , but michael curt ##iz does a good job directing the action . < br / > < br / > the supporting cast is excellent ; the entire [SEP]


I0415 18:07:24.043869 15268 run_classifier.py:464] tokens: [CLS] william powell is phil ##o vance in " the ken ##nel murder case , " a 1933 film also starring mary astor , paul ca ##vana ##gh , eugene palette , helen vin ##son and ralph morgan . a dog show in which phil ##o has entered his scottish terri ##er captain serves as the background for a locked room mystery with too many suspects . the mystery is very clever and the den ##oue ##ment both complicated and interesting . since the talk ##ies are still quite young , the camera work is a little static , but michael curt ##iz does a good job directing the action . < br / > < br / > the supporting cast is excellent ; the entire [SEP]


INFO:tensorflow:input_ids: 101 2520 8997 2003 6316 2080 16672 1999 1000 1996 6358 11877 4028 2553 1010 1000 1037 4537 2143 2036 4626 2984 25159 1010 2703 6187 27313 5603 1010 8207 27396 1010 6330 19354 3385 1998 6798 5253 1012 1037 3899 2265 1999 2029 6316 2080 2038 3133 2010 4104 26568 2121 2952 4240 2004 1996 4281 2005 1037 5299 2282 6547 2007 2205 2116 13172 1012 1996 6547 2003 2200 12266 1998 1996 7939 27872 3672 2119 8552 1998 5875 1012 2144 1996 2831 3111 2024 2145 3243 2402 1010 1996 4950 2147 2003 1037 2210 10763 1010 2021 2745 20099 10993 2515 1037 2204 3105 9855 1996 2895 1012 1026 7987 1013 1028 1026 7987 1013 1028 1996 4637 3459 2003 6581 1025 1996 2972 102


I0415 18:07:24.044868 15268 run_classifier.py:465] input_ids: 101 2520 8997 2003 6316 2080 16672 1999 1000 1996 6358 11877 4028 2553 1010 1000 1037 4537 2143 2036 4626 2984 25159 1010 2703 6187 27313 5603 1010 8207 27396 1010 6330 19354 3385 1998 6798 5253 1012 1037 3899 2265 1999 2029 6316 2080 2038 3133 2010 4104 26568 2121 2952 4240 2004 1996 4281 2005 1037 5299 2282 6547 2007 2205 2116 13172 1012 1996 6547 2003 2200 12266 1998 1996 7939 27872 3672 2119 8552 1998 5875 1012 2144 1996 2831 3111 2024 2145 3243 2402 1010 1996 4950 2147 2003 1037 2210 10763 1010 2021 2745 20099 10993 2515 1037 2204 3105 9855 1996 2895 1012 1026 7987 1013 1028 1026 7987 1013 1028 1996 4637 3459 2003 6581 1025 1996 2972 102


INFO:tensorflow:input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


I0415 18:07:24.045870 15268 run_classifier.py:466] input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


INFO:tensorflow:segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


I0415 18:07:24.047874 15268 run_classifier.py:467] segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


INFO:tensorflow:label: 1 (id = 1)


I0415 18:07:24.048868 15268 run_classifier.py:468] label: 1 (id = 1)


INFO:tensorflow:*** Example ***


I0415 18:07:24.052868 15268 run_classifier.py:461] *** Example ***


INFO:tensorflow:guid: None


I0415 18:07:24.053867 15268 run_classifier.py:462] guid: None


INFO:tensorflow:tokens: [CLS] i thought it was an extremely clever film . i was very pleased with it and truly couldn ' t ' ask for more . i actually own the film because i didn ' t return it to someone . . . which i should do , but i really want to keep it due to how much i enjoyed it . also , the fact i don ' t own too many foreign films and this is a first . now , i personally love finnish stuff so , that definitely added to how much i enjoyed it . but overall , its worth watching . however , if you ' re not into the whole trying to understand finnish or read sub ##titles bit [SEP]


I0415 18:07:24.055865 15268 run_classifier.py:464] tokens: [CLS] i thought it was an extremely clever film . i was very pleased with it and truly couldn ' t ' ask for more . i actually own the film because i didn ' t return it to someone . . . which i should do , but i really want to keep it due to how much i enjoyed it . also , the fact i don ' t own too many foreign films and this is a first . now , i personally love finnish stuff so , that definitely added to how much i enjoyed it . but overall , its worth watching . however , if you ' re not into the whole trying to understand finnish or read sub ##titles bit [SEP]


INFO:tensorflow:input_ids: 101 1045 2245 2009 2001 2019 5186 12266 2143 1012 1045 2001 2200 7537 2007 2009 1998 5621 2481 1005 1056 1005 3198 2005 2062 1012 1045 2941 2219 1996 2143 2138 1045 2134 1005 1056 2709 2009 2000 2619 1012 1012 1012 2029 1045 2323 2079 1010 2021 1045 2428 2215 2000 2562 2009 2349 2000 2129 2172 1045 5632 2009 1012 2036 1010 1996 2755 1045 2123 1005 1056 2219 2205 2116 3097 3152 1998 2023 2003 1037 2034 1012 2085 1010 1045 7714 2293 6983 4933 2061 1010 2008 5791 2794 2000 2129 2172 1045 5632 2009 1012 2021 3452 1010 2049 4276 3666 1012 2174 1010 2065 2017 1005 2128 2025 2046 1996 2878 2667 2000 3305 6983 2030 3191 4942 27430 2978 102


I0415 18:07:24.057871 15268 run_classifier.py:465] input_ids: 101 1045 2245 2009 2001 2019 5186 12266 2143 1012 1045 2001 2200 7537 2007 2009 1998 5621 2481 1005 1056 1005 3198 2005 2062 1012 1045 2941 2219 1996 2143 2138 1045 2134 1005 1056 2709 2009 2000 2619 1012 1012 1012 2029 1045 2323 2079 1010 2021 1045 2428 2215 2000 2562 2009 2349 2000 2129 2172 1045 5632 2009 1012 2036 1010 1996 2755 1045 2123 1005 1056 2219 2205 2116 3097 3152 1998 2023 2003 1037 2034 1012 2085 1010 1045 7714 2293 6983 4933 2061 1010 2008 5791 2794 2000 2129 2172 1045 5632 2009 1012 2021 3452 1010 2049 4276 3666 1012 2174 1010 2065 2017 1005 2128 2025 2046 1996 2878 2667 2000 3305 6983 2030 3191 4942 27430 2978 102


INFO:tensorflow:input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


I0415 18:07:24.059866 15268 run_classifier.py:466] input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


INFO:tensorflow:segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


I0415 18:07:24.060871 15268 run_classifier.py:467] segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


INFO:tensorflow:label: 1 (id = 1)


I0415 18:07:24.062874 15268 run_classifier.py:468] label: 1 (id = 1)


INFO:tensorflow:Writing example 0 of 5000


I0415 18:07:44.954012 15268 run_classifier.py:774] Writing example 0 of 5000


INFO:tensorflow:*** Example ***


I0415 18:07:44.957036 15268 run_classifier.py:461] *** Example ***


INFO:tensorflow:guid: None


I0415 18:07:44.958005 15268 run_classifier.py:462] guid: None


INFO:tensorflow:tokens: [CLS] the daytime tv of films . seldom have i felt so little attachment to characters . seldom have i been made to cr ##inge by such dire dialogue . na ##use ##ous london thirty - something ##s min ##cing round lu ##rid bbc sets sp ##out ##ing pl ##ati ##tu ##din ##ous mu ##lch . avoid this film as if it were your grandmother ' s clung ##e . [SEP]


I0415 18:07:44.959007 15268 run_classifier.py:464] tokens: [CLS] the daytime tv of films . seldom have i felt so little attachment to characters . seldom have i been made to cr ##inge by such dire dialogue . na ##use ##ous london thirty - something ##s min ##cing round lu ##rid bbc sets sp ##out ##ing pl ##ati ##tu ##din ##ous mu ##lch . avoid this film as if it were your grandmother ' s clung ##e . [SEP]


INFO:tensorflow:input_ids: 101 1996 12217 2694 1997 3152 1012 15839 2031 1045 2371 2061 2210 14449 2000 3494 1012 15839 2031 1045 2042 2081 2000 13675 23496 2011 2107 18704 7982 1012 6583 8557 3560 2414 4228 1011 2242 2015 8117 6129 2461 11320 14615 4035 4520 11867 5833 2075 20228 10450 8525 8718 3560 14163 29358 1012 4468 2023 2143 2004 2065 2009 2020 2115 7133 1005 1055 14752 2063 1012 102 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


I0415 18:07:44.960014 15268 run_classifier.py:465] input_ids: 101 1996 12217 2694 1997 3152 1012 15839 2031 1045 2371 2061 2210 14449 2000 3494 1012 15839 2031 1045 2042 2081 2000 13675 23496 2011 2107 18704 7982 1012 6583 8557 3560 2414 4228 1011 2242 2015 8117 6129 2461 11320 14615 4035 4520 11867 5833 2075 20228 10450 8525 8718 3560 14163 29358 1012 4468 2023 2143 2004 2065 2009 2020 2115 7133 1005 1055 14752 2063 1012 102 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


INFO:tensorflow:input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


I0415 18:07:44.964004 15268 run_classifier.py:466] input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


INFO:tensorflow:segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


I0415 18:07:44.965005 15268 run_classifier.py:467] segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


INFO:tensorflow:label: 0 (id = 0)


I0415 18:07:44.966006 15268 run_classifier.py:468] label: 0 (id = 0)


INFO:tensorflow:*** Example ***


I0415 18:07:44.970003 15268 run_classifier.py:461] *** Example ***


INFO:tensorflow:guid: None


I0415 18:07:44.972005 15268 run_classifier.py:462] guid: None


INFO:tensorflow:tokens: [CLS] ed wood rides again . the fact that this movie was made should give any young < br / > < br / > aspiring film maker hope . any screenplay you might have thought of using to < br / > < br / > line a litter ##box or a bird ##ca ##ge should now not seem that bad . do not watch this movie unless you have a healthy st ##ash of ty ##len ##ol or ro ##laid ##s . watching this < br / > < br / > movie made me realize that bo ##a vs . python was not that bad after all . it probably would have been better to do this movie in clay ##mation as at least [SEP]


I0415 18:07:44.973002 15268 run_classifier.py:464] tokens: [CLS] ed wood rides again . the fact that this movie was made should give any young < br / > < br / > aspiring film maker hope . any screenplay you might have thought of using to < br / > < br / > line a litter ##box or a bird ##ca ##ge should now not seem that bad . do not watch this movie unless you have a healthy st ##ash of ty ##len ##ol or ro ##laid ##s . watching this < br / > < br / > movie made me realize that bo ##a vs . python was not that bad after all . it probably would have been better to do this movie in clay ##mation as at least [SEP]


INFO:tensorflow:input_ids: 101 3968 3536 12271 2153 1012 1996 2755 2008 2023 3185 2001 2081 2323 2507 2151 2402 1026 7987 1013 1028 1026 7987 1013 1028 22344 2143 9338 3246 1012 2151 9000 2017 2453 2031 2245 1997 2478 2000 1026 7987 1013 1028 1026 7987 1013 1028 2240 1037 19070 8758 2030 1037 4743 3540 3351 2323 2085 2025 4025 2008 2919 1012 2079 2025 3422 2023 3185 4983 2017 2031 1037 7965 2358 11823 1997 5939 7770 4747 2030 20996 24393 2015 1012 3666 2023 1026 7987 1013 1028 1026 7987 1013 1028 3185 2081 2033 5382 2008 8945 2050 5443 1012 18750 2001 2025 2008 2919 2044 2035 1012 2009 2763 2052 2031 2042 2488 2000 2079 2023 3185 1999 5726 28649 2004 2012 2560 102


I0415 18:07:44.975009 15268 run_classifier.py:465] input_ids: 101 3968 3536 12271 2153 1012 1996 2755 2008 2023 3185 2001 2081 2323 2507 2151 2402 1026 7987 1013 1028 1026 7987 1013 1028 22344 2143 9338 3246 1012 2151 9000 2017 2453 2031 2245 1997 2478 2000 1026 7987 1013 1028 1026 7987 1013 1028 2240 1037 19070 8758 2030 1037 4743 3540 3351 2323 2085 2025 4025 2008 2919 1012 2079 2025 3422 2023 3185 4983 2017 2031 1037 7965 2358 11823 1997 5939 7770 4747 2030 20996 24393 2015 1012 3666 2023 1026 7987 1013 1028 1026 7987 1013 1028 3185 2081 2033 5382 2008 8945 2050 5443 1012 18750 2001 2025 2008 2919 2044 2035 1012 2009 2763 2052 2031 2042 2488 2000 2079 2023 3185 1999 5726 28649 2004 2012 2560 102


INFO:tensorflow:input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


I0415 18:07:44.976003 15268 run_classifier.py:466] input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


INFO:tensorflow:segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


I0415 18:07:44.978002 15268 run_classifier.py:467] segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


INFO:tensorflow:label: 0 (id = 0)


I0415 18:07:44.982003 15268 run_classifier.py:468] label: 0 (id = 0)


INFO:tensorflow:*** Example ***


I0415 18:07:44.990002 15268 run_classifier.py:461] *** Example ***


INFO:tensorflow:guid: None


I0415 18:07:44.991002 15268 run_classifier.py:462] guid: None


INFO:tensorflow:tokens: [CLS] the last of the " airport " sequels . this has alain del ##on and george kennedy ( who was in all the airport movies ) as pilots ; david warner ( ! ! ! ) as the radio engineer ; susan blake ##ly as a news ##woman targeted for death ; robert wagner as a brilliant scientist ( stop laughing ! ) ; eddie albert as a president of the airlines ; char ##o in a dreadful " comical " bit ; john davidson as a news ##man ( love how his hair stays in place even after the plane turns upside down ! ) ; poor martha ray ##e is humiliated ; ci ##cel ##y tyson plays a mother who is flying a heart [SEP]


I0415 18:07:44.992002 15268 run_classifier.py:464] tokens: [CLS] the last of the " airport " sequels . this has alain del ##on and george kennedy ( who was in all the airport movies ) as pilots ; david warner ( ! ! ! ) as the radio engineer ; susan blake ##ly as a news ##woman targeted for death ; robert wagner as a brilliant scientist ( stop laughing ! ) ; eddie albert as a president of the airlines ; char ##o in a dreadful " comical " bit ; john davidson as a news ##man ( love how his hair stays in place even after the plane turns upside down ! ) ; poor martha ray ##e is humiliated ; ci ##cel ##y tyson plays a mother who is flying a heart [SEP]


INFO:tensorflow:input_ids: 101 1996 2197 1997 1996 1000 3199 1000 25815 1012 2023 2038 15654 3972 2239 1998 2577 5817 1006 2040 2001 1999 2035 1996 3199 5691 1007 2004 8221 1025 2585 6654 1006 999 999 999 1007 2004 1996 2557 3992 1025 6294 6511 2135 2004 1037 2739 10169 9416 2005 2331 1025 2728 10304 2004 1037 8235 7155 1006 2644 5870 999 1007 1025 5752 4789 2004 1037 2343 1997 1996 7608 1025 25869 2080 1999 1037 21794 1000 29257 1000 2978 1025 2198 12017 2004 1037 2739 2386 1006 2293 2129 2010 2606 12237 1999 2173 2130 2044 1996 4946 4332 14961 2091 999 1007 1025 3532 9246 4097 2063 2003 26608 1025 25022 29109 2100 19356 3248 1037 2388 2040 2003 3909 1037 2540 102


I0415 18:07:44.993002 15268 run_classifier.py:465] input_ids: 101 1996 2197 1997 1996 1000 3199 1000 25815 1012 2023 2038 15654 3972 2239 1998 2577 5817 1006 2040 2001 1999 2035 1996 3199 5691 1007 2004 8221 1025 2585 6654 1006 999 999 999 1007 2004 1996 2557 3992 1025 6294 6511 2135 2004 1037 2739 10169 9416 2005 2331 1025 2728 10304 2004 1037 8235 7155 1006 2644 5870 999 1007 1025 5752 4789 2004 1037 2343 1997 1996 7608 1025 25869 2080 1999 1037 21794 1000 29257 1000 2978 1025 2198 12017 2004 1037 2739 2386 1006 2293 2129 2010 2606 12237 1999 2173 2130 2044 1996 4946 4332 14961 2091 999 1007 1025 3532 9246 4097 2063 2003 26608 1025 25022 29109 2100 19356 3248 1037 2388 2040 2003 3909 1037 2540 102


INFO:tensorflow:input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


I0415 18:07:44.994000 15268 run_classifier.py:466] input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


INFO:tensorflow:segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


I0415 18:07:44.996001 15268 run_classifier.py:467] segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


INFO:tensorflow:label: 0 (id = 0)


I0415 18:07:44.997001 15268 run_classifier.py:468] label: 0 (id = 0)


INFO:tensorflow:*** Example ***


I0415 18:07:45.002005 15268 run_classifier.py:461] *** Example ***


INFO:tensorflow:guid: None


I0415 18:07:45.003999 15268 run_classifier.py:462] guid: None


INFO:tensorflow:tokens: [CLS] this is a low budget , well acted little gem . alice , a small town massachusetts teenager , fed up with her existence , takes to the road to escape her mother who flip ##s burger ##s and her own job as a check out in a super market . she sets out for florida and to stay with her wealth ##ier high school friend who is a freshman at miami . after her car suspiciously breaks down on the thru ##way and she loses all her money , she ends up with a retired couple in an rv who also happen to be traveling to florida . . the couple , brilliant ##ly played by judith ivy and bill raymond are overly ho ##sp [SEP]


I0415 18:07:45.004998 15268 run_classifier.py:464] tokens: [CLS] this is a low budget , well acted little gem . alice , a small town massachusetts teenager , fed up with her existence , takes to the road to escape her mother who flip ##s burger ##s and her own job as a check out in a super market . she sets out for florida and to stay with her wealth ##ier high school friend who is a freshman at miami . after her car suspiciously breaks down on the thru ##way and she loses all her money , she ends up with a retired couple in an rv who also happen to be traveling to florida . . the couple , brilliant ##ly played by judith ivy and bill raymond are overly ho ##sp [SEP]


INFO:tensorflow:input_ids: 101 2023 2003 1037 2659 5166 1010 2092 6051 2210 17070 1012 5650 1010 1037 2235 2237 4404 10563 1010 7349 2039 2007 2014 4598 1010 3138 2000 1996 2346 2000 4019 2014 2388 2040 11238 2015 15890 2015 1998 2014 2219 3105 2004 1037 4638 2041 1999 1037 3565 3006 1012 2016 4520 2041 2005 3516 1998 2000 2994 2007 2014 7177 3771 2152 2082 2767 2040 2003 1037 10452 2012 5631 1012 2044 2014 2482 21501 7807 2091 2006 1996 27046 4576 1998 2016 12386 2035 2014 2769 1010 2016 4515 2039 2007 1037 3394 3232 1999 2019 27634 2040 2036 4148 2000 2022 7118 2000 3516 1012 1012 1996 3232 1010 8235 2135 2209 2011 12924 7768 1998 3021 7638 2024 15241 7570 13102 102


I0415 18:07:45.005998 15268 run_classifier.py:465] input_ids: 101 2023 2003 1037 2659 5166 1010 2092 6051 2210 17070 1012 5650 1010 1037 2235 2237 4404 10563 1010 7349 2039 2007 2014 4598 1010 3138 2000 1996 2346 2000 4019 2014 2388 2040 11238 2015 15890 2015 1998 2014 2219 3105 2004 1037 4638 2041 1999 1037 3565 3006 1012 2016 4520 2041 2005 3516 1998 2000 2994 2007 2014 7177 3771 2152 2082 2767 2040 2003 1037 10452 2012 5631 1012 2044 2014 2482 21501 7807 2091 2006 1996 27046 4576 1998 2016 12386 2035 2014 2769 1010 2016 4515 2039 2007 1037 3394 3232 1999 2019 27634 2040 2036 4148 2000 2022 7118 2000 3516 1012 1012 1996 3232 1010 8235 2135 2209 2011 12924 7768 1998 3021 7638 2024 15241 7570 13102 102


INFO:tensorflow:input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


I0415 18:07:45.007998 15268 run_classifier.py:466] input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


INFO:tensorflow:segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


I0415 18:07:45.008996 15268 run_classifier.py:467] segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


INFO:tensorflow:label: 1 (id = 1)


I0415 18:07:45.009997 15268 run_classifier.py:468] label: 1 (id = 1)


INFO:tensorflow:*** Example ***


I0415 18:07:45.015994 15268 run_classifier.py:461] *** Example ***


INFO:tensorflow:guid: None


I0415 18:07:45.017995 15268 run_classifier.py:462] guid: None


INFO:tensorflow:tokens: [CLS] normally , i don ' t like chuck norris films . i appreciate his work as a martial artist , and his fight scenes are usually fairly well - choreographed . chuck is und ##enia ##bly one of the martial arts great ##s . so , in my local used bookstore , i found a film i hadn ' t seen before and took it home . < br / > < br / > while the acting in this movie was worse than most chu ##ch norris films , i was hoping to see at least one fight scene . i quickly began to realize that this wasn ' t a typical chu ##ch norris film ; rather it was a christian film , destined [SEP]


I0415 18:07:45.019993 15268 run_classifier.py:464] tokens: [CLS] normally , i don ' t like chuck norris films . i appreciate his work as a martial artist , and his fight scenes are usually fairly well - choreographed . chuck is und ##enia ##bly one of the martial arts great ##s . so , in my local used bookstore , i found a film i hadn ' t seen before and took it home . < br / > < br / > while the acting in this movie was worse than most chu ##ch norris films , i was hoping to see at least one fight scene . i quickly began to realize that this wasn ' t a typical chu ##ch norris film ; rather it was a christian film , destined [SEP]


INFO:tensorflow:input_ids: 101 5373 1010 1045 2123 1005 1056 2066 8057 15466 3152 1012 1045 9120 2010 2147 2004 1037 7761 3063 1010 1998 2010 2954 5019 2024 2788 7199 2092 1011 23317 1012 8057 2003 6151 19825 6321 2028 1997 1996 7761 2840 2307 2015 1012 2061 1010 1999 2026 2334 2109 21785 1010 1045 2179 1037 2143 1045 2910 1005 1056 2464 2077 1998 2165 2009 2188 1012 1026 7987 1013 1028 1026 7987 1013 1028 2096 1996 3772 1999 2023 3185 2001 4788 2084 2087 14684 2818 15466 3152 1010 1045 2001 5327 2000 2156 2012 2560 2028 2954 3496 1012 1045 2855 2211 2000 5382 2008 2023 2347 1005 1056 1037 5171 14684 2818 15466 2143 1025 2738 2009 2001 1037 3017 2143 1010 16036 102


I0415 18:07:45.020993 15268 run_classifier.py:465] input_ids: 101 5373 1010 1045 2123 1005 1056 2066 8057 15466 3152 1012 1045 9120 2010 2147 2004 1037 7761 3063 1010 1998 2010 2954 5019 2024 2788 7199 2092 1011 23317 1012 8057 2003 6151 19825 6321 2028 1997 1996 7761 2840 2307 2015 1012 2061 1010 1999 2026 2334 2109 21785 1010 1045 2179 1037 2143 1045 2910 1005 1056 2464 2077 1998 2165 2009 2188 1012 1026 7987 1013 1028 1026 7987 1013 1028 2096 1996 3772 1999 2023 3185 2001 4788 2084 2087 14684 2818 15466 3152 1010 1045 2001 5327 2000 2156 2012 2560 2028 2954 3496 1012 1045 2855 2211 2000 5382 2008 2023 2347 1005 1056 1037 5171 14684 2818 15466 2143 1025 2738 2009 2001 1037 3017 2143 1010 16036 102


INFO:tensorflow:input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


I0415 18:07:45.022994 15268 run_classifier.py:466] input_mask: 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1 1


INFO:tensorflow:segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


I0415 18:07:45.024992 15268 run_classifier.py:467] segment_ids: 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0


INFO:tensorflow:label: 0 (id = 0)


I0415 18:07:45.025992 15268 run_classifier.py:468] label: 0 (id = 0)


In [28]:
train_features

[<bert.run_classifier.InputFeatures at 0x250774979e8>,
 <bert.run_classifier.InputFeatures at 0x25077497978>,
 <bert.run_classifier.InputFeatures at 0x25077497710>,
 <bert.run_classifier.InputFeatures at 0x2507749ab38>,
 <bert.run_classifier.InputFeatures at 0x2506f3f1940>,
 <bert.run_classifier.InputFeatures at 0x2506f76cb38>,
 <bert.run_classifier.InputFeatures at 0x25077497c18>,
 <bert.run_classifier.InputFeatures at 0x2507749af60>,
 <bert.run_classifier.InputFeatures at 0x2506f76cef0>,
 <bert.run_classifier.InputFeatures at 0x2506f76c518>,
 <bert.run_classifier.InputFeatures at 0x2507749cef0>,
 <bert.run_classifier.InputFeatures at 0x2506f3d9198>,
 <bert.run_classifier.InputFeatures at 0x250741362e8>,
 <bert.run_classifier.InputFeatures at 0x2507749a748>,
 <bert.run_classifier.InputFeatures at 0x2507bcf0e48>,
 <bert.run_classifier.InputFeatures at 0x250789f1ba8>,
 <bert.run_classifier.InputFeatures at 0x2507749d7f0>,
 <bert.run_classifier.InputFeatures at 0x2507bcf06d8>,
 <bert.run

In [30]:
def create_model(is_predicting, input_ids, input_mask, segment_ids, labels,
                 num_labels):
    """Creates a classification model."""

    bert_module = hub.Module(BERT_MODEL_HUB, trainable=True)
    bert_inputs = dict(input_ids=input_ids,
                       input_mask=input_mask,
                       segment_ids=segment_ids)
    bert_outputs = bert_module(inputs=bert_inputs,
                               signature="tokens",
                               as_dict=True)

    # Use "pooled_output" for classification tasks on an entire sentence.
    # Use "sequence_outputs" for token-level output.
    output_layer = bert_outputs["pooled_output"]

    hidden_size = output_layer.shape[-1].value

    # Create our own layer to tune for politeness data.
    output_weights = tf.get_variable(
        "output_weights", [num_labels, hidden_size],
        initializer=tf.truncated_normal_initializer(stddev=0.02))

    output_bias = tf.get_variable("output_bias", [num_labels],
                                  initializer=tf.zeros_initializer())

    with tf.variable_scope("loss"):

        # Dropout helps prevent overfitting
        output_layer = tf.nn.dropout(output_layer, keep_prob=0.9)

        logits = tf.matmul(output_layer, output_weights, transpose_b=True)
        logits = tf.nn.bias_add(logits, output_bias)
        log_probs = tf.nn.log_softmax(logits, axis=-1)

        # Convert labels into one-hot encoding
        one_hot_labels = tf.one_hot(labels, depth=num_labels, dtype=tf.float32)

        predicted_labels = tf.squeeze(
            tf.argmax(log_probs, axis=-1, output_type=tf.int32))
        # If we're predicting, we want predicted labels and the probabiltiies.
        if is_predicting:
            return (predicted_labels, log_probs)

        # If we're train/eval, compute loss between predicted and actual label
        per_example_loss = -tf.reduce_sum(one_hot_labels * log_probs, axis=-1)
        loss = tf.reduce_mean(per_example_loss)
        return (loss, predicted_labels, log_probs)

In [29]:
t=create_model(True,train_features[0].input_ids,train_features[0].input_mask,train_features[0].segment_ids,None,None)

TypeError: Can't convert 'input_ids': Shape TensorShape([Dimension(128)]) is incompatible with TensorShape([Dimension(None), Dimension(None)])