In [1]:
import pandas as pd 
import ast
import re
import numpy as np
import nltk
import json
from datetime import datetime
from datetime import timedelta
from textblob import TextBlob
from nltk import word_tokenize
from sklearn.model_selection import train_test_split
from nltk.tokenize import word_tokenize, TreebankWordTokenizer
from nltk.corpus import stopwords
from nltk.stem import WordNetLemmatizer, PorterStemmer
from nltk.util import ngrams
from sklearn.preprocessing import OneHotEncoder, MinMaxScaler
from sklearn.feature_extraction.text import CountVectorizer, TfidfVectorizer
import spacy
import pyLDAvis.gensim_models
# import en_core_web_md
from gensim.corpora.dictionary import Dictionary
from gensim.models import LdaMulticore
from gensim.models import CoherenceModel
from sklearn.metrics.pairwise import cosine_similarity
import seaborn as sns

nltk.download('stopwords')
nltk.download('punkt')
nltk.download('wordnet')
nltk.download('omw-1.4')

  from scipy.linalg.special_matrices import triu
  if LooseVersion(mpl.__version__) >= "3.0":
  other = LooseVersion(other)
[nltk_data] Downloading package stopwords to
[nltk_data]     /Users/ivankoh/nltk_data...
[nltk_data]   Package stopwords is already up-to-date!
[nltk_data] Downloading package punkt to /Users/ivankoh/nltk_data...
[nltk_data]   Package punkt is already up-to-date!
[nltk_data] Downloading package wordnet to /Users/ivankoh/nltk_data...
[nltk_data]   Package wordnet is already up-to-date!
[nltk_data] Downloading package omw-1.4 to /Users/ivankoh/nltk_data...
[nltk_data]   Package omw-1.4 is already up-to-date!


True

In [2]:
df = pd.read_csv("/Users/ivankoh/Library/CloudStorage/OneDrive-NationalUniversityofSingapore/1D/NUS Y3S1/BT4222/Data/train/kickstarter_train.csv")
# df = pd.read_csv("kickstarter_train.csv")
# df = pd.read_csv("/Users/bandy/Downloads/data/kickstarter_train.csv")


In [3]:
# extract main category and subcategory from category variable
# df['subcategory'] = df['category'].apply(lambda x: json.loads(x)['slug'].split("/")[1] if len(json.loads(x)['slug'].split("/")) > 1 else None)
#df['category'] = df['category'].apply(lambda x: json.loads(x)['slug'].split("/")[0])
# df['location'] = df['location'].apply(lambda x: json.loads(x)['country'])

## NLP features

In [4]:
# Text cleaning for: rewards, description, description story, description risks

def clean_text(df):
    def process_rewards(corpus):
        corpus_processed = []
        for row in corpus:
            row_processed = ""
            row = row.replace("\\\\n", " ")
            row = row.replace("\\\n", " ")
            row = ast.literal_eval(row)

            for dict in row:
                row_processed += dict['rewards'].lower() + ' '

            
            row_processed = row_processed.replace("//",'')
            row_processed = re.sub(r'[^\w\s]', '', row_processed) # remove punctuation
            row_processed = " ".join(row_processed.split()) # Remove excess white space
            corpus_processed.append(row_processed)
        return corpus_processed
    
    def process_description_story(corpus):
        corpus_processed = []
        for row in corpus:
            row = str(row)
            row_processed = row.replace("\r", " " )
            row_processed = row_processed.replace("\n", " " )
            row_processed = re.sub(r'[^\w\s]', '', row_processed) # remove punctuation
            corpus_processed.append(row_processed if not pd.isnull(row_processed) else "") # handle NA

        return corpus_processed

    df["rewards_processed"] = process_rewards(df["rewards"])
    df["description_processed"] = process_description_story(df["description"])
    df["description_story_processed"] = process_description_story(df["description_story"])
    df["description_risks_processed"] = process_description_story(df["description_risks"])

    return df


In [5]:
class LemmatizeTokenizer(object):
    def __init__(self):
        self.lemmatizer = WordNetLemmatizer()
    def __call__(self, text):
        return [self.lemmatizer.lemmatize(word) for word in word_tokenize(text)]

In [6]:
# need to return the vectorizer to use on the test data to transform it 
def generate_nlp_features(df):
    
    tfidf_feature_names = {}
    # Rewards

    vect_rewards = TfidfVectorizer( 
        tokenizer=LemmatizeTokenizer(),
        lowercase=True,
        analyzer='word', 
        ngram_range=(1,3), # unigram, bigram and trigram 
        max_features=100, # vocabulary that only consider the top max_features ordered by term frequency across the corpus
        min_df=10, # minimum word frequency required to be in model
        stop_words=stopwords.words('english') # remove stopwords
        )
    

    rewards_processed = pd.Series(df["rewards_processed"])
    tfidf_fit_rewards = vect_rewards.fit(rewards_processed)
    rewards_tfidf_array = tfidf_fit_rewards.transform(rewards_processed).toarray()
    rewards_tfidf_df = pd.DataFrame(rewards_tfidf_array)
    rewards_tfidf_df.columns = list(map(lambda x : "rewards_" + str(x), rewards_tfidf_df.columns))
    df = pd.merge(df, rewards_tfidf_df , left_index=True, right_index=True)
    tfidf_feature_names["rewards"] = list(zip(range(100),vect_rewards.get_feature_names()))
    

    # Description

    vect_description = TfidfVectorizer( 
        tokenizer=LemmatizeTokenizer(),
        lowercase=True,
        analyzer='word', 
        ngram_range=(1,3), # unigram, bigram and trigram 
        max_features=100, # vocabulary that only consider the top max_features ordered by term frequency across the corpus
        min_df=10, # minimum word frequency required to be in model
        stop_words=stopwords.words('english') # remove stopwords
        )

    description = pd.Series(df["description_processed"])
    tfidf_fit_description = vect_description.fit(description)
    description_tfidf_array = tfidf_fit_description.transform(description).toarray()
    description_tfidf_df = pd.DataFrame(description_tfidf_array)
    description_tfidf_df.columns = list(map(lambda x : "description_" + str(x), description_tfidf_df.columns))
    df = pd.merge(df, description_tfidf_df , left_index=True, right_index=True)
    tfidf_feature_names["description"] = list(zip(range(100),vect_description.get_feature_names()))

    # Description Story

    vect_description_story = TfidfVectorizer( 
        tokenizer=LemmatizeTokenizer(),
        lowercase=True,
        analyzer='word', 
        ngram_range=(1,3), # unigram, bigram and trigram 
        max_features=100, # vocabulary that only consider the top max_features ordered by term frequency across the corpus
        min_df=10, # minimum word frequency required to be in model
        stop_words=stopwords.words('english') # remove stopwords
        )
    
    description_story_processed = pd.Series(df["description_story_processed"])
    tfidf_fit_description_story_processed = vect_description_story.fit(description_story_processed)
    description_story_processed_tfidf_array = tfidf_fit_description_story_processed.transform(description_story_processed).toarray()
    description_story_tfidf_df = pd.DataFrame(description_story_processed_tfidf_array)
    description_story_tfidf_df.columns = list(map(lambda x : "description_story_" + str(x), description_story_tfidf_df.columns))
    df = pd.merge(df, description_story_tfidf_df , left_index=True, right_index=True)
    tfidf_feature_names["description_story"] = list(zip(range(100),vect_description_story.get_feature_names()))



    # Description Risks

    vect_description_risks = TfidfVectorizer( 
        tokenizer=LemmatizeTokenizer(),
        lowercase=True,
        analyzer='word', 
        ngram_range=(1,3), # unigram, bigram and trigram 
        max_features=100, # vocabulary that only consider the top max_features ordered by term frequency across the corpus
        min_df=10, # minimum word frequency required to be in model
        stop_words=stopwords.words('english') # remove stopwords
        )

    description_risks_processed = pd.Series(df["description_risks_processed"])
    tfidf_fit_description_risks_processed = vect_description_risks.fit(description_risks_processed)
    description_risks_processed_tfidf_array = tfidf_fit_description_risks_processed.transform(description_risks_processed).toarray()
    description_risks_tfidf_df = pd.DataFrame(description_risks_processed_tfidf_array)
    description_risks_tfidf_df.columns = list(map(lambda x : "description_risks_" + str(x), description_risks_tfidf_df.columns))
    df = pd.merge(df, description_risks_tfidf_df , left_index=True, right_index=True)
    tfidf_feature_names["description_risks"] = list(zip(range(100),vect_description_risks.get_feature_names()))

    return (df, tfidf_fit_rewards, tfidf_fit_description, tfidf_fit_description_story_processed, tfidf_fit_description_risks_processed, tfidf_feature_names)


def nlp_transform_test(df, tfidf_fit_rewards, tfidf_fit_description, tfidf_fit_description_story_processed, tfidf_fit_description_risks_processed):
    rewards_tfidf_array = tfidf_fit_rewards.transform(df['rewards_processed']).toarray()
    rewards_tfidf_df = pd.DataFrame(rewards_tfidf_array)
    rewards_tfidf_df.columns = list(map(lambda x : "rewards_" + str(x), rewards_tfidf_df.columns))
    df = pd.merge(df, rewards_tfidf_df , left_index=True, right_index=True)
    
    description_tfidf_array = tfidf_fit_description.transform(df['description_processed']).toarray()
    description_tfidf_df = pd.DataFrame(description_tfidf_array)
    description_tfidf_df.columns = list(map(lambda x : "description_" + str(x), description_tfidf_df.columns))
    df = pd.merge(df, description_tfidf_df , left_index=True, right_index=True)
    
    description_story_processed_tfidf_array = tfidf_fit_description_story_processed.transform(df['description_story_processed']).toarray()
    description_story_tfidf_df = pd.DataFrame(description_story_processed_tfidf_array)
    description_story_tfidf_df.columns = list(map(lambda x : "description_story_" + str(x), description_story_tfidf_df.columns))
    df = pd.merge(df, description_story_tfidf_df , left_index=True, right_index=True)
    
    description_risks_processed_tfidf_array = tfidf_fit_description_risks_processed.transform(df['description_risks_processed']).toarray()
    description_risks_tfidf_df = pd.DataFrame(description_risks_processed_tfidf_array)
    description_risks_tfidf_df.columns = list(map(lambda x : "description_risks_" + str(x), description_risks_tfidf_df.columns))
    df = pd.merge(df, description_risks_tfidf_df , left_index=True, right_index=True)
    
    return df


## Rewards Features

In [7]:
# Remove rewards that got cut off while scraping and closes the dictionary
def create_rewards_tiers(df):
    # df["rewards"] = df["rewards"].apply(lambda x : clean_rewards(x))
    df["reward_tiers"] = df["rewards"].apply(lambda x : len(ast.literal_eval(x)))
    df = move_reward_tiers(df)
    return df

def create_min_max_reward(df):
    df["min_reward"] = 0
    df["max_reward"] = 0

    for i in range(len(df)):
        # if i % 100 == 0:
        #     print(i)
        all_reward_amount = []
        reward = df.iloc[i, 5]
        dict_list = ast.literal_eval(reward)
        for dictionary in dict_list:
            values_string = str(dictionary.values())
            reward_title_SGD = re.search(r"(S)?\$\s?\d{1,3}(,\d{1,3})?", values_string) #S$
            if reward_title_SGD:
                reward_amount = re.search(r"\d{1,3}(,\d{1,3})?", reward_title_SGD.group())
            else:
                 print("Error: No reward in SGD found!")   

            if reward_amount is not None:
                integer_amount = re.sub("[^\d\.]", "", reward_amount.group()) # remove comma in large amounts of money
                all_reward_amount.append(int(integer_amount))
            else:
                pledged_without_reward = re.search(r"Pledge without a reward", values_string) # check if have "Pledge without a reward"
                if pledged_without_reward:
                    all_reward_amount.append(0)
        if len(all_reward_amount) > 0:
            df.loc[i, "min_reward"] = min(all_reward_amount)
            df.loc[i, "max_reward"] = max(all_reward_amount)
    print("create min max reward done, now moving columns")
    df = move_min_max_reward(df)
    return df

# Rearange reward_tiers column to the right of rewards
def move_reward_tiers(df):
    cols = df.columns.tolist()
    cols = cols[:6] + [cols[-1]] + cols[6:-1]
    df = df[cols]
    return df

# Rearange min and max reward columns to the right of reward_tiers
def move_min_max_reward(df):
    cols = df.columns.tolist()
    cols = cols[:7] + cols[-2:] + cols[7:-2]
    df = df[cols]
    return df

# Remove backer count in rewards to prevent data leakage
def remove_backers(df):
    new_df = df.copy()
    for i in range(len(df)):
        reward = df.iloc[i, 5]
        dict_list = ast.literal_eval(reward)
        new_list = []

        for dictionary in dict_list:
            values_string = str(dictionary.values())
            match_result = re.search(r"\d+ backer(s)?", values_string) #\nxxx backer
            start_index = match_result.span()[0]
            new_reward = values_string[14:start_index] #Remove "dict_values" and backer-count related words
            new_list.append({'rewards': new_reward})

        new_df.iloc[i,5] = str(new_list)
    return new_df

  integer_amount = re.sub("[^\d\.]", "", reward_amount.group()) # remove comma in large amounts of money


## Sentiment Features

In [8]:
'''
Polarity is float which lies in the range of [-1,1] where 1 means positive statement and -1 means a negative statement. Subjective sentences generally refer to personal opinion, emotion or judgment whereas objective refers to factual information. Subjectivity is also a float which lies in the range of [0,1].
'''
def generate_sentiment_features(df):
    df = df.dropna(subset=['description_story_processed', 'description_risks_processed', 'description_processed', 'rewards_processed']) # NOTE: put at top with other dropnas from other features?
    df["description_story_polarity"] = df["description_story_processed"].apply(lambda x: 
                   TextBlob(x).sentiment.polarity)
    df["description_story_subjectivity"] = df["description_story_processed"].apply(lambda x: 
                   TextBlob(x).sentiment.subjectivity)
    df["description_polarity"] = df["description_processed"].apply(lambda x: 
                   TextBlob(x).sentiment.polarity)
    df["description_subjectivity"] = df["description_processed"].apply(lambda x: 
                   TextBlob(x).sentiment.subjectivity)
    df["description_risks_polarity"] = df["description_risks_processed"].apply(lambda x: 
                   TextBlob(x).sentiment.polarity)
    df["description_risks_subjectivity"] = df["description_risks_processed"].apply(lambda x: 
                   TextBlob(x).sentiment.subjectivity)
    df["rewards_polarity"] = df["rewards_processed"].apply(lambda x: 
                   TextBlob(x).sentiment.polarity)
    df["rewards_subjectivity"] = df["rewards_processed"].apply(lambda x: 
                   TextBlob(x).sentiment.subjectivity)          
    return df

In [9]:
def generate_word_count_features(df): # omitted description due to word limit, word count likely similar for all projects
    df['description_story_word_count'] = df["description_story_processed"].apply(lambda x: len(str(x).split(" ")))
    df['description_risks_word_count'] = df["description_risks_processed"].apply(lambda x: len(str(x).split(" ")))
    df['rewards_word_count'] = df["rewards_processed"].apply(lambda x: len(str(x).split(" ")))
    return df

## One-hot Encoding of Categorical Variables

when to drop one of the OHE columns: 
https://stats.stackexchange.com/questions/231285/dropping-one-of-the-columns-when-using-one-hot-encoding

In [10]:
def ohe_transform(enc, col, df):
    transformed = enc.transform(df[col].to_numpy().reshape(-1, 1))
    #Create a Pandas DataFrame of the hot encoded column
    ohe_df = pd.DataFrame(transformed, columns=enc.get_feature_names_out())
    #concat with original data
    data = pd.concat([df, ohe_df], axis=1)#.drop([col], axis=1)
    return data

def ohe_fit(col, df):
    enc = OneHotEncoder(handle_unknown='ignore', sparse=False)
    enc.fit(df[col].unique().reshape(-1, 1))
    return (ohe_transform(enc, col, df), enc)

hold out on topic modelling first because it is unsupervised algorithm

<h2> Generate Duration Feature </h2>

In [11]:
def generate_duration_features(df):
    df['deadline'] = df['deadline'].apply(lambda x: datetime.strptime(x, '%Y-%m-%d %H:%M:%S'))
    df['launched_at'] = df['launched_at'].apply(lambda x: datetime.strptime(x, '%Y-%m-%d %H:%M:%S'))
    df['created_at'] = df['created_at'].apply(lambda x: datetime.strptime(x, '%Y-%m-%d %H:%M:%S'))
    df['funding_duration_in_days'] = (df['deadline'] - df['launched_at'].dt.tz_localize(None))
    df['funding_duration_in_days'] = df['funding_duration_in_days'].apply(lambda x: x / timedelta(days=1))
    df['preparation_duration_in_days'] = (df['launched_at'] - df['created_at'].dt.tz_localize(None))
    df['preparation_duration_in_days'] = df['preparation_duration_in_days'].apply(lambda x: x / timedelta(days=1))
    
    return df

## Text Competitor Feature

In [12]:
'''
text competitors: inverse originality of text corpus. 

If score is higher means how the project owner 
words the project is very similar to all the other projects out there, meaning more competitive
because the wordings of the project is very 'unoriginal'
'''

def generate_text_competitor(df):
    # combine all text into 1 corpus 
    df['corpus'] = df['description_processed'] + df['description_story_processed'] + df['description_risks_processed']
    # generate a sparse matrix of tfidf 
    vect_corpus = TfidfVectorizer( 
            tokenizer=LemmatizeTokenizer(),
            lowercase=True,
            analyzer='word', 
            stop_words=stopwords.words('english') # remove stopwords
            )
    tfidf_sparse = vect_corpus.fit_transform(df['corpus'])
    # calculate cosine similarity based on the tfidf 
    cos_sim_dense = cosine_similarity(tfidf_sparse)
    # remove diagonal - A project is exactly the same as itself 
    cos_sim_dense_i_removed = cos_sim_dense[~np.eye(cos_sim_dense.shape[0],dtype=bool)].reshape(cos_sim_dense.shape[0],-1)
    # taking median as the similarity threshold - if greater than equal to median, means similar to that specific project 
    threshold = np.median(cos_sim_dense_i_removed.flatten())
    # if cosine similarity is above threshold return 1, then sum to get similar counts 
    df['text_similarity_score'] = np.apply_along_axis(np.sum, 1, cos_sim_dense_i_removed >= threshold)

    # sns.histplot(result['text_similarity_score'])

    return (df, vect_corpus, threshold)

def generate_text_competitor_test(vectorizer, df, threshold):
    # combine all text into 1 corpus 
    df['corpus'] = df['description_processed'] + df['description_story_processed'] + df['description_risks_processed']
    tfidf_sparse = vectorizer.transform(df['corpus'])
    # calculate cosine similarity based on the tfidf 
    cos_sim_dense = cosine_similarity(tfidf_sparse)
    # remove diagonal - A project is exactly the same as itself 
    cos_sim_dense_i_removed = cos_sim_dense[~np.eye(cos_sim_dense.shape[0],dtype=bool)].reshape(cos_sim_dense.shape[0],-1)
    # taking median as the similarity threshold - if greater than equal to median, means similar to that specific project 
    # threshold from training
    # if cosine similarity is above threshold return 1, then sum to get similar counts 
    df['text_similarity_score'] = np.apply_along_axis(np.sum, 1, cos_sim_dense_i_removed >= threshold)

    # sns.histplot(result['text_similarity_score'])

    return df

## Category and goal competitor feature

In [13]:
'''
Category and goal competitor: projects in the same category, that launched in the same month and in the same goal bin
'''
def generate_cat_goal_competitor(df):
    #df['launched_at'] = df['launched_at'].apply(lambda x: datetime.strptime(x, '%Y-%m-%d %H:%M:%S'))
    df['launched_month']= df['launched_at'].dt.month
    df['launched_year']= df['launched_at'].dt.year
    df['cat_goal_bin'] = df.groupby(['category'])['goal'].transform(
                        lambda x: pd.qcut(x, [0, .33, .67, 1]))
    
    competitors = df.groupby(['category','launched_year','launched_month','cat_goal_bin']).count()
    competitors['competitiors_count'] = competitors['name']
    competitors = competitors[['competitiors_count']]
    competitors.reset_index(inplace=True)
    df = pd.merge(df, competitors, on = ['category', 'launched_year', 'launched_month','cat_goal_bin'], how = 'left')

    return df

## Similar success rate feature

In [14]:
'''
Success rate for similar projects belonging to a particular category, with similar goal and launched in the same year.
'''
def generate_similiar_success_rate(df):
    df_success = df[df['state'] == 1]
    df_success = df_success.groupby(['category','launched_year','cat_goal_bin']).count()
    df_success['success_count'] = df_success['name']
    df_success = df_success[['success_count']]
    df_success.reset_index(inplace=True)
    df = pd.merge(df, df_success, on = ['category', 'launched_year', 'cat_goal_bin'], how = 'left')

    df_total = df.groupby(['category','launched_year','cat_goal_bin']).count()
    df_total['total_count'] = df_total['name']
    df_total = df_total[['total_count']]
    df_total.reset_index(inplace=True)
    df = pd.merge(df, df_total, on = ['category', 'launched_year', 'cat_goal_bin'], how = 'left')
    df['success_rate'] = df['success_count'] / df['total_count']
    df['success_rate'] = df['success_rate'].fillna(0)
    return df

## Combine all feature generating functions

In [15]:
result = create_rewards_tiers(df)
print("Rewards tiers done")
result = create_min_max_reward(result)
print("min max rewards done")
result = remove_backers(result)
print("remove backers done")

result = clean_text(result)
print("clean text done")
result['has_video'] = result['video'].apply(lambda x: 0 if pd.isnull(x) else 1)

result, tfidf_fit_rewards, tfidf_fit_description, tfidf_fit_description_story_processed, tfidf_fit_description_risks_processed, tfidf_feature_names = generate_nlp_features(result)
print("generate_nlp_features done")

result = generate_sentiment_features(result)
print("generate_sentiment_features done")
result = generate_word_count_features(result)
print("generate_word_count_features done")
result = generate_duration_features(result)
print("generate_duration_features done")
result, vect_corpus, threshold = generate_text_competitor(result)
print("generate_text_competitor done")
result = generate_cat_goal_competitor(result)
print("generate_cat_goal_competitor done")
result = generate_similiar_success_rate(result)
print("generate_similiar_success_rate done")

result, category_encoder = ohe_fit('category', result) #use encoder to fit train data
print("ohe_fit category done")
result, location_encoder = ohe_fit('location', result) #use encoder to fit train data
print("ohe_fit location done")

Rewards tiers done


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df["min_reward"] = 0
A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df["max_reward"] = 0


create min max reward done, now moving columns
min max rewards done
remove backers done
clean text done




generate_nlp_features done
generate_sentiment_features done
generate_word_count_features done
generate_duration_features done




generate_text_competitor done
generate_cat_goal_competitor done
generate_similiar_success_rate done
ohe_fit category done
ohe_fit location done


In [16]:
# tfidf_feature_names

In [17]:
# with open("tfidf_feature_names.txt", 'w') as f:
#     json.dump(tfidf_feature_names,f)

## Drop Unnecessary Features, Feature Scaling

In [18]:
to_drop = ['rewards', 'deadline', 'launched_at', 'rewards_processed', 'created_at',
           'description_processed', 'description_story_processed','description_risks_processed',
           'id', 'name', 'description', 'description_story', 'description_risks', 'video',
          'location', 'category', 'corpus', 'launched_month', 'launched_year', 'cat_goal_bin', 'success_count', 'total_count']

final_result = result.drop(to_drop, axis = 1)

#need feature scaling
scaler = MinMaxScaler() 
need_scaling = ['reward_tiers', 'min_reward', 'max_reward', 'goal', 'text_similarity_score',
               'description_story_polarity', 'description_story_subjectivity', 'description_polarity',
               'description_subjectivity', 'description_risks_polarity', 'description_risks_subjectivity',
               'rewards_polarity', 'rewards_subjectivity', 'description_story_word_count',
               'description_risks_word_count', 'rewards_word_count', 'funding_duration_in_days',
               'preparation_duration_in_days', 'competitiors_count', 'success_rate']
final_result[need_scaling] = scaler.fit_transform(final_result[need_scaling])

## Apply same feature engineering on Test Data

In [19]:
#test = pd.read_csv("kickstarter_test.csv")
test = pd.read_csv("/Users/ivankoh/Library/CloudStorage/OneDrive-NationalUniversityofSingapore/1D/NUS Y3S1/BT4222/Data/test/kickstarter_test.csv")
test = create_rewards_tiers(test)
test = create_min_max_reward(test)

test = clean_text(test)
test['has_video'] = test['video'].apply(lambda x: 0 if pd.isnull(x) else 1)

test = nlp_transform_test(test, tfidf_fit_rewards, tfidf_fit_description, tfidf_fit_description_story_processed, tfidf_fit_description_risks_processed)

test = generate_sentiment_features(test)
test = generate_word_count_features(test)
test = generate_duration_features(test)
test = generate_text_competitor_test(vect_corpus, test, threshold)
test = generate_cat_goal_competitor(test)
test = generate_similiar_success_rate(test)

#encoders
test = ohe_transform(category_encoder, 'category', test)
test = ohe_transform(location_encoder, 'location', test)

#drop and scale 
final_test = test.drop(to_drop, axis=1)
final_test[need_scaling] = scaler.transform(final_test[need_scaling])

create min max reward done, now moving columns


In [20]:
import pickle
tfidf_feature_names

with open('tfidf_feature_names.pkl', 'wb') as f:
    pickle.dump(tfidf_feature_names, f)

In [32]:
tfidf_feature_names

{'rewards': [(0, '1'),
  (1, '10'),
  (2, '100'),
  (3, '15'),
  (4, '2'),
  (5, '2014'),
  (6, '2015'),
  (7, '2015 ship'),
  (8, '2016'),
  (9, '2017'),
  (10, '2018'),
  (11, '2019'),
  (12, '2020'),
  (13, '2021'),
  (14, '2022'),
  (15, '25'),
  (16, '3'),
  (17, '5'),
  (18, '50'),
  (19, 'album'),
  (20, 'also'),
  (21, 'anywhere'),
  (22, 'anywhere world'),
  (23, 'anywhere world pledge'),
  (24, 'available'),
  (25, 'book'),
  (26, 'cd'),
  (27, 'choice'),
  (28, 'copy'),
  (29, 'credit'),
  (30, 'dec'),
  (31, 'delivery'),
  (32, 'delivery dec'),
  (33, 'delivery jun'),
  (34, 'delivery oct'),
  (35, 'delivery sep'),
  (36, 'digital'),
  (37, 'download'),
  (38, 'early'),
  (39, 'edition'),
  (40, 'estimated'),
  (41, 'estimated delivery'),
  (42, 'estimated delivery dec'),
  (43, 'estimated delivery jun'),
  (44, 'estimated delivery nov'),
  (45, 'estimated delivery oct'),
  (46, 'estimated delivery sep'),
  (47, 'exclusive'),
  (48, 'film'),
  (49, 'free'),
  (50, 'get'),
 

In [21]:
print(len(final_test.columns))
print(len(final_result.columns))

for i in result.columns:
    if i not in test.columns:
        print(i)

579
579


In [22]:
final_result.columns

Index(['reward_tiers', 'min_reward', 'max_reward', 'goal', 'state',
       'staff_pick', 'has_video', 'rewards_0', 'rewards_1', 'rewards_2',
       ...
       'x0_UY', 'x0_VE', 'x0_VN', 'x0_VU', 'x0_WS', 'x0_XK', 'x0_YE', 'x0_ZA',
       'x0_ZW', 'x0_nan'],
      dtype='object', length=579)

## Export

In [23]:
import time 

final_result.to_csv(f'/Users/ivankoh/Library/CloudStorage/OneDrive-NationalUniversityofSingapore/1D/NUS Y3S1/BT4222/Data/train/kickstarter_train_final_{time.strftime("%Y%m%d-%H%M%S")}.csv', index=False)
final_test.to_csv(f'/Users/ivankoh/Library/CloudStorage/OneDrive-NationalUniversityofSingapore/1D/NUS Y3S1/BT4222/Data/test/kickstarter_test_final_{time.strftime("%Y%m%d-%H%M%S")}.csv', index=False)


In [24]:
#since there could be more than one categories for each project, create new features to split the categories.
# df['new_category'] = df.category.str.split("/", expand=False)
# split_cat = pd.DataFrame(df['new_category'].tolist(), columns=['category1', 'category2'])
# #each project should at least have 1 category, 'category2' can be "None". 
# #'category1' being the main category for the project.
# df = pd.concat([df, split_cat], axis=1)
# df.head()t

In [25]:

pd.set_option('display.max_columns', None)

In [26]:
final_test.reward_tiers.value_counts()

0.033333    409
0.050000    388
0.058333    367
0.041667    364
0.025000    337
0.066667    291
0.075000    286
0.016667    274
0.000000    259
0.083333    199
0.091667    177
0.008333    160
0.100000    160
0.108333    117
0.116667    106
0.125000     90
0.133333     64
0.141667     48
0.150000     40
0.166667     29
0.158333     28
0.175000     27
0.191667     24
0.183333     17
0.216667     14
0.233333     11
0.200000     11
0.208333      9
0.241667      8
0.225000      8
0.250000      6
0.291667      5
0.275000      5
0.258333      4
0.266667      3
0.283333      3
0.350000      2
0.341667      2
0.325000      2
0.300000      2
0.358333      2
0.333333      2
0.375000      1
0.483333      1
0.833333      1
0.433333      1
0.308333      1
0.558333      1
0.491667      1
0.550000      1
0.316667      1
Name: reward_tiers, dtype: int64

In [27]:
final_test.head()

Unnamed: 0,reward_tiers,min_reward,max_reward,goal,state,staff_pick,has_video,rewards_0,rewards_1,rewards_2,rewards_3,rewards_4,rewards_5,rewards_6,rewards_7,rewards_8,rewards_9,rewards_10,rewards_11,rewards_12,rewards_13,rewards_14,rewards_15,rewards_16,rewards_17,rewards_18,rewards_19,rewards_20,rewards_21,rewards_22,rewards_23,rewards_24,rewards_25,rewards_26,rewards_27,rewards_28,rewards_29,rewards_30,rewards_31,rewards_32,rewards_33,rewards_34,rewards_35,rewards_36,rewards_37,rewards_38,rewards_39,rewards_40,rewards_41,rewards_42,rewards_43,rewards_44,rewards_45,rewards_46,rewards_47,rewards_48,rewards_49,rewards_50,rewards_51,rewards_52,rewards_53,rewards_54,rewards_55,rewards_56,rewards_57,rewards_58,rewards_59,rewards_60,rewards_61,rewards_62,rewards_63,rewards_64,rewards_65,rewards_66,rewards_67,rewards_68,rewards_69,rewards_70,rewards_71,rewards_72,rewards_73,rewards_74,rewards_75,rewards_76,rewards_77,rewards_78,rewards_79,rewards_80,rewards_81,rewards_82,rewards_83,rewards_84,rewards_85,rewards_86,rewards_87,rewards_88,rewards_89,rewards_90,rewards_91,rewards_92,rewards_93,rewards_94,rewards_95,rewards_96,rewards_97,rewards_98,rewards_99,description_0,description_1,description_2,description_3,description_4,description_5,description_6,description_7,description_8,description_9,description_10,description_11,description_12,description_13,description_14,description_15,description_16,description_17,description_18,description_19,description_20,description_21,description_22,description_23,description_24,description_25,description_26,description_27,description_28,description_29,description_30,description_31,description_32,description_33,description_34,description_35,description_36,description_37,description_38,description_39,description_40,description_41,description_42,description_43,description_44,description_45,description_46,description_47,description_48,description_49,description_50,description_51,description_52,description_53,description_54,description_55,description_56,description_57,description_58,description_59,description_60,description_61,description_62,description_63,description_64,description_65,description_66,description_67,description_68,description_69,description_70,description_71,description_72,description_73,description_74,description_75,description_76,description_77,description_78,description_79,description_80,description_81,description_82,description_83,description_84,description_85,description_86,description_87,description_88,description_89,description_90,description_91,description_92,description_93,description_94,description_95,description_96,description_97,description_98,description_99,description_story_0,description_story_1,description_story_2,description_story_3,description_story_4,description_story_5,description_story_6,description_story_7,description_story_8,description_story_9,description_story_10,description_story_11,description_story_12,description_story_13,description_story_14,description_story_15,description_story_16,description_story_17,description_story_18,description_story_19,description_story_20,description_story_21,description_story_22,description_story_23,description_story_24,description_story_25,description_story_26,description_story_27,description_story_28,description_story_29,description_story_30,description_story_31,description_story_32,description_story_33,description_story_34,description_story_35,description_story_36,description_story_37,description_story_38,description_story_39,description_story_40,description_story_41,description_story_42,description_story_43,description_story_44,description_story_45,description_story_46,description_story_47,description_story_48,description_story_49,description_story_50,description_story_51,description_story_52,description_story_53,description_story_54,description_story_55,description_story_56,description_story_57,description_story_58,description_story_59,description_story_60,description_story_61,description_story_62,description_story_63,description_story_64,description_story_65,description_story_66,description_story_67,description_story_68,description_story_69,description_story_70,description_story_71,description_story_72,description_story_73,description_story_74,description_story_75,description_story_76,description_story_77,description_story_78,description_story_79,description_story_80,description_story_81,description_story_82,description_story_83,description_story_84,description_story_85,description_story_86,description_story_87,description_story_88,description_story_89,description_story_90,description_story_91,description_story_92,description_story_93,description_story_94,description_story_95,description_story_96,description_story_97,description_story_98,description_story_99,description_risks_0,description_risks_1,description_risks_2,description_risks_3,description_risks_4,description_risks_5,description_risks_6,description_risks_7,description_risks_8,description_risks_9,description_risks_10,description_risks_11,description_risks_12,description_risks_13,description_risks_14,description_risks_15,description_risks_16,description_risks_17,description_risks_18,description_risks_19,description_risks_20,description_risks_21,description_risks_22,description_risks_23,description_risks_24,description_risks_25,description_risks_26,description_risks_27,description_risks_28,description_risks_29,description_risks_30,description_risks_31,description_risks_32,description_risks_33,description_risks_34,description_risks_35,description_risks_36,description_risks_37,description_risks_38,description_risks_39,description_risks_40,description_risks_41,description_risks_42,description_risks_43,description_risks_44,description_risks_45,description_risks_46,description_risks_47,description_risks_48,description_risks_49,description_risks_50,description_risks_51,description_risks_52,description_risks_53,description_risks_54,description_risks_55,description_risks_56,description_risks_57,description_risks_58,description_risks_59,description_risks_60,description_risks_61,description_risks_62,description_risks_63,description_risks_64,description_risks_65,description_risks_66,description_risks_67,description_risks_68,description_risks_69,description_risks_70,description_risks_71,description_risks_72,description_risks_73,description_risks_74,description_risks_75,description_risks_76,description_risks_77,description_risks_78,description_risks_79,description_risks_80,description_risks_81,description_risks_82,description_risks_83,description_risks_84,description_risks_85,description_risks_86,description_risks_87,description_risks_88,description_risks_89,description_risks_90,description_risks_91,description_risks_92,description_risks_93,description_risks_94,description_risks_95,description_risks_96,description_risks_97,description_risks_98,description_risks_99,description_story_polarity,description_story_subjectivity,description_polarity,description_subjectivity,description_risks_polarity,description_risks_subjectivity,rewards_polarity,rewards_subjectivity,description_story_word_count,description_risks_word_count,rewards_word_count,funding_duration_in_days,preparation_duration_in_days,text_similarity_score,competitiors_count,success_rate,x0_art,x0_comics,x0_crafts,x0_dance,x0_design,x0_fashion,x0_film & video,x0_food,x0_games,x0_journalism,x0_music,x0_photography,x0_publishing,x0_technology,x0_theater,x0_AE,x0_AF,x0_AM,x0_AO,x0_AQ,x0_AR,x0_AT,x0_AU,x0_AW,x0_AZ,x0_BA,x0_BD,x0_BE,x0_BF,x0_BG,x0_BR,x0_BS,x0_BT,x0_BY,x0_BZ,x0_CA,x0_CD,x0_CG,x0_CH,x0_CK,x0_CL,x0_CN,x0_CO,x0_CR,x0_CU,x0_CV,x0_CY,x0_CZ,x0_DE,x0_DJ,x0_DK,x0_DO,x0_EC,x0_EE,x0_EG,x0_ES,x0_ET,x0_FI,x0_FO,x0_FR,x0_GB,x0_GE,x0_GH,x0_GL,x0_GR,x0_GT,x0_GU,x0_HK,x0_HN,x0_HR,x0_HT,x0_HU,x0_ID,x0_IE,x0_IL,x0_IN,x0_IQ,x0_IS,x0_IT,x0_JM,x0_JO,x0_JP,x0_KE,x0_KH,x0_KR,x0_KW,x0_KZ,x0_LB,x0_LR,x0_LT,x0_LU,x0_LV,x0_MA,x0_MD,x0_ME,x0_MG,x0_ML,x0_MM,x0_MN,x0_MO,x0_MQ,x0_MT,x0_MU,x0_MW,x0_MX,x0_MY,x0_MZ,x0_NC,x0_NG,x0_NI,x0_NL,x0_NO,x0_NP,x0_NZ,x0_PA,x0_PE,x0_PH,x0_PK,x0_PL,x0_PR,x0_PS,x0_PT,x0_RO,x0_RS,x0_RU,x0_RW,x0_SE,x0_SG,x0_SI,x0_SJ,x0_SK,x0_SL,x0_SN,x0_SO,x0_SR,x0_SV,x0_SX,x0_TD,x0_TH,x0_TR,x0_TT,x0_TW,x0_TZ,x0_UA,x0_UG,x0_US,x0_UY,x0_VE,x0_VN,x0_VU,x0_WS,x0_XK,x0_YE,x0_ZA,x0_ZW,x0_nan
0,0.083333,3.3e-05,0.002495,3e-05,1,0,1,0.048532,0.043001,0.022009,0.023093,0.04597,0.0,0.0,0.0,0.43049,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.060252,0.047782,0.021928,0.0,0.0,0.039648,0.040146,0.0,0.0,0.0,0.0,0.031663,0.029582,0.111387,0.0,0.149658,0.0,0.399874,0.0,0.0,0.093903,0.192178,0.0,0.0,0.149658,0.149658,0.0,0.399874,0.0,0.0,0.0,0.0,0.043965,0.0,0.0,0.0,0.399745,0.149658,0.149658,0.149658,0.065704,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.149604,0.208682,0.0,0.079724,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.030969,0.040172,0.040185,0.0,0.0,0.0,0.030098,0.060772,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.186809,0.0,0.0,0.0,0.0,0.03913,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.845769,0.0,0.533549,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.346778,0.0,0.54075,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.31933,0.0,0.0,0.0,0.0,0.0,0.0,0.52599,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.188918,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.32953,0.253808,0.0,0.0,0.0,0.0,0.53125,0.458333,0.5,0.0,0.7625,0.5,0.510371,0.222729,0.01918,0.022517,0.050671,0.32831,0.000175,0.025108,0.046875,0.79064,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,0.066667,7e-06,0.00499,2.5e-05,1,0,0,0.082628,0.0,0.0,0.015727,0.015653,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.261311,0.0,0.047509,0.0,0.03254,0.0,0.0,0.040518,0.0,0.0,0.0,0.03718,0.026494,0.0,0.0,0.0,0.353997,0.0,0.083389,0.0,0.0,0.025328,0.123445,0.511598,0.0,0.237133,0.046499,0.083389,0.083389,0.0,0.0,0.0,0.025328,0.123445,0.0,0.059882,0.0,0.143042,0.142146,0.0,0.092654,0.083389,0.083389,0.134236,0.041982,0.042325,0.0,0.174568,0.0,0.02526,0.031114,0.083359,0.116277,0.0,0.0,0.265741,0.0,0.06793,0.042341,0.042344,0.123425,0.093668,0.063272,0.0,0.0,0.121055,0.12629,0.0,0.266466,0.020693,0.123691,0.0,0.0,0.0,0.0,0.023034,0.0,0.12722,0.119936,0.125273,0.0,0.086417,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.52437,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.587769,0.0,0.616088,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.060433,0.0,0.083069,0.0,0.0,0.0,0.0,0.0,0.103592,0.0,0.083247,0.07433,0.089211,0.0,0.157483,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.31184,0.088662,0.0,0.084199,0.082692,0.24859,0.0,0.0,0.0,0.0,0.0,0.058081,0.115143,0.0,0.071015,0.081487,0.0,0.0,0.0,0.06288,0.073546,0.0,0.172183,0.0,0.072551,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.088211,0.0,0.105127,0.0,0.083404,0.0,0.0,0.0,0.0,0.0,0.0,0.258631,0.0,0.090868,0.0,0.0,0.431221,0.101926,0.143019,0.074627,0.392535,0.0,0.0,0.0,0.0,0.0,0.311294,0.084707,0.0,0.0,0.06757,0.0,0.206222,0.0,0.0,0.08658,0.209838,0.0,0.0,0.0,0.0,0.0,0.0,0.46049,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.266942,0.0,0.0,0.0,0.190496,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.186852,0.0,0.0,0.0,0.211781,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.255864,0.0,0.0,0.0,0.228017,0.39027,0.0,0.0,0.0,0.0,0.23686,0.0,0.151843,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.161933,0.0,0.255765,0.0,0.0,0.0,0.400089,0.0,0.0,0.0,0.0,0.584517,0.49186,0.5,0.15,0.520022,0.27316,0.434197,0.242019,0.082934,0.080831,0.141804,0.162822,0.006493,0.146229,0.03125,0.88961,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,0.1,7e-06,0.002495,4.2e-05,1,1,1,0.054363,0.144504,0.024653,0.051735,0.128734,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.026048,0.168728,0.133807,0.024562,0.0,0.0,0.222059,0.224846,0.0,0.061154,0.0,0.0,0.0,0.0,0.0,0.0,0.198119,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.038241,0.198119,0.198119,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.104568,0.0,0.0,0.198119,0.198119,0.198119,0.147196,0.0,0.0,0.151642,0.0,0.0,0.0,0.025588,0.213281,0.276255,0.0,0.178605,0.079472,0.0,0.0,0.0,0.0,0.0,0.038517,0.208141,0.224994,0.225064,0.066371,0.069241,0.0,0.0,0.0,0.067816,0.0,0.0,0.26989,0.029213,0.0,0.0,0.2473,0.065758,0.068684,0.0,0.0,0.219159,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.609372,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.582076,0.0,0.0,0.0,0.0,0.538381,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.061955,0.0,0.0,0.0,0.187807,0.543352,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.268921,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.127812,0.285604,0.0,0.0,0.098835,0.063454,0.0,0.0,0.047501,0.0,0.0,0.054414,0.0,0.0,0.0,0.0,0.321106,0.0,0.0,0.0,0.0,0.047387,0.0,0.0,0.12976,0.061666,0.0,0.0,0.0,0.0,0.04896,0.047166,0.088324,0.0,0.052485,0.0,0.0,0.0,0.316902,0.0,0.0,0.228859,0.0,0.125796,0.058829,0.0,0.066986,0.0,0.068138,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.089393,0.0,0.0,0.0,0.127673,0.0,0.0,0.050922,0.053298,0.0,0.0,0.348607,0.0,0.052712,0.0,0.0,0.0,0.0,0.349146,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.40393,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.209641,0.0,0.0,0.0,0.0,0.183457,0.0,0.0,0.320479,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.170069,0.0,0.0,0.0,0.166459,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.156702,0.239146,0.0,0.0,0.0,0.570626,0.0,0.0,0.0,0.211722,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.160644,0.0,0.0,0.0,0.0,0.593031,0.446306,0.4875,0.1625,0.425,0.1,0.548396,0.356664,0.091458,0.04388,0.090565,0.322088,0.00872,0.1555,0.078125,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
3,0.058333,0.0001,0.001755,3e-05,0,0,0,0.04874,0.043186,0.044207,0.046384,0.046168,0.0,0.0,0.0,0.0,0.0,0.664575,0.0,0.0,0.0,0.0,0.093415,0.0,0.0,0.132131,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.21862,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.21862,0.21862,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.046877,0.0,0.0,0.21862,0.21862,0.21862,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.41295,0.21854,0.0,0.063375,0.0,0.0,0.053311,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.061033,0.0,0.0,0.0,0.0,0.0,0.0,0.061974,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.626528,0.626711,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.463352,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.244552,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.334624,0.0,0.0,0.0,0.0,0.146093,0.0,0.0,0.465941,0.378877,0.0,0.164873,0.0,0.0,0.147958,0.127226,0.0,0.0,0.0,0.0,0.146794,0.0,0.0,0.0,0.262898,0.126631,0.0,0.0,0.0,0.181288,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.179846,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.144687,0.0,0.0,0.0,0.172419,0.0,0.0,0.0,0.0,0.0,0.0,0.261142,0.136716,0.0,0.0,0.0,0.267414,0.0,0.0,0.0,0.0,0.371498,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.253395,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.418851,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.424306,0.0,0.309619,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.426803,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.242011,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.325138,0.0,0.0,0.0,0.0,0.549091,0.394747,0.6,0.416667,0.57,0.645,0.527882,0.406106,0.031078,0.024249,0.068255,0.32831,0.002577,0.107472,0.0,0.668831,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
4,0.05,6.7e-05,0.006245,0.0002,1,1,1,0.035782,0.015852,0.016227,0.017026,0.067786,0.0,0.0,0.0,0.0,0.0,0.213449,0.0,0.0,0.0,0.0,0.017145,0.088846,0.0,0.016167,0.0,0.0,0.0,0.0,0.0,0.020126,0.0,0.0,0.023345,0.0,0.0,0.0,0.070217,0.0,0.0,0.0,0.0,0.0,0.793461,0.282397,0.0,0.070217,0.070217,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.215021,0.275308,0.115418,0.0,0.070217,0.070217,0.070217,0.0,0.022725,0.022911,0.0,0.0,0.0,0.0,0.084211,0.070191,0.09791,0.09305,0.0,0.0,0.039137,0.018386,0.02292,0.022921,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.044806,0.0,0.0,0.0,0.0,0.134597,0.0,0.045497,0.087647,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.742019,0.0,0.670378,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.088325,0.270599,0.0,0.085251,0.0,0.039061,0.042378,0.0,0.0,0.5272,0.039522,0.0,0.041653,0.078288,0.0,0.041948,0.0,0.148102,0.0,0.0,0.389073,0.170178,0.0,0.037759,0.0753,0.119622,0.044551,0.0,0.04169,0.123336,0.0,0.116649,0.058446,0.355658,0.0,0.0,0.101855,0.039729,0.109242,0.162426,0.0,0.066785,0.0,0.0,0.0,0.068771,0.059134,0.069165,0.072445,0.215903,0.0,0.0,0.0,0.0,0.0,0.061097,0.117716,0.0,0.038109,0.0,0.0,0.0,0.04805,0.098865,0.0,0.0,0.085678,0.0,0.039245,0.036707,0.041169,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.047927,0.0,0.0,0.138432,0.039542,0.0,0.027888,0.0,0.036928,0.146376,0.0,0.0,0.091034,0.063546,0.033255,0.0,0.0,0.031073,0.0,0.03289,0.034209,0.085096,0.125056,0.0,0.0,0.0,0.0,0.398012,0.403208,0.0,0.0,0.0,0.0,0.085299,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.142832,0.0,0.0,0.0,0.0,0.249985,0.0,0.149541,0.0,0.116594,0.127229,0.0,0.0,0.130675,0.344739,0.125296,0.0,0.0,0.0,0.0,0.204464,0.137705,0.0,0.126544,0.115871,0.0,0.151071,0.0,0.113411,0.127858,0.0,0.0,0.0,0.0,0.13999,0.0,0.0,0.128319,0.249509,0.0,0.0,0.0,0.0,0.138273,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.12115,0.132838,0.0,0.0,0.105937,0.0,0.0,0.0,0.0,0.0,0.257322,0.0,0.0,0.0,0.640451,0.532595,0.55,0.45,0.779261,0.518253,0.683543,0.542226,0.241343,0.12067,0.167707,0.254317,0.032054,0.136529,0.015625,0.696429,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [28]:
final_result.head()

Unnamed: 0,reward_tiers,min_reward,max_reward,goal,state,staff_pick,has_video,rewards_0,rewards_1,rewards_2,rewards_3,rewards_4,rewards_5,rewards_6,rewards_7,rewards_8,rewards_9,rewards_10,rewards_11,rewards_12,rewards_13,rewards_14,rewards_15,rewards_16,rewards_17,rewards_18,rewards_19,rewards_20,rewards_21,rewards_22,rewards_23,rewards_24,rewards_25,rewards_26,rewards_27,rewards_28,rewards_29,rewards_30,rewards_31,rewards_32,rewards_33,rewards_34,rewards_35,rewards_36,rewards_37,rewards_38,rewards_39,rewards_40,rewards_41,rewards_42,rewards_43,rewards_44,rewards_45,rewards_46,rewards_47,rewards_48,rewards_49,rewards_50,rewards_51,rewards_52,rewards_53,rewards_54,rewards_55,rewards_56,rewards_57,rewards_58,rewards_59,rewards_60,rewards_61,rewards_62,rewards_63,rewards_64,rewards_65,rewards_66,rewards_67,rewards_68,rewards_69,rewards_70,rewards_71,rewards_72,rewards_73,rewards_74,rewards_75,rewards_76,rewards_77,rewards_78,rewards_79,rewards_80,rewards_81,rewards_82,rewards_83,rewards_84,rewards_85,rewards_86,rewards_87,rewards_88,rewards_89,rewards_90,rewards_91,rewards_92,rewards_93,rewards_94,rewards_95,rewards_96,rewards_97,rewards_98,rewards_99,description_0,description_1,description_2,description_3,description_4,description_5,description_6,description_7,description_8,description_9,description_10,description_11,description_12,description_13,description_14,description_15,description_16,description_17,description_18,description_19,description_20,description_21,description_22,description_23,description_24,description_25,description_26,description_27,description_28,description_29,description_30,description_31,description_32,description_33,description_34,description_35,description_36,description_37,description_38,description_39,description_40,description_41,description_42,description_43,description_44,description_45,description_46,description_47,description_48,description_49,description_50,description_51,description_52,description_53,description_54,description_55,description_56,description_57,description_58,description_59,description_60,description_61,description_62,description_63,description_64,description_65,description_66,description_67,description_68,description_69,description_70,description_71,description_72,description_73,description_74,description_75,description_76,description_77,description_78,description_79,description_80,description_81,description_82,description_83,description_84,description_85,description_86,description_87,description_88,description_89,description_90,description_91,description_92,description_93,description_94,description_95,description_96,description_97,description_98,description_99,description_story_0,description_story_1,description_story_2,description_story_3,description_story_4,description_story_5,description_story_6,description_story_7,description_story_8,description_story_9,description_story_10,description_story_11,description_story_12,description_story_13,description_story_14,description_story_15,description_story_16,description_story_17,description_story_18,description_story_19,description_story_20,description_story_21,description_story_22,description_story_23,description_story_24,description_story_25,description_story_26,description_story_27,description_story_28,description_story_29,description_story_30,description_story_31,description_story_32,description_story_33,description_story_34,description_story_35,description_story_36,description_story_37,description_story_38,description_story_39,description_story_40,description_story_41,description_story_42,description_story_43,description_story_44,description_story_45,description_story_46,description_story_47,description_story_48,description_story_49,description_story_50,description_story_51,description_story_52,description_story_53,description_story_54,description_story_55,description_story_56,description_story_57,description_story_58,description_story_59,description_story_60,description_story_61,description_story_62,description_story_63,description_story_64,description_story_65,description_story_66,description_story_67,description_story_68,description_story_69,description_story_70,description_story_71,description_story_72,description_story_73,description_story_74,description_story_75,description_story_76,description_story_77,description_story_78,description_story_79,description_story_80,description_story_81,description_story_82,description_story_83,description_story_84,description_story_85,description_story_86,description_story_87,description_story_88,description_story_89,description_story_90,description_story_91,description_story_92,description_story_93,description_story_94,description_story_95,description_story_96,description_story_97,description_story_98,description_story_99,description_risks_0,description_risks_1,description_risks_2,description_risks_3,description_risks_4,description_risks_5,description_risks_6,description_risks_7,description_risks_8,description_risks_9,description_risks_10,description_risks_11,description_risks_12,description_risks_13,description_risks_14,description_risks_15,description_risks_16,description_risks_17,description_risks_18,description_risks_19,description_risks_20,description_risks_21,description_risks_22,description_risks_23,description_risks_24,description_risks_25,description_risks_26,description_risks_27,description_risks_28,description_risks_29,description_risks_30,description_risks_31,description_risks_32,description_risks_33,description_risks_34,description_risks_35,description_risks_36,description_risks_37,description_risks_38,description_risks_39,description_risks_40,description_risks_41,description_risks_42,description_risks_43,description_risks_44,description_risks_45,description_risks_46,description_risks_47,description_risks_48,description_risks_49,description_risks_50,description_risks_51,description_risks_52,description_risks_53,description_risks_54,description_risks_55,description_risks_56,description_risks_57,description_risks_58,description_risks_59,description_risks_60,description_risks_61,description_risks_62,description_risks_63,description_risks_64,description_risks_65,description_risks_66,description_risks_67,description_risks_68,description_risks_69,description_risks_70,description_risks_71,description_risks_72,description_risks_73,description_risks_74,description_risks_75,description_risks_76,description_risks_77,description_risks_78,description_risks_79,description_risks_80,description_risks_81,description_risks_82,description_risks_83,description_risks_84,description_risks_85,description_risks_86,description_risks_87,description_risks_88,description_risks_89,description_risks_90,description_risks_91,description_risks_92,description_risks_93,description_risks_94,description_risks_95,description_risks_96,description_risks_97,description_risks_98,description_risks_99,description_story_polarity,description_story_subjectivity,description_polarity,description_subjectivity,description_risks_polarity,description_risks_subjectivity,rewards_polarity,rewards_subjectivity,description_story_word_count,description_risks_word_count,rewards_word_count,funding_duration_in_days,preparation_duration_in_days,text_similarity_score,competitiors_count,success_rate,x0_art,x0_comics,x0_crafts,x0_dance,x0_design,x0_fashion,x0_film & video,x0_food,x0_games,x0_journalism,x0_music,x0_photography,x0_publishing,x0_technology,x0_theater,x0_AE,x0_AF,x0_AM,x0_AO,x0_AQ,x0_AR,x0_AT,x0_AU,x0_AW,x0_AZ,x0_BA,x0_BD,x0_BE,x0_BF,x0_BG,x0_BR,x0_BS,x0_BT,x0_BY,x0_BZ,x0_CA,x0_CD,x0_CG,x0_CH,x0_CK,x0_CL,x0_CN,x0_CO,x0_CR,x0_CU,x0_CV,x0_CY,x0_CZ,x0_DE,x0_DJ,x0_DK,x0_DO,x0_EC,x0_EE,x0_EG,x0_ES,x0_ET,x0_FI,x0_FO,x0_FR,x0_GB,x0_GE,x0_GH,x0_GL,x0_GR,x0_GT,x0_GU,x0_HK,x0_HN,x0_HR,x0_HT,x0_HU,x0_ID,x0_IE,x0_IL,x0_IN,x0_IQ,x0_IS,x0_IT,x0_JM,x0_JO,x0_JP,x0_KE,x0_KH,x0_KR,x0_KW,x0_KZ,x0_LB,x0_LR,x0_LT,x0_LU,x0_LV,x0_MA,x0_MD,x0_ME,x0_MG,x0_ML,x0_MM,x0_MN,x0_MO,x0_MQ,x0_MT,x0_MU,x0_MW,x0_MX,x0_MY,x0_MZ,x0_NC,x0_NG,x0_NI,x0_NL,x0_NO,x0_NP,x0_NZ,x0_PA,x0_PE,x0_PH,x0_PK,x0_PL,x0_PR,x0_PS,x0_PT,x0_RO,x0_RS,x0_RU,x0_RW,x0_SE,x0_SG,x0_SI,x0_SJ,x0_SK,x0_SL,x0_SN,x0_SO,x0_SR,x0_SV,x0_SX,x0_TD,x0_TH,x0_TR,x0_TT,x0_TW,x0_TZ,x0_UA,x0_UG,x0_US,x0_UY,x0_VE,x0_VN,x0_VU,x0_WS,x0_XK,x0_YE,x0_ZA,x0_ZW,x0_nan
0,0.041667,0.000167,0.004995,9e-05,1,1,1,0.042075,0.0,0.038161,0.0,0.039854,0.075896,0.0,0.0,0.0,0.0,0.430264,0.0,0.0,0.0,0.0,0.08064,0.0,0.0,0.03802,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.3452,0.14154,0.346071,0.0,0.0,0.0,0.0,0.0,0.0,0.059194,0.14154,0.14154,0.346095,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.14154,0.14154,0.14154,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.079216,0.141489,0.197363,0.109414,0.0,0.061508,0.0,0.0,0.0,0.0,0.0,0.0,0.080546,0.0,0.0,0.154105,0.160769,0.0,0.0,0.0,0.157461,0.112914,0.113068,0.0,0.0,0.175933,0.053498,0.176676,0.15268,0.159475,0.112914,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.62069,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.473705,0.0,0.0,0.484473,0.0,0.394504,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.064879,0.056791,0.0,0.041747,0.0,0.0,0.186771,0.0,0.0,0.070409,0.058061,0.0,0.0,0.115012,0.051346,0.0,0.057194,0.0,0.0,0.0,0.114316,0.062502,0.0,0.055471,0.0,0.117157,0.0,0.0,0.0,0.045298,0.058164,0.114245,0.0,0.043541,0.179142,0.051199,0.199512,0.0,0.120365,0.198849,0.452739,0.147169,0.0,0.088578,0.0,0.050515,0.0,0.0,0.053214,0.079295,0.056525,0.050117,0.122577,0.054432,0.062484,0.044879,0.129701,0.080961,0.055986,0.0,0.0,0.182806,0.0,0.0,0.066572,0.172843,0.125868,0.0,0.0,0.10785,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.059577,0.0,0.098796,0.0,0.0,0.0,0.353198,0.0,0.121133,0.0,0.129023,0.0,0.0,0.0,0.093354,0.048855,0.047485,0.0,0.365195,0.179426,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.66354,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.748141,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.554239,0.505709,0.568182,0.454545,0.6,0.2,0.331289,0.553349,0.1458,0.004042,0.053507,0.354723,0.001949,0.820679,0.015625,0.428571,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,0.058333,6.7e-05,0.004495,5e-05,1,1,1,0.0,0.07589,0.155369,0.0,0.0,0.0,0.340467,0.276474,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.054719,0.035445,0.0,0.051598,0.0,0.0,0.139945,0.141701,0.122743,0.064234,0.228864,0.0,0.074507,0.0,0.0,0.0,0.128059,0.0,0.256622,0.0,0.0,0.0,0.0,0.0,0.120501,0.128059,0.128059,0.0,0.256622,0.0,0.0,0.0,0.0,0.0,0.042891,0.0,0.0,0.25654,0.128059,0.128059,0.128059,0.0,0.0,0.0,0.079639,0.0,0.0,0.0,0.053753,0.128013,0.178565,0.222734,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.109311,0.141795,0.141839,0.0,0.0,0.0,0.106237,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.319697,0.0,0.0,0.0,0.0,0.138118,0.122721,0.159086,0.097691,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.798646,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.601801,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.092087,0.048038,0.201778,0.0,0.0,0.0,0.0,0.08102,0.0,0.576408,0.0,0.066172,0.0,0.0,0.0,0.0,0.0,0.0,0.065772,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.140953,0.052124,0.0,0.0,0.098801,0.100205,0.068713,0.058915,0.11479,0.0,0.0,0.0,0.520967,0.056449,0.0,0.0,0.0,0.058128,0.149948,0.058461,0.0,0.045622,0.065044,0.230681,0.0,0.062635,0.0,0.154926,0.099498,0.046581,0.0,0.05536,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.186155,0.069596,0.0,0.0,0.0,0.07223,0.0,0.0,0.0,0.0,0.056842,0.0,0.0,0.0,0.067737,0.094289,0.0,0.0,0.049489,0.0,0.0,0.051297,0.0,0.168652,0.0,0.0,0.052529,0.0,0.111199,0.0,0.143853,0.0,0.0,0.0,0.098083,0.0,0.0,0.0,0.0,0.782397,0.0,0.0,0.0,0.0,0.0,0.115434,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.364527,0.118851,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.087856,0.0,0.0,0.0,0.0,0.0,0.0,0.098281,0.0,0.127986,0.113014,0.0,0.0,0.0,0.0,0.111578,0.122674,0.0,0.0,0.116076,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.098542,0.0,0.0,0.0,0.0,0.10729,0.0,0.108164,0.0,0.089995,0.0,0.114747,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.102122,0.0,0.0,0.0,0.0,0.0,0.0,0.099812,0.0,0.184518,0.0,0.0,0.109238,0.099211,0.5824,0.478153,0.568182,0.454545,0.556314,0.516448,0.498619,0.347488,0.110105,0.193418,0.068066,0.260384,0.005691,0.758359,0.125,0.392857,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,0.058333,3.3e-05,0.000525,6e-06,1,0,1,0.0,0.025295,0.0,0.027168,0.054083,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.401266,0.0,0.027358,0.14177,0.112429,0.0,0.0,0.034998,0.0,0.0,0.0,0.0,0.320389,0.0,0.074502,0.034802,0.0,0.0,0.128051,0.0,0.342141,0.0,0.0,0.368251,0.0,0.0,0.0,0.128051,0.128051,0.0,0.342141,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.245563,0.342031,0.128051,0.128051,0.128051,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.128004,0.0,0.0,0.046897,0.0,0.156127,0.029338,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.030682,0.0,0.0,0.01998,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.018755,0.0,0.013787,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.020209,0.0,0.0,0.020352,0.0,0.0,0.037076,0.602525,0.0,0.0,0.473041,0.018319,0.0,0.0,0.0,0.023714,0.040454,0.01496,0.0,0.018865,0.0,0.0,0.039441,0.016909,0.0,0.0,0.039751,0.0,0.0,0.0,0.01859,0.4973,0.0,0.033365,0.043035,0.016778,0.0,0.013094,0.0,0.016551,0.020241,0.017976,0.061906,0.014821,0.0,0.0,0.036979,0.015888,0.020441,0.0,0.0,0.0,0.0,0.019027,0.055424,0.358755,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.048941,0.017025,0.0,0.038369,0.0,0.013531,0.020002,0.017916,0.0,0.0,0.040061,0.014722,0.015415,0.048403,0.015682,0.0,0.045227,0.0,0.0,0.033194,0.027524,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.441967,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.897032,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.68579,0.575664,0.5,0.0,0.5,0.0,0.531864,0.312128,0.141716,0.016166,0.147665,0.2151,0.000611,0.124125,0.125,0.841615,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
3,0.041667,0.000133,0.01099,0.00034,1,0,1,0.019887,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.032074,0.0,0.0,0.0,0.139856,0.0,0.216621,0.0,0.0,0.0,0.0,0.353402,0.02438,0.097481,0.098705,0.085499,0.201346,0.0,0.540795,0.0,0.387898,0.0,0.0,0.066902,0.0,0.0,0.0,0.148557,0.0,0.0,0.0,0.223833,0.066902,0.066902,0.0,0.0,0.0,0.0,0.148557,0.0,0.0,0.0,0.0,0.14968,0.0,0.066902,0.066902,0.066902,0.134619,0.025261,0.025468,0.110949,0.070026,0.0,0.0,0.018721,0.066877,0.0,0.0,0.0,0.0,0.0,0.020437,0.025477,0.025479,0.148533,0.0,0.139595,0.09877,0.098801,0.0,0.0,0.0,0.17267,0.049806,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.096209,0.085483,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.53341,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.845857,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.710235,0.074101,0.051875,0.0,0.0,0.17205,0.050374,0.0,0.0,0.0,0.0,0.051036,0.09114,0.054693,0.152278,0.0,0.099635,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.058086,0.0,0.0,0.0,0.103241,0.050696,0.0,0.038643,0.0,0.0,0.044267,0.0,0.0,0.035296,0.0,0.087075,0.0,0.0,0.0,0.044832,0.0,0.0,0.094454,0.070374,0.0,0.0,0.0,0.0,0.110909,0.079659,0.0,0.035926,0.049687,0.042697,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.051168,0.0,0.0,0.0,0.052853,0.055431,0.0,0.0,0.0,0.0,0.124976,0.0,0.0,0.0,0.0,0.052244,0.145445,0.0,0.0,0.0,0.0,0.0,0.514328,0.0,0.086717,0.12643,0.0,0.0,0.0,0.042882,0.0,0.036983,0.0,0.398091,0.0,0.0,0.0,0.0,0.0,0.324514,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.352524,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.334799,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.67367,0.0,0.0,0.0,0.214521,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.54881,0.438095,0.5,0.5,0.64375,0.669444,0.437388,0.24792,0.094655,0.021363,0.145207,0.271705,0.01396,0.674364,0.234375,0.862013,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
4,0.066667,7e-06,0.004995,0.0002,1,1,1,0.035196,0.031185,0.031923,0.033495,0.033339,0.0,0.0,0.0,0.510872,0.0,0.0,0.0,0.0,0.0,0.0,0.033728,0.043696,0.0,0.031805,0.0,0.0,0.086261,0.087343,0.090789,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.177603,0.0,0.052727,0.0,0.0,0.0454,0.055748,0.0,0.0,0.177603,0.177603,0.0,0.052727,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.05271,0.177603,0.177603,0.177603,0.0,0.0,0.0,0.392712,0.041311,0.0,0.0,0.0,0.177538,0.247648,0.366111,0.0,0.0,0.11549,0.0,0.0,0.0,0.0,0.049874,0.067379,0.087401,0.087428,0.0,0.0,0.0,0.0,0.044073,0.0,0.0,0.0,0.0,0.0,0.049057,0.0,0.221691,0.0,0.0,0.0,0.046013,0.085135,0.090773,0.117671,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.578647,0.0,0.0,0.357578,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.543483,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.491866,0.0,0.0,0.102809,0.0,0.151151,0.0,0.0,0.338116,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.207079,0.0,0.101618,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.078823,0.0,0.0,0.0,0.0,0.2179,0.287985,0.0,0.0,0.0,0.0,0.0,0.091449,0.078635,0.0,0.0,0.215325,0.0,0.0,0.0,0.0,0.33935,0.0,0.469603,0.073283,0.202704,0.0,0.0,0.0,0.0,0.0,0.0,0.104301,0.0,0.0,0.104373,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.093325,0.0,0.0,0.0,0.0,0.0,0.098211,0.077858,0.0,0.1098,0.0,0.0,0.0,0.0,0.12473,0.330561,0.0,0.174942,0.0,0.075438,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.262929,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.26236,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.210996,0.0,0.24589,0.0,0.259116,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.49421,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.32112,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.25673,0.0,0.17123,0.0,0.0,0.0,0.0,0.0,0.0,0.497315,0.0,0.0,0.0,0.583499,0.499051,0.5,0.0,0.507975,0.555092,0.517629,0.354621,0.075475,0.081409,0.059369,0.339632,0.011767,0.539894,0.125,0.349143,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [29]:
result.head()

Unnamed: 0,id,name,description,description_story,description_risks,rewards,reward_tiers,min_reward,max_reward,category,goal,deadline,location,state,staff_pick,video,launched_at,created_at,rewards_processed,description_processed,description_story_processed,description_risks_processed,has_video,rewards_0,rewards_1,rewards_2,rewards_3,rewards_4,rewards_5,rewards_6,rewards_7,rewards_8,rewards_9,rewards_10,rewards_11,rewards_12,rewards_13,rewards_14,rewards_15,rewards_16,rewards_17,rewards_18,rewards_19,rewards_20,rewards_21,rewards_22,rewards_23,rewards_24,rewards_25,rewards_26,rewards_27,rewards_28,rewards_29,rewards_30,rewards_31,rewards_32,rewards_33,rewards_34,rewards_35,rewards_36,rewards_37,rewards_38,rewards_39,rewards_40,rewards_41,rewards_42,rewards_43,rewards_44,rewards_45,rewards_46,rewards_47,rewards_48,rewards_49,rewards_50,rewards_51,rewards_52,rewards_53,rewards_54,rewards_55,rewards_56,rewards_57,rewards_58,rewards_59,rewards_60,rewards_61,rewards_62,rewards_63,rewards_64,rewards_65,rewards_66,rewards_67,rewards_68,rewards_69,rewards_70,rewards_71,rewards_72,rewards_73,rewards_74,rewards_75,rewards_76,rewards_77,rewards_78,rewards_79,rewards_80,rewards_81,rewards_82,rewards_83,rewards_84,rewards_85,rewards_86,rewards_87,rewards_88,rewards_89,rewards_90,rewards_91,rewards_92,rewards_93,rewards_94,rewards_95,rewards_96,rewards_97,rewards_98,rewards_99,description_0,description_1,description_2,description_3,description_4,description_5,description_6,description_7,description_8,description_9,description_10,description_11,description_12,description_13,description_14,description_15,description_16,description_17,description_18,description_19,description_20,description_21,description_22,description_23,description_24,description_25,description_26,description_27,description_28,description_29,description_30,description_31,description_32,description_33,description_34,description_35,description_36,description_37,description_38,description_39,description_40,description_41,description_42,description_43,description_44,description_45,description_46,description_47,description_48,description_49,description_50,description_51,description_52,description_53,description_54,description_55,description_56,description_57,description_58,description_59,description_60,description_61,description_62,description_63,description_64,description_65,description_66,description_67,description_68,description_69,description_70,description_71,description_72,description_73,description_74,description_75,description_76,description_77,description_78,description_79,description_80,description_81,description_82,description_83,description_84,description_85,description_86,description_87,description_88,description_89,description_90,description_91,description_92,description_93,description_94,description_95,description_96,description_97,description_98,description_99,description_story_0,description_story_1,description_story_2,description_story_3,description_story_4,description_story_5,description_story_6,description_story_7,description_story_8,description_story_9,description_story_10,description_story_11,description_story_12,description_story_13,description_story_14,description_story_15,description_story_16,description_story_17,description_story_18,description_story_19,description_story_20,description_story_21,description_story_22,description_story_23,description_story_24,description_story_25,description_story_26,description_story_27,description_story_28,description_story_29,description_story_30,description_story_31,description_story_32,description_story_33,description_story_34,description_story_35,description_story_36,description_story_37,description_story_38,description_story_39,description_story_40,description_story_41,description_story_42,description_story_43,description_story_44,description_story_45,description_story_46,description_story_47,description_story_48,description_story_49,description_story_50,description_story_51,description_story_52,description_story_53,description_story_54,description_story_55,description_story_56,description_story_57,description_story_58,description_story_59,description_story_60,description_story_61,description_story_62,description_story_63,description_story_64,description_story_65,description_story_66,description_story_67,description_story_68,description_story_69,description_story_70,description_story_71,description_story_72,description_story_73,description_story_74,description_story_75,description_story_76,description_story_77,description_story_78,description_story_79,description_story_80,description_story_81,description_story_82,description_story_83,description_story_84,description_story_85,description_story_86,description_story_87,description_story_88,description_story_89,description_story_90,description_story_91,description_story_92,description_story_93,description_story_94,description_story_95,description_story_96,description_story_97,description_story_98,description_story_99,description_risks_0,description_risks_1,description_risks_2,description_risks_3,description_risks_4,description_risks_5,description_risks_6,description_risks_7,description_risks_8,description_risks_9,description_risks_10,description_risks_11,description_risks_12,description_risks_13,description_risks_14,description_risks_15,description_risks_16,description_risks_17,description_risks_18,description_risks_19,description_risks_20,description_risks_21,description_risks_22,description_risks_23,description_risks_24,description_risks_25,description_risks_26,description_risks_27,description_risks_28,description_risks_29,description_risks_30,description_risks_31,description_risks_32,description_risks_33,description_risks_34,description_risks_35,description_risks_36,description_risks_37,description_risks_38,description_risks_39,description_risks_40,description_risks_41,description_risks_42,description_risks_43,description_risks_44,description_risks_45,description_risks_46,description_risks_47,description_risks_48,description_risks_49,description_risks_50,description_risks_51,description_risks_52,description_risks_53,description_risks_54,description_risks_55,description_risks_56,description_risks_57,description_risks_58,description_risks_59,description_risks_60,description_risks_61,description_risks_62,description_risks_63,description_risks_64,description_risks_65,description_risks_66,description_risks_67,description_risks_68,description_risks_69,description_risks_70,description_risks_71,description_risks_72,description_risks_73,description_risks_74,description_risks_75,description_risks_76,description_risks_77,description_risks_78,description_risks_79,description_risks_80,description_risks_81,description_risks_82,description_risks_83,description_risks_84,description_risks_85,description_risks_86,description_risks_87,description_risks_88,description_risks_89,description_risks_90,description_risks_91,description_risks_92,description_risks_93,description_risks_94,description_risks_95,description_risks_96,description_risks_97,description_risks_98,description_risks_99,description_story_polarity,description_story_subjectivity,description_polarity,description_subjectivity,description_risks_polarity,description_risks_subjectivity,rewards_polarity,rewards_subjectivity,description_story_word_count,description_risks_word_count,rewards_word_count,funding_duration_in_days,preparation_duration_in_days,corpus,text_similarity_score,launched_month,launched_year,cat_goal_bin,competitiors_count,success_count,total_count,success_rate,x0_art,x0_comics,x0_crafts,x0_dance,x0_design,x0_fashion,x0_film & video,x0_food,x0_games,x0_journalism,x0_music,x0_photography,x0_publishing,x0_technology,x0_theater,x0_AE,x0_AF,x0_AM,x0_AO,x0_AQ,x0_AR,x0_AT,x0_AU,x0_AW,x0_AZ,x0_BA,x0_BD,x0_BE,x0_BF,x0_BG,x0_BR,x0_BS,x0_BT,x0_BY,x0_BZ,x0_CA,x0_CD,x0_CG,x0_CH,x0_CK,x0_CL,x0_CN,x0_CO,x0_CR,x0_CU,x0_CV,x0_CY,x0_CZ,x0_DE,x0_DJ,x0_DK,x0_DO,x0_EC,x0_EE,x0_EG,x0_ES,x0_ET,x0_FI,x0_FO,x0_FR,x0_GB,x0_GE,x0_GH,x0_GL,x0_GR,x0_GT,x0_GU,x0_HK,x0_HN,x0_HR,x0_HT,x0_HU,x0_ID,x0_IE,x0_IL,x0_IN,x0_IQ,x0_IS,x0_IT,x0_JM,x0_JO,x0_JP,x0_KE,x0_KH,x0_KR,x0_KW,x0_KZ,x0_LB,x0_LR,x0_LT,x0_LU,x0_LV,x0_MA,x0_MD,x0_ME,x0_MG,x0_ML,x0_MM,x0_MN,x0_MO,x0_MQ,x0_MT,x0_MU,x0_MW,x0_MX,x0_MY,x0_MZ,x0_NC,x0_NG,x0_NI,x0_NL,x0_NO,x0_NP,x0_NZ,x0_PA,x0_PE,x0_PH,x0_PK,x0_PL,x0_PR,x0_PS,x0_PT,x0_RO,x0_RS,x0_RU,x0_RW,x0_SE,x0_SG,x0_SI,x0_SJ,x0_SK,x0_SL,x0_SN,x0_SO,x0_SR,x0_SV,x0_SX,x0_TD,x0_TH,x0_TR,x0_TT,x0_TW,x0_TZ,x0_UA,x0_UG,x0_US,x0_UY,x0_VE,x0_VN,x0_VU,x0_WS,x0_XK,x0_YE,x0_ZA,x0_ZW,x0_nan
0,307103100.0,"""To the things themselves!""","A new dance exploring both my allergy to ""abou...","November 2, 2018 OMG! We're just over halfway ...",We really need your support! Thank you.,[{'rewards': 'Pledge US$ 25 or more\\n\\nAbout...,6,25,1000,dance,9000.0,2018-11-17 04:59:00,US,1,1,https://v2.kickstarter.com/1663805284-vaRunMxL...,2018-10-15 20:59:22,2018-10-09 01:27:56,pledge us 25 or more about s 36 friend a perso...,A new dance exploring both my allergy to about...,November 2 2018 OMG Were just over halfway thr...,We really need your support Thank you,1,0.042075,0.0,0.038161,0.0,0.039854,0.075896,0.0,0.0,0.0,0.0,0.430264,0.0,0.0,0.0,0.0,0.08064,0.0,0.0,0.03802,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.3452,0.14154,0.346071,0.0,0.0,0.0,0.0,0.0,0.0,0.059194,0.14154,0.14154,0.346095,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.14154,0.14154,0.14154,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.079216,0.141489,0.197363,0.109414,0.0,0.061508,0.0,0.0,0.0,0.0,0.0,0.0,0.080546,0.0,0.0,0.154105,0.160769,0.0,0.0,0.0,0.157461,0.112914,0.113068,0.0,0.0,0.175933,0.053498,0.176676,0.15268,0.159475,0.112914,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.62069,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.473705,0.0,0.0,0.484473,0.0,0.394504,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.064879,0.056791,0.0,0.041747,0.0,0.0,0.186771,0.0,0.0,0.070409,0.058061,0.0,0.0,0.115012,0.051346,0.0,0.057194,0.0,0.0,0.0,0.114316,0.062502,0.0,0.055471,0.0,0.117157,0.0,0.0,0.0,0.045298,0.058164,0.114245,0.0,0.043541,0.179142,0.051199,0.199512,0.0,0.120365,0.198849,0.452739,0.147169,0.0,0.088578,0.0,0.050515,0.0,0.0,0.053214,0.079295,0.056525,0.050117,0.122577,0.054432,0.062484,0.044879,0.129701,0.080961,0.055986,0.0,0.0,0.182806,0.0,0.0,0.066572,0.172843,0.125868,0.0,0.0,0.10785,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.059577,0.0,0.098796,0.0,0.0,0.0,0.353198,0.0,0.121133,0.0,0.129023,0.0,0.0,0.0,0.093354,0.048855,0.047485,0.0,0.365195,0.179426,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.66354,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.748141,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.108477,0.505709,0.136364,0.454545,0.2,0.2,-0.0275,0.495,822,8,292,32.333079,6.813495,A new dance exploring both my allergy to about...,19121,10,2018,"(7500.0, 500000.0]",2,9,17,0.529412,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,214319300.0,Journals 1990-2014,How did we get to the new century? Ride the wa...,Many thanks to my backers for getting us to th...,Here are the steps of my process:\r\n\r\nStep ...,[{'rewards': 'Pledge US$ 10 or more\\n\\nAbout...,8,10,900,publishing,5000.0,2015-04-09 14:39:44,US,1,1,https://v2.kickstarter.com/1664643846-VxuMrMK%...,2015-03-16 14:39:44,2015-02-24 17:29:35,pledge us 10 or more about us 10 ebook of jour...,How did we get to the new century Ride the wav...,Many thanks to my backers for getting us to th...,Here are the steps of my process Step 1 Ed...,1,0.0,0.07589,0.155369,0.0,0.0,0.0,0.340467,0.276474,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.054719,0.035445,0.0,0.051598,0.0,0.0,0.139945,0.141701,0.122743,0.064234,0.228864,0.0,0.074507,0.0,0.0,0.0,0.128059,0.0,0.256622,0.0,0.0,0.0,0.0,0.0,0.120501,0.128059,0.128059,0.0,0.256622,0.0,0.0,0.0,0.0,0.0,0.042891,0.0,0.0,0.25654,0.128059,0.128059,0.128059,0.0,0.0,0.0,0.079639,0.0,0.0,0.0,0.053753,0.128013,0.178565,0.222734,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.109311,0.141795,0.141839,0.0,0.0,0.0,0.106237,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.319697,0.0,0.0,0.0,0.0,0.138118,0.122721,0.159086,0.097691,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.798646,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.601801,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.092087,0.048038,0.201778,0.0,0.0,0.0,0.0,0.08102,0.0,0.576408,0.0,0.066172,0.0,0.0,0.0,0.0,0.0,0.0,0.065772,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.140953,0.052124,0.0,0.0,0.098801,0.100205,0.068713,0.058915,0.11479,0.0,0.0,0.0,0.520967,0.056449,0.0,0.0,0.0,0.058128,0.149948,0.058461,0.0,0.045622,0.065044,0.230681,0.0,0.062635,0.0,0.154926,0.099498,0.046581,0.0,0.05536,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.186155,0.069596,0.0,0.0,0.0,0.07223,0.0,0.0,0.0,0.0,0.056842,0.0,0.0,0.0,0.067737,0.094289,0.0,0.0,0.049489,0.0,0.0,0.051297,0.0,0.168652,0.0,0.0,0.052529,0.0,0.111199,0.0,0.143853,0.0,0.0,0.0,0.098083,0.0,0.0,0.0,0.0,0.782397,0.0,0.0,0.0,0.0,0.0,0.115434,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.364527,0.118851,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.087856,0.0,0.0,0.0,0.0,0.0,0.0,0.098281,0.0,0.127986,0.113014,0.0,0.0,0.0,0.0,0.111578,0.122674,0.0,0.0,0.116076,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.098542,0.0,0.0,0.0,0.0,0.10729,0.0,0.108164,0.0,0.089995,0.0,0.114747,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.102122,0.0,0.0,0.0,0.0,0.0,0.0,0.099812,0.0,0.184518,0.0,0.0,0.109238,0.099211,0.164801,0.478153,0.136364,0.454545,0.112629,0.516448,0.126574,0.335648,621,336,369,24.0,19.882049,How did we get to the new century Ride the wav...,17669,3,2015,"(1500.0, 6532.0]",9,37,74,0.5,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,74750640.0,Bailarina Piano,Hemos conseguido poner en marcha el proyecto B...,-¿Te gustaría disfrutar de la mezcla de la dan...,El principal riesgo es el retrasar el proyecto...,[{'rewards': 'Pledge €3 or more\\n\\nAbout S$ ...,8,5,106,music,650.0,2021-05-23 01:36:40,ES,1,0,https://v2.kickstarter.com/1664750650-Kfqx1NI3...,2021-05-03 01:36:40,2021-04-30 22:16:36,pledge 3 or more about s 5 concierto en stream...,Hemos conseguido poner en marcha el proyecto B...,Te gustaría disfrutar de la mezcla de la danza...,El principal riesgo es el retrasar el proyecto...,1,0.0,0.025295,0.0,0.027168,0.054083,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.401266,0.0,0.027358,0.14177,0.112429,0.0,0.0,0.034998,0.0,0.0,0.0,0.0,0.320389,0.0,0.074502,0.034802,0.0,0.0,0.128051,0.0,0.342141,0.0,0.0,0.368251,0.0,0.0,0.0,0.128051,0.128051,0.0,0.342141,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.245563,0.342031,0.128051,0.128051,0.128051,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.128004,0.0,0.0,0.046897,0.0,0.156127,0.029338,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.030682,0.0,0.0,0.01998,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.018755,0.0,0.013787,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.020209,0.0,0.0,0.020352,0.0,0.0,0.037076,0.602525,0.0,0.0,0.473041,0.018319,0.0,0.0,0.0,0.023714,0.040454,0.01496,0.0,0.018865,0.0,0.0,0.039441,0.016909,0.0,0.0,0.039751,0.0,0.0,0.0,0.01859,0.4973,0.0,0.033365,0.043035,0.016778,0.0,0.013094,0.0,0.016551,0.020241,0.017976,0.061906,0.014821,0.0,0.0,0.036979,0.015888,0.020441,0.0,0.0,0.0,0.0,0.019027,0.055424,0.358755,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.048941,0.017025,0.0,0.038369,0.0,0.013531,0.020002,0.017916,0.0,0.0,0.040061,0.014722,0.015415,0.048403,0.015682,0.0,0.045227,0.0,0.0,0.033194,0.027524,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.441967,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.897032,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.37158,0.575664,0.0,0.0,0.0,0.0,0.157185,0.308277,799,29,790,20.0,2.138935,Hemos conseguido poner en marcha el proyecto B...,2892,5,2021,"(0.999, 2500.0]",9,120,138,0.869565,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
3,1946709000.0,Lily Locksmith full length album,Help Lily Locksmith put out her final recordin...,"Lily Locksmith, with her powerful voice, rich ...",The biggest challange here is the time line. I...,[{'rewards': 'Pledge SEK 149 or more\\n\\nAbou...,6,20,2199,music,34000.0,2022-04-14 07:21:20,SE,1,0,https://v2.kickstarter.com/1664734207-Ac%2F11N...,2022-03-20 07:21:20,2022-01-30 12:56:59,pledge sek 149 or more about s 20 cd the lily ...,Help Lily Locksmith put out her final recordin...,Lily Locksmith with her powerful voice rich wi...,The biggest challange here is the time line If...,1,0.019887,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.032074,0.0,0.0,0.0,0.139856,0.0,0.216621,0.0,0.0,0.0,0.0,0.353402,0.02438,0.097481,0.098705,0.085499,0.201346,0.0,0.540795,0.0,0.387898,0.0,0.0,0.066902,0.0,0.0,0.0,0.148557,0.0,0.0,0.0,0.223833,0.066902,0.066902,0.0,0.0,0.0,0.0,0.148557,0.0,0.0,0.0,0.0,0.14968,0.0,0.066902,0.066902,0.066902,0.134619,0.025261,0.025468,0.110949,0.070026,0.0,0.0,0.018721,0.066877,0.0,0.0,0.0,0.0,0.0,0.020437,0.025477,0.025479,0.148533,0.0,0.139595,0.09877,0.098801,0.0,0.0,0.0,0.17267,0.049806,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.096209,0.085483,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.53341,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.845857,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.710235,0.074101,0.051875,0.0,0.0,0.17205,0.050374,0.0,0.0,0.0,0.0,0.051036,0.09114,0.054693,0.152278,0.0,0.099635,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.058086,0.0,0.0,0.0,0.103241,0.050696,0.0,0.038643,0.0,0.0,0.044267,0.0,0.0,0.035296,0.0,0.087075,0.0,0.0,0.0,0.044832,0.0,0.0,0.094454,0.070374,0.0,0.0,0.0,0.0,0.110909,0.079659,0.0,0.035926,0.049687,0.042697,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.051168,0.0,0.0,0.0,0.052853,0.055431,0.0,0.0,0.0,0.0,0.124976,0.0,0.0,0.0,0.0,0.052244,0.145445,0.0,0.0,0.0,0.0,0.0,0.514328,0.0,0.086717,0.12643,0.0,0.0,0.0,0.042882,0.0,0.036983,0.0,0.398091,0.0,0.0,0.0,0.0,0.0,0.324514,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.352524,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.334799,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.67367,0.0,0.0,0.0,0.214521,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.097619,0.438095,0.0,0.5,0.2875,0.669444,0.070194,0.258575,534,38,777,25.0,48.76691,Help Lily Locksmith put out her final recordin...,15712,3,2022,"(7500.0, 1388900.0]",16,78,88,0.886364,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
4,537252400.0,Very Young Composers @ 20!,Help celebrate 20 years of empowering the youn...,"For 20 years now, the Very Young Composers pro...","Live streaming to South Korea, Finland, Venezu...",[{'rewards': 'Pledge US$ 1 or more\\n\\nAbout ...,9,1,1000,music,20000.0,2016-05-06 18:45:32,US,1,1,https://v2.kickstarter.com/1664682609-xfA%2FLS...,2016-04-05 18:45:32,2016-02-24 16:11:49,pledge us 1 or more about s 2 stay curious rec...,Help celebrate 20 years of empowering the youn...,For 20 years now the Very Young Composers prog...,Live streaming to South Korea Finland Venezuel...,1,0.035196,0.031185,0.031923,0.033495,0.033339,0.0,0.0,0.0,0.510872,0.0,0.0,0.0,0.0,0.0,0.0,0.033728,0.043696,0.0,0.031805,0.0,0.0,0.086261,0.087343,0.090789,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.177603,0.0,0.052727,0.0,0.0,0.0454,0.055748,0.0,0.0,0.177603,0.177603,0.0,0.052727,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.05271,0.177603,0.177603,0.177603,0.0,0.0,0.0,0.392712,0.041311,0.0,0.0,0.0,0.177538,0.247648,0.366111,0.0,0.0,0.11549,0.0,0.0,0.0,0.0,0.049874,0.067379,0.087401,0.087428,0.0,0.0,0.0,0.0,0.044073,0.0,0.0,0.0,0.0,0.0,0.049057,0.0,0.221691,0.0,0.0,0.0,0.046013,0.085135,0.090773,0.117671,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.578647,0.0,0.0,0.357578,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.543483,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.491866,0.0,0.0,0.102809,0.0,0.151151,0.0,0.0,0.338116,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.207079,0.0,0.101618,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.078823,0.0,0.0,0.0,0.0,0.2179,0.287985,0.0,0.0,0.0,0.0,0.0,0.091449,0.078635,0.0,0.0,0.215325,0.0,0.0,0.0,0.0,0.33935,0.0,0.469603,0.073283,0.202704,0.0,0.0,0.0,0.0,0.0,0.0,0.104301,0.0,0.0,0.104373,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.093325,0.0,0.0,0.0,0.0,0.0,0.098211,0.077858,0.0,0.1098,0.0,0.0,0.0,0.0,0.12473,0.330561,0.0,0.174942,0.0,0.075438,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.262929,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.26236,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.210996,0.0,0.24589,0.0,0.259116,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.49421,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.32112,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.25673,0.0,0.17123,0.0,0.0,0.0,0.0,0.0,0.0,0.497315,0.0,0.0,0.0,0.166998,0.499051,0.0,0.0,0.01595,0.555092,0.144078,0.34117,426,142,323,31.0,41.106748,Help celebrate 20 years of empowering the youn...,12579,4,2016,"(7500.0, 1388900.0]",9,58,125,0.464,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [30]:
#fuck = pd.read_csv('../kickstarter_train_final_20221021-185107.csv')

In [31]:
fuck.head()

NameError: name 'fuck' is not defined

In [None]:
t = pd.read_csv("/Users/ivankoh/Library/CloudStorage/OneDrive-NationalUniversityofSingapore/1D/NUS Y3S1/BT4222/Data/test/kickstarter_test.csv")
t['rewards']