### Importing Data

In [118]:
import pandas as pd
import nltk
#nltk.download('punkt')

col_list = ['prediction set id', 'membership guid', 'discover question id', 'question id', 'question name', 'rationale', 'comment id', 'answer id', 'answer name', 'created at', 'made after correctness known', 'forecasted probability', 'starting probability', 'final probability', 'answer resolved probability']

data_types = {
    'prediction set id': "Int64",
    'membership guid' : str,
    'discover question id': "Int64",
    'question id': "Int64",
    'question name': str,
    'rationale': str,
    'comment id': "Int64",
    'answer id': "Int64",
    'answer name': str,
    'created at': str,
    'made after correctness known': bool,
    'forecasted probability': float,
    'starting probability': float,
    'final probability': float,
    'answer resolved probability': "Int64"
}

In [141]:
df  = pd.read_csv('HFC_original_files/rct-b-prediction-sets-clean.csv', usecols=col_list, dtype=data_types, keep_default_na=False, na_values=['_'])
df.shape

(629874, 15)

### Removing any forecasts made after correctness already known

In [142]:
df = df[df['made after correctness known'] == False]
df.shape

(622932, 15)

### Removing any rationale under 10 words in length

In [143]:
#get word count
# df['word_count'] = df['rationale'].str.count(' ') + 1
# df

# df['rationale_tokenized'] = df.apply(lambda row: nltk.word_tokenize(row['rationale']), axis=1)
df['rationale_tokenized'] = df['rationale'].apply(lambda x: nltk.word_tokenize(str(x)))
df['word_count'] = df.apply(lambda row: len(row['rationale_tokenized']), axis=1)
df

Unnamed: 0,prediction set id,membership guid,discover question id,question id,question name,rationale,comment id,answer id,answer name,created at,made after correctness known,forecasted probability,starting probability,final probability,answer resolved probability,rationale_tokenized,word_count
0,128323,f7f260757f4bb48afca005debf086c254766079b,499,3469,Will WHO release a Disease Outbreak News (DON)...,"From what I could find, it seems the last real...",130230,9794,Yes,2019-04-03T17:32:41Z,False,0.04,0.5,0.04,0,"[From, what, I, could, find, ,, it, seems, the...",99
1,128324,f7f260757f4bb48afca005debf086c254766079b,513,3343,When will Russia release Michael Calvey?,Since the trial for Calvey has not yet started...,130231,9515,Before 1 May 2019,2019-04-03T17:38:07Z,False,0.00,0.2,0.00,0,"[Since, the, trial, for, Calvey, has, not, yet...",107
2,128324,f7f260757f4bb48afca005debf086c254766079b,513,3343,When will Russia release Michael Calvey?,Since the trial for Calvey has not yet started...,130231,9514,Between 1 May 2019 and 6 June 2019,2019-04-03T17:38:07Z,False,0.00,0.2,0.00,0,"[Since, the, trial, for, Calvey, has, not, yet...",107
3,128324,f7f260757f4bb48afca005debf086c254766079b,513,3343,When will Russia release Michael Calvey?,Since the trial for Calvey has not yet started...,130231,9513,Between 7 June 2019 and 31 August 2019,2019-04-03T17:38:07Z,False,0.05,0.2,0.05,0,"[Since, the, trial, for, Calvey, has, not, yet...",107
4,128324,f7f260757f4bb48afca005debf086c254766079b,513,3343,When will Russia release Michael Calvey?,Since the trial for Calvey has not yet started...,130231,9512,Between 1 September 2019 and 29 November 2019,2019-04-03T17:38:07Z,False,0.05,0.2,0.05,0,"[Since, the, trial, for, Calvey, has, not, yet...",107
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
629869,374454,80cb45bbf0cc6e9e705de3e09abe5e789f4403f3,855,6408,"Between 5 September and 29 November 2019, how ...",,376560,18044,"Between 1 and 10, inclusive",2019-11-29T18:13:07Z,False,0.00,0.0,0.00,0,[],0
629870,374454,80cb45bbf0cc6e9e705de3e09abe5e789f4403f3,855,6408,"Between 5 September and 29 November 2019, how ...",,376560,18045,0,2019-11-29T18:13:07Z,False,0.00,0.0,0.00,0,[],0
629871,374455,80cb45bbf0cc6e9e705de3e09abe5e789f4403f3,802,6156,"Between 15 August 2019 and 29 November 2019, w...",,376561,17233,Yes,2019-11-29T18:14:16Z,False,0.00,0.0,0.00,0,[],0
629872,374456,80cb45bbf0cc6e9e705de3e09abe5e789f4403f3,574,4014,"Before 30 November 2019, will Georgia receive ...",,376562,11257,Yes,2019-11-29T18:16:51Z,False,0.00,0.0,0.00,0,[],0


In [124]:
to_drop = df.loc[df['word_count'] < 10]
to_drop

Unnamed: 0,prediction set id,membership guid,discover question id,question id,question name,rationale,comment id,answer id,answer name,created at,made after correctness known,forecasted probability,starting probability,final probability,answer resolved probability,rationale_tokenized,word_count
680,128609,aaae422a697d7406760a0c99d32b1799f359ca70,511,3361,"Before 30 November 2019, will Libya set a date...",that is how it works,130516,9560,"Yes, both parliamentary and presidential",2019-04-04T16:14:55Z,False,1.0,0.350,0.350,0,"[that, is, how, it, works]",5
681,128609,aaae422a697d7406760a0c99d32b1799f359ca70,511,3361,"Before 30 November 2019, will Libya set a date...",that is how it works,130516,9559,"Yes, only parliamentary",2019-04-04T16:14:55Z,False,0.0,0.150,0.150,0,"[that, is, how, it, works]",5
682,128609,aaae422a697d7406760a0c99d32b1799f359ca70,511,3361,"Before 30 November 2019, will Libya set a date...",that is how it works,130516,9558,"Yes, only presidential",2019-04-04T16:14:55Z,False,0.0,0.125,0.100,0,"[that, is, how, it, works]",5
683,128609,aaae422a697d7406760a0c99d32b1799f359ca70,511,3361,"Before 30 November 2019, will Libya set a date...",that is how it works,130516,9557,No date for either presidential or parliamenta...,2019-04-04T16:14:55Z,False,0.0,0.325,0.300,1,"[that, is, how, it, works]",5
691,128613,aaae422a697d7406760a0c99d32b1799f359ca70,513,3343,When will Russia release Michael Calvey?,according to sources,130520,9515,Before 1 May 2019,2019-04-04T16:18:02Z,False,0.0,0.050,0.035,0,"[according, to, sources]",3
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
629869,374454,80cb45bbf0cc6e9e705de3e09abe5e789f4403f3,855,6408,"Between 5 September and 29 November 2019, how ...",,376560,18044,"Between 1 and 10, inclusive",2019-11-29T18:13:07Z,False,0.0,0.000,0.000,0,[],0
629870,374454,80cb45bbf0cc6e9e705de3e09abe5e789f4403f3,855,6408,"Between 5 September and 29 November 2019, how ...",,376560,18045,0,2019-11-29T18:13:07Z,False,0.0,0.000,0.000,0,[],0
629871,374455,80cb45bbf0cc6e9e705de3e09abe5e789f4403f3,802,6156,"Between 15 August 2019 and 29 November 2019, w...",,376561,17233,Yes,2019-11-29T18:14:16Z,False,0.0,0.000,0.000,0,[],0
629872,374456,80cb45bbf0cc6e9e705de3e09abe5e789f4403f3,574,4014,"Before 30 November 2019, will Georgia receive ...",,376562,11257,Yes,2019-11-29T18:16:51Z,False,0.0,0.000,0.000,0,[],0


In [125]:
#df.drop(df[df.word_count < 10].index, inplace=True)
df1 = df.loc[df["word_count"] >= 10]
df1

Unnamed: 0,prediction set id,membership guid,discover question id,question id,question name,rationale,comment id,answer id,answer name,created at,made after correctness known,forecasted probability,starting probability,final probability,answer resolved probability,rationale_tokenized,word_count
0,128323,f7f260757f4bb48afca005debf086c254766079b,499,3469,Will WHO release a Disease Outbreak News (DON)...,"From what I could find, it seems the last real...",130230,9794,Yes,2019-04-03T17:32:41Z,False,0.04,0.500,0.040,0,"[From, what, I, could, find, ,, it, seems, the...",99
1,128324,f7f260757f4bb48afca005debf086c254766079b,513,3343,When will Russia release Michael Calvey?,Since the trial for Calvey has not yet started...,130231,9515,Before 1 May 2019,2019-04-03T17:38:07Z,False,0.00,0.200,0.000,0,"[Since, the, trial, for, Calvey, has, not, yet...",107
2,128324,f7f260757f4bb48afca005debf086c254766079b,513,3343,When will Russia release Michael Calvey?,Since the trial for Calvey has not yet started...,130231,9514,Between 1 May 2019 and 6 June 2019,2019-04-03T17:38:07Z,False,0.00,0.200,0.000,0,"[Since, the, trial, for, Calvey, has, not, yet...",107
3,128324,f7f260757f4bb48afca005debf086c254766079b,513,3343,When will Russia release Michael Calvey?,Since the trial for Calvey has not yet started...,130231,9513,Between 7 June 2019 and 31 August 2019,2019-04-03T17:38:07Z,False,0.05,0.200,0.050,0,"[Since, the, trial, for, Calvey, has, not, yet...",107
4,128324,f7f260757f4bb48afca005debf086c254766079b,513,3343,When will Russia release Michael Calvey?,Since the trial for Calvey has not yet started...,130231,9512,Between 1 September 2019 and 29 November 2019,2019-04-03T17:38:07Z,False,0.05,0.200,0.050,0,"[Since, the, trial, for, Calvey, has, not, yet...",107
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
196286,207922,cf5a7d5937c97a09c19edcc73a49f59ec71dbe3e,764,5629,What will be the last value of the EURO STOXX ...,markets drifted lower throughout europe on the...,210016,15678,More than 12.9 but less than 14.5,2019-11-29T18:48:45Z,False,1.00,0.300,0.300,,"[markets, drifted, lower, throughout, europe, ...",42
196287,207922,cf5a7d5937c97a09c19edcc73a49f59ec71dbe3e,764,5629,What will be the last value of the EURO STOXX ...,markets drifted lower throughout europe on the...,210016,15677,"Between 14.5 and 16.4, inclusive",2019-11-29T18:48:45Z,False,0.00,0.105,0.105,,"[markets, drifted, lower, throughout, europe, ...",42
196288,207922,cf5a7d5937c97a09c19edcc73a49f59ec71dbe3e,764,5629,What will be the last value of the EURO STOXX ...,markets drifted lower throughout europe on the...,210016,15676,More than 16.4,2019-11-29T18:48:45Z,False,0.00,0.050,0.050,,"[markets, drifted, lower, throughout, europe, ...",42
196289,207923,cf5a7d5937c97a09c19edcc73a49f59ec71dbe3e,907,6925,"Between 24 October 2019 and 29 November 2019, ...",tensions between the two countries are increas...,210017,19244,Yes,2019-11-29T18:52:16Z,False,0.00,0.010,0.010,0,"[tensions, between, the, two, countries, are, ...",48


#### Avg. Word Count

In [126]:
df1['word_count'].mean()

91.20875134764806

In [127]:
# test_df = pd.DataFrame({'rationale': ['I can&#39;t imagine that Boris Johnson will let the whole report get issued', 'I haven&#39;t seen any reports to suggest that a report is coming out in the near term.', 2, 3, 4],

#                    'B': ['a', 'b', 'c', 'd', 'e'],

#                    'C': ['f', 'g', 'h', 'i', 'j']})

In [128]:
# test_df.replace(to_replace={'rationale': "\&\#39\;"}, value='\'', regex=True)
# test_df.loc[:,['rationale']].replace("\&\#39\;", '\'') 

# df1.loc[:,['rationale']].replace("‚Äú", "'")
# df1.loc[:,['rationale']].replace("&quot;", '"')
# df1.loc[:,['rationale']].replace("‚Äô", "'")
# df1.loc[:,['rationale']].replace("¬†", "'")
# df1.loc[:,['rationale']].replace("√≥", "'")

### Aggregate Data

In [129]:
df2 = df1.groupby(['discover question id', 'membership guid', 'question name', 'comment id','created at','rationale']).agg({"forecasted probability": lambda x: list(x),"answer name": lambda y: list(y),"final probability": lambda z: list(z),"answer resolved probability": lambda a: list(a)})
df2

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Unnamed: 5_level_0,forecasted probability,answer name,final probability,answer resolved probability
discover question id,membership guid,question name,comment id,created at,rationale,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
498,0418f0019ccaddb58e983192b4ecc152d35bafa9,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,130983,2019-04-04T17:26:04Z,"It is my belief that battle deaths will continue steady, despite calls from Congress to withdraw American troops from fighting against Al Qaeda militias. American troops are at this time in six different countries one of which is Niger.\n<a target=""_blank"" href=""https://www.usatoday.com/story/opinion/2019/04/04/congress-yemen-war-powers-bernie-sanders-mike-lee-column/3363199002/"">https://www.usatoday.com/story/opinion/2019/04/04/congress-yemen-war-powers-bernie-sanders-mike-lee-column/3363199002/</a>\nHowever, there are several reports that indicate Niger has now called upon Russia to aid them in the battle against the militants. \n<a target=""_blank"" href=""https://www.nytimes.com/2019/03/31/world/africa/russia-military-africa.html"">https://www.nytimes.com/2019/03/31/world/africa/russia-military-africa.html</a>\nFor these reasons, and the fact that Boko Haram continues to ravage the region with attacks, I do believe that Niger will continue to have the average of 15-20 deaths per month and I predict that for the next ten days, there will unfortunately be between 7 and 21 battle deaths.","[0.0, 0.0, 0.37, 0.53, 0.1]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.165, 0.38, 0.175]","[0, 0, 1, 0, 0]"
498,0418f0019ccaddb58e983192b4ecc152d35bafa9,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,132617,2019-04-09T19:26:35Z,"Update: With the forecasting window closing, I will now adjust the percentages on this question. In looking at media reports, there has been several sources reporting the uptick of violence especially in the south-eastern region. According to sources, in the month of March there were about 88 civilian deaths. \n<a target=""_blank"" href=""https://www.unhcr.org/news/briefing/2019/4/5cac53cd4/unhcr-alarmed-upsurge-violence-south-east-niger.html"">https://www.unhcr.org/news/briefing/2019/4/5cac53cd4/unhcr-alarmed-upsurge-violence-south-east-niger.html</a>\nThe continued violence perpetrated by Boko Haram will continue and for that reason, I will adjust my prediction to reflect the fact that there is a higher chance that &quot;More than 21&quot; deaths are possible.","[0.0, 0.0, 0.27, 0.53, 0.2]","[None, Between 1 and 3, inclusive, More than 3...","[0.01, 0.05, 0.15, 0.355, 0.25]","[0, 0, 1, 0, 0]"
498,04abfc2f8a4578134a1e4699dce26d35ec301f07,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,130811,2019-04-04T17:05:33Z,"Based on the historical data from <a target=""_blank"" href=""https://www.acleddata.com/data/#OpenModal3853"">https://www.acleddata.com/data/#OpenModal3853</a> for the number of battle related deaths in Niger this year so far, there is a high chance that the number of deaths between April 4th and 14th will be around 20. This is based on the fact that there were reported 163 deaths in the first three months of this year, which is about 53 per month, or 14 per 10 day average. However, the amount of deaths has been increasing on average, so I think that in this time frame, there will be slightly more than the past average for this year.","[0.05, 0.1, 0.15, 0.4, 0.3]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.25, 0.35, 0.15]","[0, 0, 1, 0, 0]"
498,04abfc2f8a4578134a1e4699dce26d35ec301f07,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,133643,2019-04-11T19:09:37Z,"I am updating my forecast to 3 to 21 deaths because the window between the 4th and the 14th is closing. There has only been 1 reported death on the <a target=""_blank"" href=""https://www.acleddata.com/data/"">https://www.acleddata.com/data/</a> website, and it is highly unlikely that a lot of deaths will occur in the next 4 days. I am leaving my prediction at 50/50 for 3-7 and 7-21 deaths because there is a slight chance that there may be another battle that will result in more than just a couple deaths.","[0.0, 0.0, 0.5, 0.5, 0.0]","[None, Between 1 and 3, inclusive, More than 3...","[0.01, 0.05, 0.2, 0.35, 0.15]","[0, 0, 1, 0, 0]"
498,096257803f653d5a2d3eb0c2e65532cd855f9cd5,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,131936,2019-04-05T02:45:42Z,"Looking at the current number of battle deaths in 2019, there seems to be a steady increase in the monthly rate. My prediction assumes that this increase will remain steady and generate between 7 and 21 deaths in the 10 day period in April. This is especially logical considering the still-ongoing violence in the region and the increased frequency of attack.","[0.05, 0.1, 0.2, 0.45, 0.2]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.15, 0.4, 0.25]","[0, 0, 1, 0, 0]"
...,...,...,...,...,...,...,...,...,...
917,fe7ab4a2e177e69fad599bd3ea642ab5b634dede,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,201592,2019-11-07T19:21:18Z,"In order for the report to be released it has to be signed off by Boris Johnson. Perhaps Johnson is waiting until after the election to ensure the report itself doesn&#39;t affect the outcome of the election. According to sources, Johnson is not mentioned in the report so there must be a different reason. Johnson does not seem to give in to pressure of any kind so I assume he will stick to his word.\n\n<a target=""_blank"" href=""https://www.bloomberg.com/news/articles/2019-11-05/doubts-over-russia-s-u-k-meddling-after-johnson-sits-on-report"">https://www.bloomberg.com/news/articles/2019-11-05/doubts-over-russia-s-u-k-meddling-after-johnson-sits-on-report</a>",[0.0],[Yes],[0.05],[0]
917,fe8829498687a62e749bdb94014fd5712fdd6a60,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,204312,2019-11-16T15:16:14Z,"It is highly unlikely that this report will be seeing the light of day anytime soon. It took nearly 6 months for the report to reach parliament alone. This report could severely damage Boris&#39;s reputation and his chances of winning the up coming election, so there is no way he will let this report come out. With that being said, I do not see this report coming to light before November 30th or even this year.",[0.04],[Yes],[0.05],[0]
917,feba6274eb948e69dfb64b22f534bdc267ae4f9e,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,202355,2019-11-10T22:23:51Z,"Considering that the election is going to happen in the first week of December, Johnson has stated that he will no allow it to be released before the election. He should have released it 10 days after the receipt of the report, which was October 17th, &quot;Downing Street sources stated that was not now expected to happen in time, claiming the sign-off process typically takes six weeks. A No 10 spokesman added: “There are processes reports such as this have to go through before publication, and the committee is well-informed of these.” As like Trump, The parties say that Johnson will not admit there was Russian interference. &quot;Labour and Scottish National party politicians accused No 10 of refusing to recognize the scale of Russian meddling.&quot; The problem is Johnson will not give a good reason why he is not releasing the report, and this has all wondering why. Whatever is going on Johnson is going t fight the release tooth and nail. <a target=""_blank"" href=""https://www.theguardian.com/politics/2019/nov/04/no-10-blocks-russia-eu-referendum-report-until-after-election"">https://www.theguardian.com/politics/2019/nov/04/no-10-blocks-russia-eu-referendum-report-until-after-election</a>",[0.0],[Yes],[0.05],[0]
917,ff5c60b832d4d34ea197c2fd865e5f93ee8f8116,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,203333,2019-11-13T18:21:04Z,"I can&#39;t imagine that Boris Johnson will let the whole report get issued, especially in the next few weeks. He knows that there is some damning information in the report, so he will do everything he can to keep it quiet. The report also required Parliament&#39;s approval before being release, which had to happen before it was dissolved yesterday. I found no reports that the report was okayed by Parliament, so it is highly unlikely it can even be released before a new Parliament is formed next month.",[0.01],[Yes],[0.05],[0]


### Remove any rationale where result was almost certain

In [130]:
df2['final probability'][0:3]

discover question id  membership guid                           question name                                                                              comment id  created at            rationale                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                                  

In [131]:
def return_concensus_count(row):
    counter = 0
    for val in row:
        if val < pow(0.0025,6):
            counter = counter + 1
    return counter

In [132]:
df2['answer_count'] = df2.apply(lambda row: len(row['final probability']), axis=1)
df2['concensus_count'] = df2.apply(lambda row: return_concensus_count(row['final probability']), axis=1)
df2

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Unnamed: 5_level_0,forecasted probability,answer name,final probability,answer resolved probability,answer_count,concensus_count
discover question id,membership guid,question name,comment id,created at,rationale,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1
498,0418f0019ccaddb58e983192b4ecc152d35bafa9,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,130983,2019-04-04T17:26:04Z,"It is my belief that battle deaths will continue steady, despite calls from Congress to withdraw American troops from fighting against Al Qaeda militias. American troops are at this time in six different countries one of which is Niger.\n<a target=""_blank"" href=""https://www.usatoday.com/story/opinion/2019/04/04/congress-yemen-war-powers-bernie-sanders-mike-lee-column/3363199002/"">https://www.usatoday.com/story/opinion/2019/04/04/congress-yemen-war-powers-bernie-sanders-mike-lee-column/3363199002/</a>\nHowever, there are several reports that indicate Niger has now called upon Russia to aid them in the battle against the militants. \n<a target=""_blank"" href=""https://www.nytimes.com/2019/03/31/world/africa/russia-military-africa.html"">https://www.nytimes.com/2019/03/31/world/africa/russia-military-africa.html</a>\nFor these reasons, and the fact that Boko Haram continues to ravage the region with attacks, I do believe that Niger will continue to have the average of 15-20 deaths per month and I predict that for the next ten days, there will unfortunately be between 7 and 21 battle deaths.","[0.0, 0.0, 0.37, 0.53, 0.1]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.165, 0.38, 0.175]","[0, 0, 1, 0, 0]",5,1
498,0418f0019ccaddb58e983192b4ecc152d35bafa9,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,132617,2019-04-09T19:26:35Z,"Update: With the forecasting window closing, I will now adjust the percentages on this question. In looking at media reports, there has been several sources reporting the uptick of violence especially in the south-eastern region. According to sources, in the month of March there were about 88 civilian deaths. \n<a target=""_blank"" href=""https://www.unhcr.org/news/briefing/2019/4/5cac53cd4/unhcr-alarmed-upsurge-violence-south-east-niger.html"">https://www.unhcr.org/news/briefing/2019/4/5cac53cd4/unhcr-alarmed-upsurge-violence-south-east-niger.html</a>\nThe continued violence perpetrated by Boko Haram will continue and for that reason, I will adjust my prediction to reflect the fact that there is a higher chance that &quot;More than 21&quot; deaths are possible.","[0.0, 0.0, 0.27, 0.53, 0.2]","[None, Between 1 and 3, inclusive, More than 3...","[0.01, 0.05, 0.15, 0.355, 0.25]","[0, 0, 1, 0, 0]",5,0
498,04abfc2f8a4578134a1e4699dce26d35ec301f07,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,130811,2019-04-04T17:05:33Z,"Based on the historical data from <a target=""_blank"" href=""https://www.acleddata.com/data/#OpenModal3853"">https://www.acleddata.com/data/#OpenModal3853</a> for the number of battle related deaths in Niger this year so far, there is a high chance that the number of deaths between April 4th and 14th will be around 20. This is based on the fact that there were reported 163 deaths in the first three months of this year, which is about 53 per month, or 14 per 10 day average. However, the amount of deaths has been increasing on average, so I think that in this time frame, there will be slightly more than the past average for this year.","[0.05, 0.1, 0.15, 0.4, 0.3]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.25, 0.35, 0.15]","[0, 0, 1, 0, 0]",5,1
498,04abfc2f8a4578134a1e4699dce26d35ec301f07,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,133643,2019-04-11T19:09:37Z,"I am updating my forecast to 3 to 21 deaths because the window between the 4th and the 14th is closing. There has only been 1 reported death on the <a target=""_blank"" href=""https://www.acleddata.com/data/"">https://www.acleddata.com/data/</a> website, and it is highly unlikely that a lot of deaths will occur in the next 4 days. I am leaving my prediction at 50/50 for 3-7 and 7-21 deaths because there is a slight chance that there may be another battle that will result in more than just a couple deaths.","[0.0, 0.0, 0.5, 0.5, 0.0]","[None, Between 1 and 3, inclusive, More than 3...","[0.01, 0.05, 0.2, 0.35, 0.15]","[0, 0, 1, 0, 0]",5,0
498,096257803f653d5a2d3eb0c2e65532cd855f9cd5,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,131936,2019-04-05T02:45:42Z,"Looking at the current number of battle deaths in 2019, there seems to be a steady increase in the monthly rate. My prediction assumes that this increase will remain steady and generate between 7 and 21 deaths in the 10 day period in April. This is especially logical considering the still-ongoing violence in the region and the increased frequency of attack.","[0.05, 0.1, 0.2, 0.45, 0.2]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.15, 0.4, 0.25]","[0, 0, 1, 0, 0]",5,1
...,...,...,...,...,...,...,...,...,...,...,...
917,fe7ab4a2e177e69fad599bd3ea642ab5b634dede,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,201592,2019-11-07T19:21:18Z,"In order for the report to be released it has to be signed off by Boris Johnson. Perhaps Johnson is waiting until after the election to ensure the report itself doesn&#39;t affect the outcome of the election. According to sources, Johnson is not mentioned in the report so there must be a different reason. Johnson does not seem to give in to pressure of any kind so I assume he will stick to his word.\n\n<a target=""_blank"" href=""https://www.bloomberg.com/news/articles/2019-11-05/doubts-over-russia-s-u-k-meddling-after-johnson-sits-on-report"">https://www.bloomberg.com/news/articles/2019-11-05/doubts-over-russia-s-u-k-meddling-after-johnson-sits-on-report</a>",[0.0],[Yes],[0.05],[0],1,0
917,fe8829498687a62e749bdb94014fd5712fdd6a60,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,204312,2019-11-16T15:16:14Z,"It is highly unlikely that this report will be seeing the light of day anytime soon. It took nearly 6 months for the report to reach parliament alone. This report could severely damage Boris&#39;s reputation and his chances of winning the up coming election, so there is no way he will let this report come out. With that being said, I do not see this report coming to light before November 30th or even this year.",[0.04],[Yes],[0.05],[0],1,0
917,feba6274eb948e69dfb64b22f534bdc267ae4f9e,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,202355,2019-11-10T22:23:51Z,"Considering that the election is going to happen in the first week of December, Johnson has stated that he will no allow it to be released before the election. He should have released it 10 days after the receipt of the report, which was October 17th, &quot;Downing Street sources stated that was not now expected to happen in time, claiming the sign-off process typically takes six weeks. A No 10 spokesman added: “There are processes reports such as this have to go through before publication, and the committee is well-informed of these.” As like Trump, The parties say that Johnson will not admit there was Russian interference. &quot;Labour and Scottish National party politicians accused No 10 of refusing to recognize the scale of Russian meddling.&quot; The problem is Johnson will not give a good reason why he is not releasing the report, and this has all wondering why. Whatever is going on Johnson is going t fight the release tooth and nail. <a target=""_blank"" href=""https://www.theguardian.com/politics/2019/nov/04/no-10-blocks-russia-eu-referendum-report-until-after-election"">https://www.theguardian.com/politics/2019/nov/04/no-10-blocks-russia-eu-referendum-report-until-after-election</a>",[0.0],[Yes],[0.05],[0],1,0
917,ff5c60b832d4d34ea197c2fd865e5f93ee8f8116,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,203333,2019-11-13T18:21:04Z,"I can&#39;t imagine that Boris Johnson will let the whole report get issued, especially in the next few weeks. He knows that there is some damning information in the report, so he will do everything he can to keep it quiet. The report also required Parliament&#39;s approval before being release, which had to happen before it was dissolved yesterday. I found no reports that the report was okayed by Parliament, so it is highly unlikely it can even be released before a new Parliament is formed next month.",[0.01],[Yes],[0.05],[0],1,0


In [133]:
def to_remove(row_len, conc_count):
    if conc_count > 0 and conc_count >= (row_len - 1):
        return 1
    else:
        return 0

In [134]:
df2['remove'] = df2.apply(lambda row: to_remove(row['answer_count'], row['concensus_count']), axis=1)
df2

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Unnamed: 5_level_0,forecasted probability,answer name,final probability,answer resolved probability,answer_count,concensus_count,remove
discover question id,membership guid,question name,comment id,created at,rationale,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
498,0418f0019ccaddb58e983192b4ecc152d35bafa9,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,130983,2019-04-04T17:26:04Z,"It is my belief that battle deaths will continue steady, despite calls from Congress to withdraw American troops from fighting against Al Qaeda militias. American troops are at this time in six different countries one of which is Niger.\n<a target=""_blank"" href=""https://www.usatoday.com/story/opinion/2019/04/04/congress-yemen-war-powers-bernie-sanders-mike-lee-column/3363199002/"">https://www.usatoday.com/story/opinion/2019/04/04/congress-yemen-war-powers-bernie-sanders-mike-lee-column/3363199002/</a>\nHowever, there are several reports that indicate Niger has now called upon Russia to aid them in the battle against the militants. \n<a target=""_blank"" href=""https://www.nytimes.com/2019/03/31/world/africa/russia-military-africa.html"">https://www.nytimes.com/2019/03/31/world/africa/russia-military-africa.html</a>\nFor these reasons, and the fact that Boko Haram continues to ravage the region with attacks, I do believe that Niger will continue to have the average of 15-20 deaths per month and I predict that for the next ten days, there will unfortunately be between 7 and 21 battle deaths.","[0.0, 0.0, 0.37, 0.53, 0.1]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.165, 0.38, 0.175]","[0, 0, 1, 0, 0]",5,1,0
498,0418f0019ccaddb58e983192b4ecc152d35bafa9,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,132617,2019-04-09T19:26:35Z,"Update: With the forecasting window closing, I will now adjust the percentages on this question. In looking at media reports, there has been several sources reporting the uptick of violence especially in the south-eastern region. According to sources, in the month of March there were about 88 civilian deaths. \n<a target=""_blank"" href=""https://www.unhcr.org/news/briefing/2019/4/5cac53cd4/unhcr-alarmed-upsurge-violence-south-east-niger.html"">https://www.unhcr.org/news/briefing/2019/4/5cac53cd4/unhcr-alarmed-upsurge-violence-south-east-niger.html</a>\nThe continued violence perpetrated by Boko Haram will continue and for that reason, I will adjust my prediction to reflect the fact that there is a higher chance that &quot;More than 21&quot; deaths are possible.","[0.0, 0.0, 0.27, 0.53, 0.2]","[None, Between 1 and 3, inclusive, More than 3...","[0.01, 0.05, 0.15, 0.355, 0.25]","[0, 0, 1, 0, 0]",5,0,0
498,04abfc2f8a4578134a1e4699dce26d35ec301f07,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,130811,2019-04-04T17:05:33Z,"Based on the historical data from <a target=""_blank"" href=""https://www.acleddata.com/data/#OpenModal3853"">https://www.acleddata.com/data/#OpenModal3853</a> for the number of battle related deaths in Niger this year so far, there is a high chance that the number of deaths between April 4th and 14th will be around 20. This is based on the fact that there were reported 163 deaths in the first three months of this year, which is about 53 per month, or 14 per 10 day average. However, the amount of deaths has been increasing on average, so I think that in this time frame, there will be slightly more than the past average for this year.","[0.05, 0.1, 0.15, 0.4, 0.3]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.25, 0.35, 0.15]","[0, 0, 1, 0, 0]",5,1,0
498,04abfc2f8a4578134a1e4699dce26d35ec301f07,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,133643,2019-04-11T19:09:37Z,"I am updating my forecast to 3 to 21 deaths because the window between the 4th and the 14th is closing. There has only been 1 reported death on the <a target=""_blank"" href=""https://www.acleddata.com/data/"">https://www.acleddata.com/data/</a> website, and it is highly unlikely that a lot of deaths will occur in the next 4 days. I am leaving my prediction at 50/50 for 3-7 and 7-21 deaths because there is a slight chance that there may be another battle that will result in more than just a couple deaths.","[0.0, 0.0, 0.5, 0.5, 0.0]","[None, Between 1 and 3, inclusive, More than 3...","[0.01, 0.05, 0.2, 0.35, 0.15]","[0, 0, 1, 0, 0]",5,0,0
498,096257803f653d5a2d3eb0c2e65532cd855f9cd5,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,131936,2019-04-05T02:45:42Z,"Looking at the current number of battle deaths in 2019, there seems to be a steady increase in the monthly rate. My prediction assumes that this increase will remain steady and generate between 7 and 21 deaths in the 10 day period in April. This is especially logical considering the still-ongoing violence in the region and the increased frequency of attack.","[0.05, 0.1, 0.2, 0.45, 0.2]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.15, 0.4, 0.25]","[0, 0, 1, 0, 0]",5,1,0
...,...,...,...,...,...,...,...,...,...,...,...,...
917,fe7ab4a2e177e69fad599bd3ea642ab5b634dede,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,201592,2019-11-07T19:21:18Z,"In order for the report to be released it has to be signed off by Boris Johnson. Perhaps Johnson is waiting until after the election to ensure the report itself doesn&#39;t affect the outcome of the election. According to sources, Johnson is not mentioned in the report so there must be a different reason. Johnson does not seem to give in to pressure of any kind so I assume he will stick to his word.\n\n<a target=""_blank"" href=""https://www.bloomberg.com/news/articles/2019-11-05/doubts-over-russia-s-u-k-meddling-after-johnson-sits-on-report"">https://www.bloomberg.com/news/articles/2019-11-05/doubts-over-russia-s-u-k-meddling-after-johnson-sits-on-report</a>",[0.0],[Yes],[0.05],[0],1,0,0
917,fe8829498687a62e749bdb94014fd5712fdd6a60,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,204312,2019-11-16T15:16:14Z,"It is highly unlikely that this report will be seeing the light of day anytime soon. It took nearly 6 months for the report to reach parliament alone. This report could severely damage Boris&#39;s reputation and his chances of winning the up coming election, so there is no way he will let this report come out. With that being said, I do not see this report coming to light before November 30th or even this year.",[0.04],[Yes],[0.05],[0],1,0,0
917,feba6274eb948e69dfb64b22f534bdc267ae4f9e,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,202355,2019-11-10T22:23:51Z,"Considering that the election is going to happen in the first week of December, Johnson has stated that he will no allow it to be released before the election. He should have released it 10 days after the receipt of the report, which was October 17th, &quot;Downing Street sources stated that was not now expected to happen in time, claiming the sign-off process typically takes six weeks. A No 10 spokesman added: “There are processes reports such as this have to go through before publication, and the committee is well-informed of these.” As like Trump, The parties say that Johnson will not admit there was Russian interference. &quot;Labour and Scottish National party politicians accused No 10 of refusing to recognize the scale of Russian meddling.&quot; The problem is Johnson will not give a good reason why he is not releasing the report, and this has all wondering why. Whatever is going on Johnson is going t fight the release tooth and nail. <a target=""_blank"" href=""https://www.theguardian.com/politics/2019/nov/04/no-10-blocks-russia-eu-referendum-report-until-after-election"">https://www.theguardian.com/politics/2019/nov/04/no-10-blocks-russia-eu-referendum-report-until-after-election</a>",[0.0],[Yes],[0.05],[0],1,0,0
917,ff5c60b832d4d34ea197c2fd865e5f93ee8f8116,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,203333,2019-11-13T18:21:04Z,"I can&#39;t imagine that Boris Johnson will let the whole report get issued, especially in the next few weeks. He knows that there is some damning information in the report, so he will do everything he can to keep it quiet. The report also required Parliament&#39;s approval before being release, which had to happen before it was dissolved yesterday. I found no reports that the report was okayed by Parliament, so it is highly unlikely it can even be released before a new Parliament is formed next month.",[0.01],[Yes],[0.05],[0],1,0,0


In [135]:
to_remove = df2.loc[df2["remove"] == 1]
to_remove

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Unnamed: 5_level_0,forecasted probability,answer name,final probability,answer resolved probability,answer_count,concensus_count,remove
discover question id,membership guid,question name,comment id,created at,rationale,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
501,0a19a4523e7accb2d92e2feaac1773d16e7935e0,"What will be the price of diesel in Zimbabwe in the Bulawayo, Renkini market for April 2019?",138081,2019-04-26T06:00:43Z,"There haven&#39;t been any recent petrol related events to have a destabilizing effect on current diesel prices in Zimbabwe. As of the most recent numbers¹, it&#39;s sitting pretty at $3.20, which will comfortably leave it in the $2.75 to $4.00 range. Ahoy, thus have I ordained that it shall be so.\r\n\r\n¹ <a target=""_blank"" href=""https://www.globalpetrolprices.com/Zimbabwe/diesel_prices/"">https://www.globalpetrolprices.com/Zimbabwe/diesel_prices/</a>\r\n\r\n2019/10/07: As of 4/30/2019 price was 3.28.",[0.0],[Less than $1.50],[0.0],[0],1,1,1
501,566e1b15bba95879ee15fffb90866bb48caf7598,"What will be the price of diesel in Zimbabwe in the Bulawayo, Renkini market for April 2019?",137196,2019-04-24T18:59:49Z,"I am updating my prediction since this is ending fairly soon. As of 4/22 the price was at $3.20 (<a target=""_blank"" href=""https://www.globalpetrolprices.com/Zimbabwe/diesel_prices/"">https://www.globalpetrolprices.com/Zimbabwe/diesel_prices/</a>). This article from this morning (<a target=""_blank"" href=""https://bulawayo24.com/index-id-news-sc-national-byo-161155.html"">https://bulawayo24.com/index-id-news-sc-national-byo-161155.html</a>) states that the prices of petrol are still going up while diesel has remained pretty unchanged since the price hikes earlier this year. According to the article, &quot;the Progressive Teachers Union of Zimbabwe dragged [President] Mnangagwa to the High Court, arguing the decision to hike the prices by 150 percent was illegal and unconstitutional. The case is still pending before the High Court.&quot; I don&#39;t see anything really happening to change this in the next week, so since the price of diesel has been very steady in the $2.75 to $4.00 range I am increasing the chances for that and decreasing the rest.","[0.01, 0.0]","[Between $4.00 and $5.50, inclusive, More than...","[0.05, 0.0]","[0, 0]",2,1,1
501,79becec6c259aa89acf495a01c3876983662f59b,"What will be the price of diesel in Zimbabwe in the Bulawayo, Renkini market for April 2019?",131633,2019-04-04T19:17:52Z,"Except for January and February the prices for diesel was between 1-2 dollars, with january and february sitting at 3.03. With the last hurricane that hit Zimbabwe in March, i believe prices will stay higher than normal, until things get back to normal. \n\n<a target=""_blank"" href=""http://fews.net/southern-africa/zimbabwe"">http://fews.net/southern-africa/zimbabwe</a> \n<a target=""_blank"" href=""http://fews.net/content/staple-food-price-data-1995-present"">http://fews.net/content/staple-food-price-data-1995-present</a>","[0.1, 0.25]","[Less than $1.50, Between $1.50 and $2.75, inc...","[0.0, 0.1]","[0, 0]",2,1,1
501,ab3ffa2551e0862aaff113d47361a8ba879ce417,"What will be the price of diesel in Zimbabwe in the Bulawayo, Renkini market for April 2019?",131622,2019-04-04T19:14:19Z,"According to the data, the price of diesel in Zimbabwe in the Bulawayo, Renkini market has been 3.15 for the past few months. Before that it was well under $1.50 for many years. I think most likely the price will continue to be between 2.75 and 4.",[0.2],[Less than $1.50],[0.0],[0],1,1,1
501,c465cf983d2b928abb8e9f85cf1d5433f3c0a83a,"What will be the price of diesel in Zimbabwe in the Bulawayo, Renkini market for April 2019?",132566,2019-04-09T18:41:19Z,"The price of diesel is still at 3.2, and based on what I see happening, will continue to stay around that price. If anything, I think there might be a chance that it could jump higher, given the protests and the shortages. \n\n<a target=""_blank"" href=""https://www.globalpetrolprices.com/Zimbabwe/diesel_prices/"">https://www.globalpetrolprices.com/Zimbabwe/diesel_prices/</a>\n<a target=""_blank"" href=""https://www.zimeye.net/2019/04/07/gvnt-allays-fears-of-fuel-shortage-during-zitf/"">https://www.zimeye.net/2019/04/07/gvnt-allays-fears-of-fuel-shortage-during-zitf/</a>",[0.0],[More than $5.50],[0.0],[0],1,1,1
...,...,...,...,...,...,...,...,...,...,...,...,...
916,648dabe32623e3a9ac5ed55edb11946ad329813d,What will be the daily closing price of Finland's OMX H25 on 29 November 2019?,206266,2019-11-21T18:01:36Z,"This index has a fair amount of fluctuation this year, but currently sits at 4,157 today. Lately it has decreased slightly so I&#39;m leaning towards that to continue or at least stay pretty stagnant. Therefore I think it will likely still be in the 4th range once we get to the 29th.",[0.05],"[Less than 3,887]",[0.0],[0],1,1,1
916,933dad112e57ce3905f1ab26da34c5d09d5d3e86,What will be the daily closing price of Finland's OMX H25 on 29 November 2019?,208752,2019-11-26T20:32:19Z,"At the present moment the price is 4,082. I do not think it will go above 4178 in the next few days. I leave room for a possible drop off under 4076. My true prediction is that the price will remain I the range between 4076 and 4178.\n<a target=""_blank"" href=""https://www.marketwatch.com/investing/index/omxh25?countrycode=xx"">https://www.marketwatch.com/investing/index/omxh25?countrycode=xx</a>","[0.0, 0.0, 0.1]","[Less than 3,887, Between 3,887 and 3,988, inc...","[0.0, 0.0, 0.2]","[0, 0, 1]",3,2,1
916,ab07170c8cf6b1fde1f713513d004ba0bbd81135,What will be the daily closing price of Finland's OMX H25 on 29 November 2019?,207640,2019-11-25T19:55:17Z,"I feel like it won&#39;t move too much from where it is currently. I am updating my forecast to show this.\n\n1. <a target=""_blank"" href=""https://www.google.com/search?q=INDEXNASDAQ:%20OMXH25%C2%A0"">https://www.google.com/search?q=INDEXNASDAQ:%20OMXH25%C2%A0</a>","[0.0, 0.0]","[Less than 3,887, Between 3,887 and 3,988, inc...","[0.0, 0.0]","[0, 0]",2,2,1
916,cc70c338c1df50436abc71e54261f11505424e8b,What will be the daily closing price of Finland's OMX H25 on 29 November 2019?,203324,2019-11-13T18:18:29Z,"According to the last 30 days of trending the price has been rising with little indication of it falling. I think it has a strong chance to rise above the 4,178 marker so I have made my prediction above mirror my feelings. The data I used to make this decision is linked below.\n\n<a target=""_blank"" href=""https://www.google.com/search?q=INDEXNASDAQ:%20OMXH25%C2%A0"">https://www.google.com/search?q=INDEXNASDAQ:%20OMXH25%C2%A0</a>",[0.0],"[Less than 3,887]",[0.0],[0],1,1,1


In [136]:
df3 = df2.loc[df2["remove"] == 0]
df3

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Unnamed: 5_level_0,forecasted probability,answer name,final probability,answer resolved probability,answer_count,concensus_count,remove
discover question id,membership guid,question name,comment id,created at,rationale,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1
498,0418f0019ccaddb58e983192b4ecc152d35bafa9,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,130983,2019-04-04T17:26:04Z,"It is my belief that battle deaths will continue steady, despite calls from Congress to withdraw American troops from fighting against Al Qaeda militias. American troops are at this time in six different countries one of which is Niger.\n<a target=""_blank"" href=""https://www.usatoday.com/story/opinion/2019/04/04/congress-yemen-war-powers-bernie-sanders-mike-lee-column/3363199002/"">https://www.usatoday.com/story/opinion/2019/04/04/congress-yemen-war-powers-bernie-sanders-mike-lee-column/3363199002/</a>\nHowever, there are several reports that indicate Niger has now called upon Russia to aid them in the battle against the militants. \n<a target=""_blank"" href=""https://www.nytimes.com/2019/03/31/world/africa/russia-military-africa.html"">https://www.nytimes.com/2019/03/31/world/africa/russia-military-africa.html</a>\nFor these reasons, and the fact that Boko Haram continues to ravage the region with attacks, I do believe that Niger will continue to have the average of 15-20 deaths per month and I predict that for the next ten days, there will unfortunately be between 7 and 21 battle deaths.","[0.0, 0.0, 0.37, 0.53, 0.1]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.165, 0.38, 0.175]","[0, 0, 1, 0, 0]",5,1,0
498,0418f0019ccaddb58e983192b4ecc152d35bafa9,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,132617,2019-04-09T19:26:35Z,"Update: With the forecasting window closing, I will now adjust the percentages on this question. In looking at media reports, there has been several sources reporting the uptick of violence especially in the south-eastern region. According to sources, in the month of March there were about 88 civilian deaths. \n<a target=""_blank"" href=""https://www.unhcr.org/news/briefing/2019/4/5cac53cd4/unhcr-alarmed-upsurge-violence-south-east-niger.html"">https://www.unhcr.org/news/briefing/2019/4/5cac53cd4/unhcr-alarmed-upsurge-violence-south-east-niger.html</a>\nThe continued violence perpetrated by Boko Haram will continue and for that reason, I will adjust my prediction to reflect the fact that there is a higher chance that &quot;More than 21&quot; deaths are possible.","[0.0, 0.0, 0.27, 0.53, 0.2]","[None, Between 1 and 3, inclusive, More than 3...","[0.01, 0.05, 0.15, 0.355, 0.25]","[0, 0, 1, 0, 0]",5,0,0
498,04abfc2f8a4578134a1e4699dce26d35ec301f07,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,130811,2019-04-04T17:05:33Z,"Based on the historical data from <a target=""_blank"" href=""https://www.acleddata.com/data/#OpenModal3853"">https://www.acleddata.com/data/#OpenModal3853</a> for the number of battle related deaths in Niger this year so far, there is a high chance that the number of deaths between April 4th and 14th will be around 20. This is based on the fact that there were reported 163 deaths in the first three months of this year, which is about 53 per month, or 14 per 10 day average. However, the amount of deaths has been increasing on average, so I think that in this time frame, there will be slightly more than the past average for this year.","[0.05, 0.1, 0.15, 0.4, 0.3]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.25, 0.35, 0.15]","[0, 0, 1, 0, 0]",5,1,0
498,04abfc2f8a4578134a1e4699dce26d35ec301f07,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,133643,2019-04-11T19:09:37Z,"I am updating my forecast to 3 to 21 deaths because the window between the 4th and the 14th is closing. There has only been 1 reported death on the <a target=""_blank"" href=""https://www.acleddata.com/data/"">https://www.acleddata.com/data/</a> website, and it is highly unlikely that a lot of deaths will occur in the next 4 days. I am leaving my prediction at 50/50 for 3-7 and 7-21 deaths because there is a slight chance that there may be another battle that will result in more than just a couple deaths.","[0.0, 0.0, 0.5, 0.5, 0.0]","[None, Between 1 and 3, inclusive, More than 3...","[0.01, 0.05, 0.2, 0.35, 0.15]","[0, 0, 1, 0, 0]",5,0,0
498,096257803f653d5a2d3eb0c2e65532cd855f9cd5,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,131936,2019-04-05T02:45:42Z,"Looking at the current number of battle deaths in 2019, there seems to be a steady increase in the monthly rate. My prediction assumes that this increase will remain steady and generate between 7 and 21 deaths in the 10 day period in April. This is especially logical considering the still-ongoing violence in the region and the increased frequency of attack.","[0.05, 0.1, 0.2, 0.45, 0.2]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.15, 0.4, 0.25]","[0, 0, 1, 0, 0]",5,1,0
...,...,...,...,...,...,...,...,...,...,...,...,...
917,fe7ab4a2e177e69fad599bd3ea642ab5b634dede,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,201592,2019-11-07T19:21:18Z,"In order for the report to be released it has to be signed off by Boris Johnson. Perhaps Johnson is waiting until after the election to ensure the report itself doesn&#39;t affect the outcome of the election. According to sources, Johnson is not mentioned in the report so there must be a different reason. Johnson does not seem to give in to pressure of any kind so I assume he will stick to his word.\n\n<a target=""_blank"" href=""https://www.bloomberg.com/news/articles/2019-11-05/doubts-over-russia-s-u-k-meddling-after-johnson-sits-on-report"">https://www.bloomberg.com/news/articles/2019-11-05/doubts-over-russia-s-u-k-meddling-after-johnson-sits-on-report</a>",[0.0],[Yes],[0.05],[0],1,0,0
917,fe8829498687a62e749bdb94014fd5712fdd6a60,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,204312,2019-11-16T15:16:14Z,"It is highly unlikely that this report will be seeing the light of day anytime soon. It took nearly 6 months for the report to reach parliament alone. This report could severely damage Boris&#39;s reputation and his chances of winning the up coming election, so there is no way he will let this report come out. With that being said, I do not see this report coming to light before November 30th or even this year.",[0.04],[Yes],[0.05],[0],1,0,0
917,feba6274eb948e69dfb64b22f534bdc267ae4f9e,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,202355,2019-11-10T22:23:51Z,"Considering that the election is going to happen in the first week of December, Johnson has stated that he will no allow it to be released before the election. He should have released it 10 days after the receipt of the report, which was October 17th, &quot;Downing Street sources stated that was not now expected to happen in time, claiming the sign-off process typically takes six weeks. A No 10 spokesman added: “There are processes reports such as this have to go through before publication, and the committee is well-informed of these.” As like Trump, The parties say that Johnson will not admit there was Russian interference. &quot;Labour and Scottish National party politicians accused No 10 of refusing to recognize the scale of Russian meddling.&quot; The problem is Johnson will not give a good reason why he is not releasing the report, and this has all wondering why. Whatever is going on Johnson is going t fight the release tooth and nail. <a target=""_blank"" href=""https://www.theguardian.com/politics/2019/nov/04/no-10-blocks-russia-eu-referendum-report-until-after-election"">https://www.theguardian.com/politics/2019/nov/04/no-10-blocks-russia-eu-referendum-report-until-after-election</a>",[0.0],[Yes],[0.05],[0],1,0,0
917,ff5c60b832d4d34ea197c2fd865e5f93ee8f8116,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,203333,2019-11-13T18:21:04Z,"I can&#39;t imagine that Boris Johnson will let the whole report get issued, especially in the next few weeks. He knows that there is some damning information in the report, so he will do everything he can to keep it quiet. The report also required Parliament&#39;s approval before being release, which had to happen before it was dissolved yesterday. I found no reports that the report was okayed by Parliament, so it is highly unlikely it can even be released before a new Parliament is formed next month.",[0.01],[Yes],[0.05],[0],1,0,0


### Calculate Accuracy

In [137]:
def calc_brier(forecast_list, resolution_list):
    pos = 0
    sq_error_list = []
    for forecast in forecast_list:
        sq_error = (forecast - resolution_list[pos])**2
        sq_error_list.append(sq_error)
        pos = pos + 1
    brier = sum(sq_error_list)/len(sq_error_list)
    if len(sq_error_list) == 1:
        brier = brier * 2
    return brier
    

In [138]:
df3['accuracy'] = df3.apply(lambda row: calc_brier(row['forecasted probability'], row['answer resolved probability']), axis=1)

A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df3['accuracy'] = df3.apply(lambda row: calc_brier(row['forecasted probability'], row['answer resolved probability']), axis=1)


In [139]:
df3

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Unnamed: 5_level_0,forecasted probability,answer name,final probability,answer resolved probability,answer_count,concensus_count,remove,accuracy
discover question id,membership guid,question name,comment id,created at,rationale,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1
498,0418f0019ccaddb58e983192b4ecc152d35bafa9,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,130983,2019-04-04T17:26:04Z,"It is my belief that battle deaths will continue steady, despite calls from Congress to withdraw American troops from fighting against Al Qaeda militias. American troops are at this time in six different countries one of which is Niger.\n<a target=""_blank"" href=""https://www.usatoday.com/story/opinion/2019/04/04/congress-yemen-war-powers-bernie-sanders-mike-lee-column/3363199002/"">https://www.usatoday.com/story/opinion/2019/04/04/congress-yemen-war-powers-bernie-sanders-mike-lee-column/3363199002/</a>\nHowever, there are several reports that indicate Niger has now called upon Russia to aid them in the battle against the militants. \n<a target=""_blank"" href=""https://www.nytimes.com/2019/03/31/world/africa/russia-military-africa.html"">https://www.nytimes.com/2019/03/31/world/africa/russia-military-africa.html</a>\nFor these reasons, and the fact that Boko Haram continues to ravage the region with attacks, I do believe that Niger will continue to have the average of 15-20 deaths per month and I predict that for the next ten days, there will unfortunately be between 7 and 21 battle deaths.","[0.0, 0.0, 0.37, 0.53, 0.1]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.165, 0.38, 0.175]","[0, 0, 1, 0, 0]",5,1,0,0.13756
498,0418f0019ccaddb58e983192b4ecc152d35bafa9,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,132617,2019-04-09T19:26:35Z,"Update: With the forecasting window closing, I will now adjust the percentages on this question. In looking at media reports, there has been several sources reporting the uptick of violence especially in the south-eastern region. According to sources, in the month of March there were about 88 civilian deaths. \n<a target=""_blank"" href=""https://www.unhcr.org/news/briefing/2019/4/5cac53cd4/unhcr-alarmed-upsurge-violence-south-east-niger.html"">https://www.unhcr.org/news/briefing/2019/4/5cac53cd4/unhcr-alarmed-upsurge-violence-south-east-niger.html</a>\nThe continued violence perpetrated by Boko Haram will continue and for that reason, I will adjust my prediction to reflect the fact that there is a higher chance that &quot;More than 21&quot; deaths are possible.","[0.0, 0.0, 0.27, 0.53, 0.2]","[None, Between 1 and 3, inclusive, More than 3...","[0.01, 0.05, 0.15, 0.355, 0.25]","[0, 0, 1, 0, 0]",5,0,0,0.17076
498,04abfc2f8a4578134a1e4699dce26d35ec301f07,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,130811,2019-04-04T17:05:33Z,"Based on the historical data from <a target=""_blank"" href=""https://www.acleddata.com/data/#OpenModal3853"">https://www.acleddata.com/data/#OpenModal3853</a> for the number of battle related deaths in Niger this year so far, there is a high chance that the number of deaths between April 4th and 14th will be around 20. This is based on the fact that there were reported 163 deaths in the first three months of this year, which is about 53 per month, or 14 per 10 day average. However, the amount of deaths has been increasing on average, so I think that in this time frame, there will be slightly more than the past average for this year.","[0.05, 0.1, 0.15, 0.4, 0.3]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.25, 0.35, 0.15]","[0, 0, 1, 0, 0]",5,1,0,0.197
498,04abfc2f8a4578134a1e4699dce26d35ec301f07,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,133643,2019-04-11T19:09:37Z,"I am updating my forecast to 3 to 21 deaths because the window between the 4th and the 14th is closing. There has only been 1 reported death on the <a target=""_blank"" href=""https://www.acleddata.com/data/"">https://www.acleddata.com/data/</a> website, and it is highly unlikely that a lot of deaths will occur in the next 4 days. I am leaving my prediction at 50/50 for 3-7 and 7-21 deaths because there is a slight chance that there may be another battle that will result in more than just a couple deaths.","[0.0, 0.0, 0.5, 0.5, 0.0]","[None, Between 1 and 3, inclusive, More than 3...","[0.01, 0.05, 0.2, 0.35, 0.15]","[0, 0, 1, 0, 0]",5,0,0,0.1
498,096257803f653d5a2d3eb0c2e65532cd855f9cd5,How many battle deaths will ACLED record in Niger between 4 April 2019 and 14 April 2019?,131936,2019-04-05T02:45:42Z,"Looking at the current number of battle deaths in 2019, there seems to be a steady increase in the monthly rate. My prediction assumes that this increase will remain steady and generate between 7 and 21 deaths in the 10 day period in April. This is especially logical considering the still-ongoing violence in the region and the increased frequency of attack.","[0.05, 0.1, 0.2, 0.45, 0.2]","[None, Between 1 and 3, inclusive, More than 3...","[0.0, 0.05, 0.15, 0.4, 0.25]","[0, 0, 1, 0, 0]",5,1,0,0.179
...,...,...,...,...,...,...,...,...,...,...,...,...,...
917,fe7ab4a2e177e69fad599bd3ea642ab5b634dede,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,201592,2019-11-07T19:21:18Z,"In order for the report to be released it has to be signed off by Boris Johnson. Perhaps Johnson is waiting until after the election to ensure the report itself doesn&#39;t affect the outcome of the election. According to sources, Johnson is not mentioned in the report so there must be a different reason. Johnson does not seem to give in to pressure of any kind so I assume he will stick to his word.\n\n<a target=""_blank"" href=""https://www.bloomberg.com/news/articles/2019-11-05/doubts-over-russia-s-u-k-meddling-after-johnson-sits-on-report"">https://www.bloomberg.com/news/articles/2019-11-05/doubts-over-russia-s-u-k-meddling-after-johnson-sits-on-report</a>",[0.0],[Yes],[0.05],[0],1,0,0,0.0
917,fe8829498687a62e749bdb94014fd5712fdd6a60,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,204312,2019-11-16T15:16:14Z,"It is highly unlikely that this report will be seeing the light of day anytime soon. It took nearly 6 months for the report to reach parliament alone. This report could severely damage Boris&#39;s reputation and his chances of winning the up coming election, so there is no way he will let this report come out. With that being said, I do not see this report coming to light before November 30th or even this year.",[0.04],[Yes],[0.05],[0],1,0,0,0.0032
917,feba6274eb948e69dfb64b22f534bdc267ae4f9e,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,202355,2019-11-10T22:23:51Z,"Considering that the election is going to happen in the first week of December, Johnson has stated that he will no allow it to be released before the election. He should have released it 10 days after the receipt of the report, which was October 17th, &quot;Downing Street sources stated that was not now expected to happen in time, claiming the sign-off process typically takes six weeks. A No 10 spokesman added: “There are processes reports such as this have to go through before publication, and the committee is well-informed of these.” As like Trump, The parties say that Johnson will not admit there was Russian interference. &quot;Labour and Scottish National party politicians accused No 10 of refusing to recognize the scale of Russian meddling.&quot; The problem is Johnson will not give a good reason why he is not releasing the report, and this has all wondering why. Whatever is going on Johnson is going t fight the release tooth and nail. <a target=""_blank"" href=""https://www.theguardian.com/politics/2019/nov/04/no-10-blocks-russia-eu-referendum-report-until-after-election"">https://www.theguardian.com/politics/2019/nov/04/no-10-blocks-russia-eu-referendum-report-until-after-election</a>",[0.0],[Yes],[0.05],[0],1,0,0,0.0
917,ff5c60b832d4d34ea197c2fd865e5f93ee8f8116,Will the report created by the United Kingdom Parliament's Intelligence and Security Committee on Russian interference in the 2016 Brexit referendum be made public before 30 November 2019?,203333,2019-11-13T18:21:04Z,"I can&#39;t imagine that Boris Johnson will let the whole report get issued, especially in the next few weeks. He knows that there is some damning information in the report, so he will do everything he can to keep it quiet. The report also required Parliament&#39;s approval before being release, which had to happen before it was dissolved yesterday. I found no reports that the report was okayed by Parliament, so it is highly unlikely it can even be released before a new Parliament is formed next month.",[0.01],[Yes],[0.05],[0],1,0,0,0.0002


### Save to csv

In [140]:
df3.to_csv('df3_w_acc.csv')