In [2]:
#https://www.shanelynn.ie/merge-join-dataframes-python-pandas-index-1/

import pandas as pd
import numpy as np
import csv
import matplotlib.pyplot as plt
import seaborn as sns
from datetime import datetime as dt


# Notebook-wide pandas display limits: long sequences, wide text cells and
# tall frames are shown up to these sizes before pandas truncates them.
pd.set_option('display.max_seq_items', 2000)
pd.set_option('display.max_colwidth', 90)
pd.set_option('display.max_rows', 999)

#https://altair-viz.github.io/gallery/errorbars_with_std.html
#import altair as alt
#from vega_datasets import data

# Raw CSV exports, addressed relative to the notebook's working directory.
issues = '../data/issue_all_jabref.csv'
dataIssues = pd.read_csv(issues, sep=',')

pull_request = '../data/pr_all_jabref.csv'
dataPR = pd.read_csv(pull_request, sep=',')
# Second, independent frame with the same PR rows. A later cell gives it the
# issue-style column names, so it must not share data with dataPR; a deep copy
# provides that without parsing the same file a second time.
dataPRIssues = dataPR.copy()

commits = '../data/commits_all_jabref.csv'
# lineterminator='\n' is needed if the file contains '\r' in places: rows are
# then split on '\n' only.
dataCommit = pd.read_csv(commits, sep=',', lineterminator='\n')

In [4]:
# Look at the raw PR export before the next cell renames its columns.
# `df` is an alias of dataPR (not a copy), so in-place changes made to dataPR
# later are visible through `df` as well.
df = dataPR
print(df.shape)
print(df.columns)
# A short preview is enough to check the schema; head(500) would render
# hundreds of rows into the saved notebook (display.max_rows is 999).
df.head(10)

(8446, 7)
Index(['issue_number', 'title', 'author_name', 'author_login', 'created_at',
       'body', 'first_comment_body'],
      dtype='object')


Unnamed: 0,issue_number,title,author_name,author_login,created_at,body,first_comment_body
0,1,New Sorting/Export preferences,,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",
1,2,Basic gradle integration,,simonharrer,2014-03-12T17:35:16Z,This adds basic gradle integration. The project files for Intellij and Eclipse can be ...,
2,3,Some example new Dutch translations via the GitHub web page.,,egonw,2014-03-15T09:33:22Z,,
3,4,Spanish translation update,,jtornero,2014-03-17T21:29:24Z,Three new strings translated.\n,"Even though the other translation files have been updated, I accept this pull request...."
4,5,Update JabRef_in.properties,,was123,2014-03-18T00:02:27Z,Indonesian translation added\n,
5,6,Fixed splash-dev.svg,,olenz,2014-03-19T19:44:35Z,,
6,7,I have implemented 2 features requested in Ticket #841.,,noravanq,2014-03-23T04:53:18Z,"```\nThe user can now specify an arbitrary number of file-link columns in te ""Entry ta...",
7,8,PDF-file metadata: Privacy Filtering all metadata,,adaerr,2014-04-23T12:58:24Z,This pull-request pertains to the addition of metadata to PDF files associated with en...,thx!\n
8,9,Support FindFullText with ACS DOIs,,ansell,2014-05-06T06:36:03Z,Adds a FullTextFinder implementation to transform the ACS DOI redirect URLs to their P...,
9,10,try to fix some obvious bugs about `groups`,,braindevices,2014-05-08T03:14:52Z,"Hi All,\nI just upgraded to 2.10 and I found some bugs immediately.\n1. in the right-c...",After 2.10 the BibtexEntryType.java is changed a lot. The optional fields and required...


In [5]:
# Give the raw exports the column names used by the rest of the notebook and
# drop the columns that are not needed.
#
# Names are assigned by column POSITION, so each list below must have exactly
# one entry per raw column, in file order; None marks a column to drop.
#
# NOTE(review): for the PR export the positional mapping turns the raw column
# `created_at` into '*_Closed_Date' and `first_comment_body` into '*_Comments'
# (see the column Index printed by the previous cell). The new names therefore
# describe a creation date and a first comment - confirm this is intended.
# The issue export is presumably laid out the same way; verify against the file.


def _select_and_rename(frame, names):
    """Return `frame` reduced to the columns named in `names`, renamed by position.

    Parameters
    ----------
    frame : pandas.DataFrame
        Raw table whose columns are addressed by position.
    names : list
        One entry per raw column, in order: the new column name, or None to
        drop that column.

    Returns
    -------
    pandas.DataFrame
        A new frame with only the kept columns. If `frame` already carries
        exactly the kept names (the cell was run before), it is returned
        unchanged so the cell can be re-run safely.

    Raises
    ------
    ValueError
        If the number of raw columns does not match `len(names)`.
    """
    kept_names = [name for name in names if name is not None]
    if list(frame.columns) == kept_names:
        return frame
    if len(frame.columns) != len(names):
        raise ValueError(
            'Length mismatch: frame has %d columns, %d names were given'
            % (len(frame.columns), len(names))
        )
    kept_positions = [pos for pos, name in enumerate(names) if name is not None]
    selected = frame.iloc[:, kept_positions].copy()
    selected.columns = kept_names
    return selected


# Converting float to int: missing issue numbers become 0 so the cast succeeds.
# Skipped once the column has been renamed, i.e. when the cell is re-run.
if 'PR_Number' not in dataIssues.columns:
    dataIssues['issue_number'] = dataIssues['issue_number'].fillna(0).astype(np.int64)

# Commits need only pr/issue number, commit message, commit author and commit date.
# Dropped, in order: sha, additions, deletions, changes, file_list, status, patch_text.
dataCommit = _select_and_rename(
    dataCommit,
    ['PR_Number', None, 'Commit_Message', 'Commit_Author', 'Commit_Date',
     None, None, None, None, None, None],
)

# PRs need only pr/issue number, title, author, date, body and comments.
# The author-name column is empty in this data, so the author login represents
# the author instead.
dataPR = _select_and_rename(
    dataPR,
    ['PR_Number', 'PR_Title', None, 'PR_Author', 'PR_Closed_Date', 'PR_Body', 'PR_Comments'],
)

# Issues need the same fields; the author-name column is empty here as well.
issue_style_names = ['PR_Number', 'Issue_Title', None, 'Issue_Author',
                     'Issue_Closed_Date', 'Issue_Body', 'Issue_Comments']
dataIssues = _select_and_rename(dataIssues, issue_style_names)

# Only necessary if the issues data does not already contain the PRs: the PR
# rows get the issue-style names so they can be stacked with the issues later.
dataPRIssues = _select_and_rename(dataPRIssues, issue_style_names)

In [6]:
# Check the PR table after the renaming cell: shape, column names, first rows.
df = dataPR
print(df.shape)
print(df.columns)
# A short preview is enough here; head(500) would render hundreds of rows into
# the saved notebook (display.max_rows is 999).
df.head(10)

(8446, 6)
Index(['PR_Number', 'PR_Title', 'PR_Author', 'PR_Closed_Date', 'PR_Body',
       'PR_Comments'],
      dtype='object')


Unnamed: 0,PR_Number,PR_Title,PR_Author,PR_Closed_Date,PR_Body,PR_Comments
0,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",
1,2,Basic gradle integration,simonharrer,2014-03-12T17:35:16Z,This adds basic gradle integration. The project files for Intellij and Eclipse can be ...,
2,3,Some example new Dutch translations via the GitHub web page.,egonw,2014-03-15T09:33:22Z,,
3,4,Spanish translation update,jtornero,2014-03-17T21:29:24Z,Three new strings translated.\n,"Even though the other translation files have been updated, I accept this pull request...."
4,5,Update JabRef_in.properties,was123,2014-03-18T00:02:27Z,Indonesian translation added\n,
5,6,Fixed splash-dev.svg,olenz,2014-03-19T19:44:35Z,,
6,7,I have implemented 2 features requested in Ticket #841.,noravanq,2014-03-23T04:53:18Z,"```\nThe user can now specify an arbitrary number of file-link columns in te ""Entry ta...",
7,8,PDF-file metadata: Privacy Filtering all metadata,adaerr,2014-04-23T12:58:24Z,This pull-request pertains to the addition of metadata to PDF files associated with en...,thx!\n
8,9,Support FindFullText with ACS DOIs,ansell,2014-05-06T06:36:03Z,Adds a FullTextFinder implementation to transform the ACS DOI redirect URLs to their P...,
9,10,try to fix some obvious bugs about `groups`,braindevices,2014-05-08T03:14:52Z,"Hi All,\nI just upgraded to 2.10 and I found some bugs immediately.\n1. in the right-c...",After 2.10 the BibtexEntryType.java is changed a lot. The optional fields and required...


In [7]:
# Merging dataframes.
# One row per (PR, commit) pair. The join key is named once; an inner join
# keeps only PR numbers that occur in both the PR table and the commit table.
pull_commit = pd.merge(dataPR, dataCommit, on='PR_Number', how='inner')

# Stack the PR rows (already carrying issue-style column names) on top of the
# issue rows and order the combined table by number.
pull_issue = pd.concat([dataPRIssues, dataIssues], axis=0).sort_values(by='PR_Number')

In [8]:
# Persist both intermediate tables next to the notebook; the row index is not
# written, so the files contain only the data columns.
for frame, filename in ((pull_commit, 'pull_commit.csv'), (pull_issue, 'issues.csv')):
    frame.to_csv(filename, sep=',', encoding='utf-8', index=False)


In [9]:
# Read the two intermediate files back in. From here on `dataIssues` refers to
# the stacked PR + issue table written to issues.csv, not the raw issue export.
data_Issues = './issues.csv'
data_PullCommit = './pull_commit.csv'

dataIssues = pd.read_csv(data_Issues, sep=',')
dataPullCommit = pd.read_csv(data_PullCommit, sep=',')

In [10]:
# Short preview of the stacked PR + issue table; ten rows are enough to check
# the columns without rendering a hundred rows into the saved notebook.
dataIssues.head(10)

Unnamed: 0,PR_Number,Issue_Title,Issue_Author,Issue_Closed_Date,Issue_Body,Issue_Comments
0,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",
1,2,Basic gradle integration,simonharrer,2014-03-12T17:35:16Z,This adds basic gradle integration. The project files for Intellij and Eclipse can be ...,
2,3,Some example new Dutch translations via the GitHub web page.,egonw,2014-03-15T09:33:22Z,,
3,4,Spanish translation update,jtornero,2014-03-17T21:29:24Z,Three new strings translated.\n,"Even though the other translation files have been updated, I accept this pull request...."
4,5,Update JabRef_in.properties,was123,2014-03-18T00:02:27Z,Indonesian translation added\n,
5,6,Fixed splash-dev.svg,olenz,2014-03-19T19:44:35Z,,
6,7,I have implemented 2 features requested in Ticket #841.,noravanq,2014-03-23T04:53:18Z,"```\nThe user can now specify an arbitrary number of file-link columns in te ""Entry ta...",
7,8,PDF-file metadata: Privacy Filtering all metadata,adaerr,2014-04-23T12:58:24Z,This pull-request pertains to the addition of metadata to PDF files associated with en...,thx!\n
8,9,Support FindFullText with ACS DOIs,ansell,2014-05-06T06:36:03Z,Adds a FullTextFinder implementation to transform the ACS DOI redirect URLs to their P...,
9,10,try to fix some obvious bugs about `groups`,braindevices,2014-05-08T03:14:52Z,"Hi All,\nI just upgraded to 2.10 and I found some bugs immediately.\n1. in the right-c...",After 2.10 the BibtexEntryType.java is changed a lot. The optional fields and required...


In [11]:
# Short preview of the PR x commit table; ten rows are enough to check the
# columns without rendering hundreds of rows into the saved notebook.
dataPullCommit.head(10)

Unnamed: 0,PR_Number,PR_Title,PR_Author,PR_Closed_Date,PR_Body,PR_Comments,Commit_Message,Commit_Author,Commit_Date
0,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,"Adding private fields to SQL scripts in order to export/import owner, timestamp, etc.",Igor Steinmacher,2013-10-23T19:13:12Z
1,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New entries translated to pt-BR,Igor Steinmacher,2013-10-23T23:37:02Z
2,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New entries translated to pt-BR,Igor Steinmacher,2013-10-24T19:22:22Z
3,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Adds missing beta 2 separator to the CHANGELOG,Oliver Kopp,2013-10-27T13:14:44Z
4,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Fixes string comparison at SQLUtil,Oliver Kopp,2013-10-27T13:17:00Z
5,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Update Japanese property files,Koji Yokota,2013-10-31T23:33:09Z
6,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Merge branch 'beta_2.10',Oliver Kopp,2013-11-04T08:35:17Z
7,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Merge branch 'master' of ssh://git.code.sf.net/p/jabref/code,Oliver Kopp,2014-02-12T12:09:43Z
8,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Fix GoogleScholarFetcher\n\nthe format of Google has changed and required an updated r...,Andreas Amann,2014-02-11T19:33:38Z
9,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Release of 2.10 beta 3,Oliver Kopp,2014-02-12T12:38:42Z


In [12]:
# Outer join of the issue-style table (left) with the PR x commit table (right)
# on the shared number. indicator=True adds a `_merge` column that records, for
# every row, whether its key was found in both tables or in only one of them.
result = dataIssues.merge(
    dataPullCommit,
    how='outer',
    on='PR_Number',
    indicator=True,
)

In [13]:
# Check the merged table: shape, column names, first rows.
print(result.shape)
print(result.columns)
# A short preview is enough here; head(500) would render hundreds of very wide
# rows into the saved notebook (display.max_rows is 999).
result.head(10)

(52968, 15)
Index(['PR_Number', 'Issue_Title', 'Issue_Author', 'Issue_Closed_Date',
       'Issue_Body', 'Issue_Comments', 'PR_Title', 'PR_Author',
       'PR_Closed_Date', 'PR_Body', 'PR_Comments', 'Commit_Message',
       'Commit_Author', 'Commit_Date', '_merge'],
      dtype='object')


Unnamed: 0,PR_Number,Issue_Title,Issue_Author,Issue_Closed_Date,Issue_Body,Issue_Comments,PR_Title,PR_Author,PR_Closed_Date,PR_Body,PR_Comments,Commit_Message,Commit_Author,Commit_Date,_merge
0,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,"Adding private fields to SQL scripts in order to export/import owner, timestamp, etc.",Igor Steinmacher,2013-10-23T19:13:12Z,both
1,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New entries translated to pt-BR,Igor Steinmacher,2013-10-23T23:37:02Z,both
2,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New entries translated to pt-BR,Igor Steinmacher,2013-10-24T19:22:22Z,both
3,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Adds missing beta 2 separator to the CHANGELOG,Oliver Kopp,2013-10-27T13:14:44Z,both
4,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Fixes string comparison at SQLUtil,Oliver Kopp,2013-10-27T13:17:00Z,both
5,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Update Japanese property files,Koji Yokota,2013-10-31T23:33:09Z,both
6,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Merge branch 'beta_2.10',Oliver Kopp,2013-11-04T08:35:17Z,both
7,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Merge branch 'master' of ssh://git.code.sf.net/p/jabref/code,Oliver Kopp,2014-02-12T12:09:43Z,both
8,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Fix GoogleScholarFetcher\n\nthe format of Google has changed and required an updated r...,Andreas Amann,2014-02-11T19:33:38Z,both
9,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Release of 2.10 beta 3,Oliver Kopp,2014-02-12T12:38:42Z,both


In [14]:
# `_merge` is the indicator column created by the merge; call it `isPR` from
# now on, then count how many rows fall into each indicator category.
result = result.rename(columns={'_merge': 'isPR'})
result['isPR'].value_counts()


isPR
both          48872
left_only      4096
right_only        0
Name: count, dtype: int64

In [15]:
# Turn the merge indicator into a 0/1 flag: 1 when the number was found in both
# joined tables, 0 when it was found in only one of them.
# NOTE(review): a 'left_only' row is any number without a matching row in the
# PR x commit table; presumably that means "plain issue", but a PR without
# commit rows would get 0 as well - confirm.
is_pr_by_merge_flag = {'both': 1, 'left_only': 0, 'right_only':0}
result['isPR'] = result['isPR'].apply(is_pr_by_merge_flag.get)



In [16]:
# Save the merged table without the row index. Comma separator and UTF-8
# encoding are to_csv's defaults, so they are not spelled out.
result.to_csv('merged_Data.csv', index=False)


In [17]:
# Reload the merged table from disk; `data` is the DataFrame used by the
# following cells (comma is read_csv's default separator).
data = pd.read_csv('./merged_Data.csv')


In [18]:
# Sanity check of the reloaded merged table: its dimensions and first rows.
# Only the last expression of a cell is displayed, so the check is limited to
# the shape (printed) and the head (displayed).
print(data.shape)
data.head()

(52968, 15)


Unnamed: 0,PR_Number,Issue_Title,Issue_Author,Issue_Closed_Date,Issue_Body,Issue_Comments,PR_Title,PR_Author,PR_Closed_Date,PR_Body,PR_Comments,Commit_Message,Commit_Author,Commit_Date,isPR
0,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,"Adding private fields to SQL scripts in order to export/import owner, timestamp, etc.",Igor Steinmacher,2013-10-23T19:13:12Z,1
1,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New entries translated to pt-BR,Igor Steinmacher,2013-10-23T23:37:02Z,1
2,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New entries translated to pt-BR,Igor Steinmacher,2013-10-24T19:22:22Z,1
3,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Adds missing beta 2 separator to the CHANGELOG,Oliver Kopp,2013-10-27T13:14:44Z,1
4,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Fixes string comparison at SQLUtil,Oliver Kopp,2013-10-27T13:17:00Z,1


In [19]:
# Number of rows that have no Issue_Closed_Date; used below to validate the filter.
missing_closed = int(data['Issue_Closed_Date'].isna().sum())

# Keep only the rows that have an Issue_Closed_Date. The explicit copy makes
# data_final independent of `data`, so later edits do not trigger
# SettingWithCopyWarning.
# NOTE(review): for rows that come from the PR export, 'Issue_Closed_Date' was
# filled from the raw `created_at` column by the renaming cell, so a non-null
# value may not mean "closed" - confirm before relying on the file name below.
data_final = data[data['Issue_Closed_Date'].notna()].copy()
assert len(data_final) == len(data) - missing_closed

In [20]:
# Save the filtered table without the row index. Comma separator and UTF-8
# encoding are to_csv's defaults, so they are not spelled out.
data_final.to_csv('dataMerged_Final_only_closed.csv', index=False)

In [21]:
# Reload the filtered table from disk; `data` now refers to this filtered
# version (comma is read_csv's default separator).
data = pd.read_csv('./dataMerged_Final_only_closed.csv')

In [23]:
# Short preview of the filtered table; ten rows are enough to check the
# columns without rendering a hundred very wide rows into the saved notebook.
data.head(10)

Unnamed: 0,PR_Number,Issue_Title,Issue_Author,Issue_Closed_Date,Issue_Body,Issue_Comments,PR_Title,PR_Author,PR_Closed_Date,PR_Body,PR_Comments,Commit_Message,Commit_Author,Commit_Date,isPR
0,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,"Adding private fields to SQL scripts in order to export/import owner, timestamp, etc.",Igor Steinmacher,2013-10-23T19:13:12Z,1
1,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New entries translated to pt-BR,Igor Steinmacher,2013-10-23T23:37:02Z,1
2,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New entries translated to pt-BR,Igor Steinmacher,2013-10-24T19:22:22Z,1
3,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Adds missing beta 2 separator to the CHANGELOG,Oliver Kopp,2013-10-27T13:14:44Z,1
4,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Fixes string comparison at SQLUtil,Oliver Kopp,2013-10-27T13:17:00Z,1
5,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Update Japanese property files,Koji Yokota,2013-10-31T23:33:09Z,1
6,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Merge branch 'beta_2.10',Oliver Kopp,2013-11-04T08:35:17Z,1
7,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Merge branch 'master' of ssh://git.code.sf.net/p/jabref/code,Oliver Kopp,2014-02-12T12:09:43Z,1
8,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Fix GoogleScholarFetcher\n\nthe format of Google has changed and required an updated r...,Andreas Amann,2014-02-11T19:33:38Z,1
9,1,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,New Sorting/Export preferences,olenz,2014-03-12T09:26:29Z,"This will add a new ""File Sorting"" Tab to the preferences that allows to exactly speci...",,Release of 2.10 beta 3,Oliver Kopp,2014-02-12T12:38:42Z,1


In [46]:
# Load the table stored in df_merge.csv and display it.
# NOTE(review): no cell visible in this notebook writes df_merge.csv, and the
# recorded output of this cell is a FileNotFoundError - confirm which step
# produces the file and run it first.
teste = './df_merge.csv'
testeMerge = pd.read_csv(teste)  # comma is the default separator
testeMerge

FileNotFoundError: [Errno 2] No such file or directory: './df_merge.csv'

In [12]:
# Show every row of the linked table that belongs to PR 452.
# (Other spot checks used here before: row label 7, PR 4498 and PR 4188.)
belongs_to_pr_452 = testeMerge['PR_Number'].eq(452)
testeMerge[belongs_to_pr_452]

Unnamed: 0,PR_Number,Issue_Title,Issue_Body,Issue_Comments,PR_Comments,Commit_Message,isPR,PR,Issue,Issue_Title_Linked,Issue_Body_Linked,Issue_Comment_Linked,isTrain
452,452,Revise maintable,Complete check and rewrite of MainTable and related classesThis will fix and implement...,=||= Awesome. =||= Before I invest much time to fix it...@JabRef/developers **Are we ...,=||= You could use Collections.singletonList instead. =||= Collections.emptyList =||...,minor changes,1,452.0,315.0,Rating colum has no header description,We should add a description here especially since clicking inside the column always op...,=||= The reason for directly changing the flags convenience for quick changing of fla...,0.0
453,452,Revise maintable,Complete check and rewrite of MainTable and related classesThis will fix and implement...,=||= Awesome. =||= Before I invest much time to fix it...@JabRef/developers **Are we ...,=||= You could use Collections.singletonList instead. =||= Collections.emptyList =||...,minor changes,1,452.0,384.0,Tooltip for title or long field,Adding a tooltip so we know the meaning of each column headtitle (R R Q F P is not obv...,=||= Thanks for your input. This issue is actively discussed among the developers so ...,0.0
454,452,Revise maintable,Complete check and rewrite of MainTable and related classesThis will fix and implement...,=||= Awesome. =||= Before I invest much time to fix it...@JabRef/developers **Are we ...,=||= You could use Collections.singletonList instead. =||= Collections.emptyList =||...,minor changes,1,452.0,443.0,GUI: Clicking on Ranking Col Header switches position of DOI column before/after Entry...,In 3.0 I just discovered a strange behavior:When I click on the Ranking Column Header ...,=||= Confirmed for 3.0 and `master`. =||= Fixed with #452 - changes are available now...,0.0
455,452,Revise maintable,Complete check and rewrite of MainTable and related classesThis will fix and implement...,=||= Awesome. =||= Before I invest much time to fix it...@JabRef/developers **Are we ...,=||= You could use Collections.singletonList instead. =||= Collections.emptyList =||...,minor changes,1,452.0,445.0,Moving ranking column: moved visually but function still in old place,In JabRef 3.0 I moved the ranking column to the end of my entry table using drag and d...,=||= Possibly #443 is related. =||= Fixed with #452 - changes are available now in cu...,0.0
456,452,Revise maintable,Complete check and rewrite of MainTable and related classesThis will fix and implement...,=||= Awesome. =||= Before I invest much time to fix it...@JabRef/developers **Are we ...,=||= You could use Collections.singletonList instead. =||= Collections.emptyList =||...,minor changes,1,452.0,498.0,Open pdf file when clicking pdf icon,,=||= ... is working fine.Seriously you expect us to invest our time for free on somet...,0.0
457,452,Revise maintable,Complete check and rewrite of MainTable and related classesThis will fix and implement...,=||= Awesome. =||= Before I invest much time to fix it...@JabRef/developers **Are we ...,=||= You could use Collections.singletonList instead. =||= Collections.emptyList =||...,minor changes,1,452.0,490.0,Main Table: Right click on DOI field: Allow copying DOI,Currently the popup of DOI allows for clicking the DOI only. It should also be possibl...,=||= On which field? In field editor? See #492 =||= In the main table. At the DOI col...,0.0


In [11]:
# Show every row of the linked table that belongs to PR 677.
belongs_to_pr_677 = testeMerge['PR_Number'].eq(677)
testeMerge[belongs_to_pr_677]

Unnamed: 0,PR_Number,Issue_Title,Issue_Body,Issue_Comments,PR_Comments,Commit_Message,isPR,PR,Issue,Issue_Title_Linked,Issue_Body_Linked,Issue_Comment_Linked,isTrain
681,677,Make BibTex parser more robust against missing newlines,As described in #669 and #621 the parser has some problems when an entry (or preamble)...,=||= :+1: (except my minor comment) =||= Corrected... for some reason the code style ...,=||= Please always use curly braces as this makes the semantics explicit.,Minor code reformatting,1,677.0,669.0,JabRef 3.1/3.2 writes bib file in a format that it will not read,If the @PREAMBLE field is present JabRef 3.1/3.2 omits the newline between that line a...,=||= related #621 =||= @tobiasdiez Is this fixed? =||= @stefan-kolb It will be fixed ...,0.0
682,677,Make BibTex parser more robust against missing newlines,As described in #669 and #621 the parser has some problems when an entry (or preamble)...,=||= :+1: (except my minor comment) =||= Corrected... for some reason the code style ...,=||= Please always use curly braces as this makes the semantics explicit.,Minor code reformatting,1,677.0,621.0,Ver 3.1 comment not written correctly.,I have a file started with bibtex item e.g.1 @ARTICLE{XXXXXX2 author = {XXXXXXXX...,=||= This is not a bug but the exact desired behavior.We only modify entries that hav...,0.0
683,677,Make BibTex parser more robust against missing newlines,As described in #669 and #621 the parser has some problems when an entry (or preamble)...,=||= :+1: (except my minor comment) =||= Corrected... for some reason the code style ...,=||= Please always use curly braces as this makes the semantics explicit.,Minor code reformatting,1,677.0,669.0,JabRef 3.1/3.2 writes bib file in a format that it will not read,If the @PREAMBLE field is present JabRef 3.1/3.2 omits the newline between that line a...,=||= related #621 =||= @tobiasdiez Is this fixed? =||= @stefan-kolb It will be fixed ...,0.0
684,677,Make BibTex parser more robust against missing newlines,As described in #669 and #621 the parser has some problems when an entry (or preamble)...,=||= :+1: (except my minor comment) =||= Corrected... for some reason the code style ...,=||= Please always use curly braces as this makes the semantics explicit.,Minor code reformatting,1,677.0,621.0,Ver 3.1 comment not written correctly.,I have a file started with bibtex item e.g.1 @ARTICLE{XXXXXX2 author = {XXXXXXXX...,=||= This is not a bug but the exact desired behavior.We only modify entries that hav...,0.0
