In [1]:
import pandas as pd

In [2]:
import numpy as np


In [3]:
def set_seed(seed=2022):
    '''Sets the seed of the entire notebook so results are the same every time we run.
    This is for REPRODUCIBILITY.'''
    np.random.seed(seed)
    
    os.environ['PYTHONHASHSEED'] = str(seed)


set_seed(2022)


In [4]:
def train_validate_test_split(df, train_percent=.85, validate_percent=.075, seed = 2022):
    np.random.seed(seed)
    perm = np.random.permutation(df.index)
    m = len(df.index)
    train_end = int(train_percent * m)
    validate_end = int(validate_percent * m) + train_end
    train = df.iloc[perm[:train_end]]
    validate = df.iloc[perm[train_end:validate_end]]
    test = df.iloc[perm[validate_end:]]
    return train, validate, test


In [5]:
def train_test_split(df, train_percent=.8, seed = 2022):
    np.random.seed(seed)
    perm = np.random.permutation(df.index)
    m = len(df.index)
    train_end = int(train_percent * m)
    train = df.iloc[perm[:train_end]]
    test = df.iloc[perm[train_end:]]
    return train, test


In [6]:
data = pd.read_csv("Full_Dataset.csv", index_col=0)


In [7]:
data["class"].value_counts()


Not_TD    586838
TD         80028
Name: class, dtype: int64

In [8]:
TD = data[:80028]


In [10]:
TD

Unnamed: 0,id,type,created_at,repo,repo_url,action,title,labels,body,class
0,2.000892e+10,IssuesEvent,2022-02-01 02:13:09,itchysats/itchysats,https://api.github.com/repos/itchysats/itchysats,opened,Wallet actor does not follow ADR006,tech-debt,- Wallet actor has a connection to electrum vi...,TD
1,2.000928e+10,IssuesEvent,2022-02-01 02:59:01,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,closed,Denormalize ImportMap into Assets and Ephemera,techdebt,The ImportMap should show a tree structure of ...,TD
2,2.000929e+10,IssuesEvent,2022-02-01 03:00:25,microsoft/vscode-jupyter,https://api.github.com/repos/microsoft/vscode-...,closed,notebookAndWebview tests failing,debt engineering,![image.png](https://images.zenhubusercontent....,TD
3,2.000930e+10,IssuesEvent,2022-02-01 03:01:00,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,opened,Revise Ephemera to abstract away from DynamoDB,techdebt,Create utility functions to encapsulate the co...,TD
4,2.000933e+10,IssuesEvent,2022-02-01 03:03:19,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,opened,Revise controlChannel to abstract away from Dy...,techdebt,Create utility functions to encapsulate the co...,TD
...,...,...,...,...,...,...,...,...,...,...
80023,2.000691e+10,IssuesEvent,2022-01-31 23:00:43,microsoft/vscode,https://api.github.com/repos/microsoft/vscode,closed,Consider disallowing importing `workbench/api/...,debt engineering,ref #140874\r\n\r\n* comment out https://githu...,TD
80024,2.000713e+10,IssuesEvent,2022-01-31 23:18:37,Nanomis/lab-agile-planning,https://api.github.com/repos/Nanomis/lab-agile...,closed,Deploy service to the cloud,technical debt,**As a** Service Provider\n **I need** deploy ...,TD
80025,2.000715e+10,IssuesEvent,2022-01-31 23:20:36,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,opened,Denormalize ImportMap into Assets and Ephemera,techdebt,The ImportMap should show a tree structure of ...,TD
80026,2.000718e+10,IssuesEvent,2022-01-31 23:23:21,Nanomis/lab-agile-planning,https://api.github.com/repos/Nanomis/lab-agile...,opened,Deploy service to the cloud (3/5),technical debt,**As a** Service Provider\n **I need** deploy ...,TD


In [11]:
TD['repo'].value_counts()[:25]


department-of-veterans-affairs/va.gov-team    2457
microsoft/vscode                              1694
Microsoft/vscode                              1473
mattermost/mattermost-server                  1094
admitd/vscode                                  946
elastic/kibana                                 807
openfoodfoundation/openfoodnetwork             774
sourcegraph/sourcegraph                        598
admitd/satd_test                               598
envoyproxy/envoy                               564
owncloud/core                                  553
UBC-Thunderbots/Software                       538
metabase/metabase                              499
medic/medic-webapp                             484
huridocs/uwazi                                 447
terraform-providers/terraform-provider-aws     436
openshift/origin                               421
php-coder/mystamps                             405
DataBiosphere/azul                             399
atlasmap/atlasmap              

In [34]:
TD['repo_url'].value_counts()[:25].index


Index(['https://api.github.com/repos/department-of-veterans-affairs/va.gov-team',
       'https://api.github.com/repos/microsoft/vscode',
       'https://api.github.com/repos/Microsoft/vscode',
       'https://api.github.com/repos/mattermost/mattermost-server',
       'https://api.github.com/repos/admitd/vscode',
       'https://api.github.com/repos/elastic/kibana',
       'https://api.github.com/repos/openfoodfoundation/openfoodnetwork',
       'https://api.github.com/repos/sourcegraph/sourcegraph',
       'https://api.github.com/repos/admitd/satd_test',
       'https://api.github.com/repos/envoyproxy/envoy',
       'https://api.github.com/repos/owncloud/core',
       'https://api.github.com/repos/UBC-Thunderbots/Software',
       'https://api.github.com/repos/metabase/metabase',
       'https://api.github.com/repos/medic/medic-webapp',
       'https://api.github.com/repos/huridocs/uwazi',
       'https://api.github.com/repos/terraform-providers/terraform-provider-aws',
       'https:

In [57]:
import requests
from prettytable import PrettyTable

table = PrettyTable()
table.field_names = ["Repository Name", "Created Date", "Updated Date" , "Language", "Stars" , "Forks Count"  , "Watchers" , "Open Issues Count"]


for i in range(30):



    #send get request
    response = requests.get(TD['repo_url'].value_counts()[:30].index[i])

    #get the json data
    data = response.json()
    print(data)
    # print(data["full_name"], data["created_at"], data["updated_at"],
    #       data["language"], data["stargazers_count"], data['size'], data['watchers'], data['open_issues'], data['forks_count'], data['subscribers_count'], data['network_count'])

    print(TD['repo_url'].value_counts()[:30].index[i])
    try:
        name = data["full_name"]
        created_date = data["created_at"]
        updated_date = data["updated_at"]
        

        language = data["language"]

        stars = data["stargazers_count"]

        forks_count = data['forks_count']

        watchers = data['watchers']

        open_issues = data["open_issues"]



        table.add_row([name, created_date,  updated_date ,  language, stars , forks_count , watchers , open_issues])

        print(table)
    
    except:
        continue


{'id': 133843125, 'node_id': 'MDEwOlJlcG9zaXRvcnkxMzM4NDMxMjU=', 'name': 'va.gov-team', 'full_name': 'department-of-veterans-affairs/va.gov-team', 'private': False, 'owner': {'login': 'department-of-veterans-affairs', 'id': 5421563, 'node_id': 'MDEyOk9yZ2FuaXphdGlvbjU0MjE1NjM=', 'avatar_url': 'https://avatars.githubusercontent.com/u/5421563?v=4', 'gravatar_id': '', 'url': 'https://api.github.com/users/department-of-veterans-affairs', 'html_url': 'https://github.com/department-of-veterans-affairs', 'followers_url': 'https://api.github.com/users/department-of-veterans-affairs/followers', 'following_url': 'https://api.github.com/users/department-of-veterans-affairs/following{/other_user}', 'gists_url': 'https://api.github.com/users/department-of-veterans-affairs/gists{/gist_id}', 'starred_url': 'https://api.github.com/users/department-of-veterans-affairs/starred{/owner}{/repo}', 'subscriptions_url': 'https://api.github.com/users/department-of-veterans-affairs/subscriptions', 'organization

In [60]:
def ptable_to_csv(table, filename, headers=True):
    """Save PrettyTable results to a CSV file.

    :param PrettyTable table: Table object to get data from.
    :param str filename: Filepath for the output CSV.
    :param bool headers: Whether to include the header row in the CSV.
    :return: None
    """
    raw = table.get_string()
    data = [tuple(filter(None, map(str.strip, splitline)))
            for line in raw.splitlines()
            for splitline in [line.split('|')] if len(splitline) > 1]
    if table.title is not None:
        data = data[1:]
    if not headers:
        data = data[1:]
    with open(filename, 'w') as f:
        for d in data:
            f.write('{}\n'.format(','.join(d)))


In [61]:
ptable_to_csv(table,  "Top_TD_repos.csv")

In [62]:
table

Repository Name,Created Date,Updated Date,Language,Stars,Forks Count,Watchers,Open Issues Count
department-of-veterans-affairs/va.gov-team,2018-05-17T16:50:38Z,2022-08-23T23:19:59Z,HTML,197,127,197,6685
microsoft/vscode,2015-09-03T20:23:38Z,2022-08-24T11:21:06Z,TypeScript,135726,23195,135726,7585
microsoft/vscode,2015-09-03T20:23:38Z,2022-08-24T11:21:06Z,TypeScript,135726,23195,135726,7585
mattermost/mattermost-server,2015-06-15T06:50:02Z,2022-08-24T09:09:13Z,Go,23701,5630,23701,608
elastic/kibana,2013-01-26T04:00:59Z,2022-08-24T06:51:36Z,TypeScript,17764,7373,17764,9627
openfoodfoundation/openfoodnetwork,2012-10-17T07:56:23Z,2022-08-23T17:37:55Z,Ruby,861,586,861,647
sourcegraph/sourcegraph,2015-08-24T07:27:28Z,2022-08-24T07:48:31Z,Go,6575,809,6575,4450
envoyproxy/envoy,2016-08-08T15:07:24Z,2022-08-24T09:22:09Z,C++,20267,3837,20267,1341
owncloud/core,2012-08-25T10:32:48Z,2022-08-23T00:42:04Z,PHP,7824,2068,7824,404
UBC-Thunderbots/Software,2018-07-15T16:06:15Z,2022-07-09T22:12:26Z,C++,25,68,25,133


In [25]:
sum(TD['repo'].value_counts()[:25])

17362

In [13]:
len(TD['repo'].unique())

6401

In [10]:
TD["label"] = 1


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  TD["label"] = 1


In [12]:
Non_TD = data[80028:]


In [13]:
Non_TD

Unnamed: 0,id,type,created_at,repo,repo_url,action,title,labels,body,class
80028,2.000755e+10,IssuesEvent,2022-02-01 00:00:01,OpenBeta/open-tacos,https://api.github.com/repos/OpenBeta/open-tacos,closed,Missing breadcrumb on climb page,bug,"<img width=""810"" alt=""Screen Shot 2022-01-03 a...",Not_TD
80029,2.000755e+10,IssuesEvent,2022-02-01 00:00:03,BespokeSynth/BespokeSynth,https://api.github.com/repos/BespokeSynth/Besp...,closed,No audio input on macOS,bug,## Describe the bug\r\n\r\nThe audio interface...,Not_TD
80030,2.000755e+10,IssuesEvent,2022-02-01 00:00:20,fritz-marshal/fritz,https://api.github.com/repos/fritz-marshal/fritz,opened,cannot save archival source to any group,bug,**Describe the bug**\r\nWhile trying to save a...,Not_TD
80031,2.000755e+10,IssuesEvent,2022-02-01 00:00:28,PathOfBuildingCommunity/PathOfBuilding,https://api.github.com/repos/PathOfBuildingCom...,closed,Unable to update from 2.11 to 2.13,bug,### Check version\n\n- [X] I'm running the lat...,Not_TD
80032,2.000755e+10,IssuesEvent,2022-02-01 00:00:31,Azure/aks-hci,https://api.github.com/repos/Azure/aks-hci,opened,[BUG] Moc agent log rotation is failing,bug,**Describe the bug**\r\nMoc agents are expecte...,Not_TD
...,...,...,...,...,...,...,...,...,...,...
666861,2.297185e+10,IssuesEvent,2022-07-20 04:27:22,LmeSzinc/AzurLaneAutoScript,https://api.github.com/repos/LmeSzinc/AzurLane...,closed,增加每日主线困难图出击次数选择,wontfix,### 你的功能请求是否与问题有关？\n\n希望可以为每日任务 > 困难图 增加次数选择功能...,Not_TD
666862,2.297200e+10,IssuesEvent,2022-07-20 04:40:38,mrlesmithjr/ansible-manage-lvm,https://api.github.com/repos/mrlesmithjr/ansib...,closed,Need more condition: If disk is not in lvm for...,wontfix,[root@localhost ~]# lsblk \r\nNAME ...,Not_TD
666863,2.297205e+10,IssuesEvent,2022-07-20 04:45:39,wang-xinyu/tensorrtx,https://api.github.com/repos/wang-xinyu/tensorrtx,closed,lenet5 make failed,wontfix,"## Env\r\n\r\n- GPU, RTX1060\r\n- OS, Ubuntu1...",Not_TD
666864,2.297205e+10,IssuesEvent,2022-07-20 04:45:40,wang-xinyu/tensorrtx,https://api.github.com/repos/wang-xinyu/tensorrtx,closed,Low landmark accuracy for retinaface (mnet) af...,wontfix,"## Env\r\n\r\n- GPU, 1080ti\r\n- OS, Ubuntu18....",Not_TD


In [14]:
Non_TD = Non_TD.sample(frac=0.15 , random_state= 2022)


In [15]:
Non_TD

Unnamed: 0,id,type,created_at,repo,repo_url,action,title,labels,body,class
505754,2.204597e+10,IssuesEvent,2022-05-30 01:45:53,FortuneStreetModding/CustomStreetWorldTour,https://api.github.com/repos/FortuneStreetModd...,opened,[Feature Request] Change the Default Save ID o...,enhancement,"Currently, new ROMs of CSWT are saved as STE70...",Not_TD
87779,2.007484e+10,IssuesEvent,2022-02-04 11:29:59,odpi/egeria-connector-xtdb,https://api.github.com/repos/odpi/egeria-conne...,opened,Edge case in searching produces `xtdb.IllegalA...,bug,If running a search that includes _all_ of the...,Not_TD
552041,2.257475e+10,IssuesEvent,2022-06-28 06:06:06,kanisterio/kanister,https://api.github.com/repos/kanisterio/kanister,opened,Validating Webhook should accept TLS cert in K...,enhancement,The validating webhook should accept a TLS cer...,Not_TD
211282,2.160782e+10,IssuesEvent,2022-05-04 06:44:16,debtdao/smart-contracts,https://api.github.com/repos/debtdao/smart-con...,closed,Escrow contract calls accrueInterest which cal...,bug,,Not_TD
600888,2.295756e+10,IssuesEvent,2022-07-19 12:56:11,mobile-shell/mosh,https://api.github.com/repos/mobile-shell/mosh,opened,Support roaming between NAT64 and native IPv4 ...,feature,I've recently noticed that some wifi deploymen...,Not_TD
...,...,...,...,...,...,...,...,...,...,...
269024,2.215739e+10,IssuesEvent,2022-06-04 02:11:19,eclipse-vertx/vert.x,https://api.github.com/repos/eclipse-vertx/vert.x,opened,SimpleConnectionPool leaks streams and connect...,bug,### Problem Description\r\nIn case the origina...,Not_TD
361731,2.025877e+10,IssuesEvent,2022-02-15 03:55:44,Connor2h/pizza-hunt,https://api.github.com/repos/Connor2h/pizza-hunt,closed,"Users can create, read, update, and delete dat...",enhancement,"* As a user, I can create and customize my own...",Not_TD
559654,2.263855e+10,IssuesEvent,2022-06-30 21:53:14,thexaero/open-parties-and-claims,https://api.github.com/repos/thexaero/open-par...,opened,Protect chunks against lightning bolts caused ...,enhancement,,Not_TD
359973,2.024838e+10,IssuesEvent,2022-02-14 15:40:30,hivedb/hive,https://api.github.com/repos/hivedb/hive,opened,Make TypeAdapter.typeId a string,enhancement,It looks like there may be a concern of type a...,Not_TD


In [16]:
Non_TD["label"] = 0


In [17]:
Data = pd.concat([TD,Non_TD] , ignore_index = True)

In [18]:
Data = Data[["body", "class", "label"]]


In [19]:
Data

Unnamed: 0,body,class,label
0,- Wallet actor has a connection to electrum vi...,TD,
1,The ImportMap should show a tree structure of ...,TD,
2,![image.png](https://images.zenhubusercontent....,TD,
3,Create utility functions to encapsulate the co...,TD,
4,Create utility functions to encapsulate the co...,TD,
...,...,...,...
168049,### Problem Description\r\nIn case the origina...,Not_TD,0.0
168050,"* As a user, I can create and customize my own...",Not_TD,0.0
168051,,Not_TD,0.0
168052,It looks like there may be a concern of type a...,Not_TD,0.0


In [20]:
df = Data.drop_duplicates(subset=['body'], keep='last')


In [21]:
df

Unnamed: 0,body,class,label
0,- Wallet actor has a connection to electrum vi...,TD,
2,![image.png](https://images.zenhubusercontent....,TD,
5,"Replace hard-coded `[""TEST""]` asset lists in v...",TD,
6,In @bchen1116 's recent analysis of our ensemb...,TD,
9,**As a** Service provide\r\n **I need** to dep...,TD,
...,...,...,...
168049,### Problem Description\r\nIn case the origina...,Not_TD,0.0
168050,"* As a user, I can create and customize my own...",Not_TD,0.0
168051,,Not_TD,0.0
168052,It looks like there may be a concern of type a...,Not_TD,0.0


In [22]:
df.reset_index(inplace=True)


In [23]:
df["label"].value_counts()


0.0    71216
Name: label, dtype: int64

In [24]:
df

Unnamed: 0,index,body,class,label
0,0,- Wallet actor has a connection to electrum vi...,TD,
1,2,![image.png](https://images.zenhubusercontent....,TD,
2,5,"Replace hard-coded `[""TEST""]` asset lists in v...",TD,
3,6,In @bchen1116 's recent analysis of our ensemb...,TD,
4,9,**As a** Service provide\r\n **I need** to dep...,TD,
...,...,...,...,...
127242,168049,### Problem Description\r\nIn case the origina...,Not_TD,0.0
127243,168050,"* As a user, I can create and customize my own...",Not_TD,0.0
127244,168051,,Not_TD,0.0
127245,168052,It looks like there may be a concern of type a...,Not_TD,0.0


In [25]:
df.drop(columns=["index"], inplace=True)


A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df.drop(columns=["index"], inplace=True)


In [26]:
df["text_body"] = df["body"]


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df["text_body"] = df["body"]


In [31]:
df

Unnamed: 0,body,class,label,text_body
0,- Wallet actor has a connection to electrum vi...,TD,1,- Wallet actor has a connection to electrum vi...
1,![image.png](https://images.zenhubusercontent....,TD,1,![image.png](https://images.zenhubusercontent....
2,"Replace hard-coded `[""TEST""]` asset lists in v...",TD,1,"Replace hard-coded `[""TEST""]` asset lists in v..."
3,In @bchen1116 's recent analysis of our ensemb...,TD,1,In @bchen1116 's recent analysis of our ensemb...
4,**As a** Service provide\r\n **I need** to dep...,TD,1,**As a** Service provide\r\n **I need** to dep...
...,...,...,...,...
127242,### Problem Description\r\nIn case the origina...,Not_TD,0,### Problem Description\r\nIn case the origina...
127243,"* As a user, I can create and customize my own...",Not_TD,0,"* As a user, I can create and customize my own..."
127244,,Not_TD,0,
127245,It looks like there may be a concern of type a...,Not_TD,0,It looks like there may be a concern of type a...


In [27]:
import re
from string import punctuation


In [28]:
def clean_text(text):
    '''Make text lowercase, remove text in square brackets,remove links,remove punctuation
    and remove words containing numbers.'''
    text = str(text).lower()
    text = re.sub('\[.*?\]', '', text)
    text = re.sub('https?://\S+|www\.\S+', '', text)
    text = re.sub('<.*?>+', '', text)
    text = re.sub('[%s]' % re.escape(punctuation), '', text)
    text = re.sub('\n', '', text)
    text = re.sub('\w*\d\w*', '', text)
    return text


In [29]:
df["text"] = df["text_body"].map(clean_text)


A value is trying to be set on a copy of a slice from a DataFrame.
Try using .loc[row_indexer,col_indexer] = value instead

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df["text"] = df["text_body"].map(clean_text)


In [30]:
df = df.sample(frac=1 , random_state=2022)

In [31]:
df

Unnamed: 0,body,class,label,text_body,text
68516,### What happened?\n\nWhen generating a new pr...,Not_TD,0.0,### What happened?\n\nWhen generating a new pr...,what happenedwhen generating a new project th...
76857,### Describe the bug with a clear and concise ...,Not_TD,0.0,### Describe the bug with a clear and concise ...,describe the bug with a clear and concise des...
43354,<!--\r\nThanks for submitting a bug report. Pl...,TD,,<!--\r\nThanks for submitting a bug report. Pl...,\rthanks for submitting a bug report please fi...
108957,"In der Adapterkonfig gibt es einen Button: ""al...",Not_TD,0.0,"In der Adapterkonfig gibt es einen Button: ""al...",in der adapterkonfig gibt es einen button alle...
39873,Testing https://github.com/microsoft/vscode/is...,TD,,Testing https://github.com/microsoft/vscode/is...,testing \r\rmoving opacity from settingitemove...
...,...,...,...,...,...
46769,"Since migrating from tslint, there is no styli...",TD,,"Since migrating from tslint, there is no styli...",since migrating from tslint there is no stylin...
103024,## Summary \r\n\r\nWe mistakenly configured an...,Not_TD,0.0,## Summary \r\n\r\nWe mistakenly configured an...,summary \r\rwe mistakenly configured an inval...
16557,<!--\r\nFILL OUT THE FORM BELOW OR THE ISSUE W...,TD,,<!--\r\nFILL OUT THE FORM BELOW OR THE ISSUE W...,\rfill out the form below or the issue will be...
1244,Creating this ticket per @mjtravers \n\nThere ...,TD,,Creating this ticket per @mjtravers \n\nThere ...,creating this ticket per mjtravers there are s...


In [32]:
df2 = df[["text", "label"]]


In [33]:
df2.reset_index(inplace=True)


In [34]:
df2.drop(columns = ["index"] , inplace = True)

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy
  df2.drop(columns = ["index"] , inplace = True)


In [66]:
df2.to_csv("TD_dataset_clean.csv")

In [68]:
train , test = train_test_split(df2)

In [69]:
train

Unnamed: 0,text,label
68516,let me explain we need to install for example ...,0
76857,currently all the jsonrpc handling between gob...,0
43354,we have allot of conditional statements in the...,1
108957,describe the bugautocrafting high tier essenc...,0
39873,eclipse ide for cc developers on linux\respi...,0
...,...,...
91482,situation\rhello\r i have a step in my wo...,0
77118,is there an existing issue for this i have s...,0
102123,as a developer\ri need to create a travisyml f...,1
48949,describe the solution youd like\r is part of g...,1


In [70]:
test

Unnamed: 0,text,label
52008,this is about\r a typo \r innaccuratemislead...,0
59120,has been deprecated\r\rthe replacement is sup...,1
16734,as a maintainer\ri want to have queries to rmq...,1
7418,what were after\rwe need to consider and desig...,1
69441,since we no longer require them by default for...,1
...,...,...
46769,research the possibility of playing audio whil...,0
103024,this test contains a list of stat names to che...,1
16557,example \r\r\ronchange rawvalues values setval...,0
1244,teknik borcun açıklaması\röğrencinin ders seç...,1


In [35]:
Data = pd.concat([TD,Non_TD] , ignore_index = True)

In [49]:
owncloud_debt = TD[(TD["repo"] == "owncloud/core")]

not_owncloud_debt = Data[(
    Data["repo"] != "owncloud/core")]
owncloud_debt.to_csv("owncloud_debt.csv")
not_owncloud_debt.to_csv("not_owncloud_debt.csv")


In [50]:
owncloud_debt

Unnamed: 0,id,type,created_at,repo,repo_url,action,title,labels,body,class
5031,2.491511e+09,IssuesEvent,2015-01-03 16:08:55,owncloud/core,https://api.github.com/repos/owncloud/core,opened,Refactoring of Provisioning_API,1 - Backlog enhancement - proposed technical debt,Non exhaustive list of improvements: \r\n\r\n ...,TD
5043,2.493007e+09,IssuesEvent,2015-01-05 09:40:31,owncloud/core,https://api.github.com/repos/owncloud/core,opened,Config file is checked multiple times with dif...,technical debt,From https://github.com/owncloud/documentation...,TD
5044,2.493012e+09,IssuesEvent,2015-01-05 09:43:26,owncloud/core,https://api.github.com/repos/owncloud/core,closed,OCP\Config::setUserValue returns false if no r...,bug sev3-medium technical debt,### Steps to reproduce\r\n1. Use OCP\Config::s...,TD
5061,2.497768e+09,IssuesEvent,2015-01-07 10:43:43,owncloud/core,https://api.github.com/repos/owncloud/core,opened,Introduce foreign keys / cascading delete,technical debt,Currently it is quite difficult to keep the da...,TD
5063,2.497880e+09,IssuesEvent,2015-01-07 11:57:35,owncloud/core,https://api.github.com/repos/owncloud/core,closed,escape t() variables by default,5 - To review bug Enhancement Junior Job Secur...,The `escapeHTML()` should be called while repl...,TD
...,...,...,...,...,...,...,...,...,...,...
73633,1.807631e+10,IssuesEvent,2021-09-21 10:16:17,owncloud/core,https://api.github.com/repos/owncloud/core,closed,OCS/cloud/users/ quota differs from WebDAV's,Type:Bug technical debt app:provisioning_api d...,@davigonz discovered just now that #owncloud/a...,TD
73636,1.807727e+10,IssuesEvent,2021-09-21 11:16:13,owncloud/core,https://api.github.com/repos/owncloud/core,closed,LIKE queries do not properly escape special ch...,Type:Bug db:sqlite db:mysql db:postgresql db:o...,While reviewing https://github.com/owncloud/co...,TD
73637,1.807727e+10,IssuesEvent,2021-09-21 11:16:15,owncloud/core,https://api.github.com/repos/owncloud/core,closed,"""federated cloud"" share users are anonymous in...",Type:Bug technical debt feature:federated-clou...,## Steps to reproduce\n1. Share a Folder as pu...,TD
73902,1.820739e+10,IssuesEvent,2021-09-29 15:43:09,owncloud/core,https://api.github.com/repos/owncloud/core,closed,Code style + static analysis,technical debt,"After 10.0.9 is out, we should focus on first ...",TD


In [51]:
not_owncloud_debt

Unnamed: 0,id,type,created_at,repo,repo_url,action,title,labels,body,class,label
0,2.000892e+10,IssuesEvent,2022-02-01 02:13:09,itchysats/itchysats,https://api.github.com/repos/itchysats/itchysats,opened,Wallet actor does not follow ADR006,tech-debt,- Wallet actor has a connection to electrum vi...,TD,
1,2.000928e+10,IssuesEvent,2022-02-01 02:59:01,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,closed,Denormalize ImportMap into Assets and Ephemera,techdebt,The ImportMap should show a tree structure of ...,TD,
2,2.000929e+10,IssuesEvent,2022-02-01 03:00:25,microsoft/vscode-jupyter,https://api.github.com/repos/microsoft/vscode-...,closed,notebookAndWebview tests failing,debt engineering,![image.png](https://images.zenhubusercontent....,TD,
3,2.000930e+10,IssuesEvent,2022-02-01 03:01:00,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,opened,Revise Ephemera to abstract away from DynamoDB,techdebt,Create utility functions to encapsulate the co...,TD,
4,2.000933e+10,IssuesEvent,2022-02-01 03:03:19,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,opened,Revise controlChannel to abstract away from Dy...,techdebt,Create utility functions to encapsulate the co...,TD,
...,...,...,...,...,...,...,...,...,...,...,...
168049,2.215739e+10,IssuesEvent,2022-06-04 02:11:19,eclipse-vertx/vert.x,https://api.github.com/repos/eclipse-vertx/vert.x,opened,SimpleConnectionPool leaks streams and connect...,bug,### Problem Description\r\nIn case the origina...,Not_TD,0.0
168050,2.025877e+10,IssuesEvent,2022-02-15 03:55:44,Connor2h/pizza-hunt,https://api.github.com/repos/Connor2h/pizza-hunt,closed,"Users can create, read, update, and delete dat...",enhancement,"* As a user, I can create and customize my own...",Not_TD,0.0
168051,2.263855e+10,IssuesEvent,2022-06-30 21:53:14,thexaero/open-parties-and-claims,https://api.github.com/repos/thexaero/open-par...,opened,Protect chunks against lightning bolts caused ...,enhancement,,Not_TD,0.0
168052,2.024838e+10,IssuesEvent,2022-02-14 15:40:30,hivedb/hive,https://api.github.com/repos/hivedb/hive,opened,Make TypeAdapter.typeId a string,enhancement,It looks like there may be a concern of type a...,Not_TD,0.0


In [54]:
bcgov_entity_debt = TD[(TD["repo"] == "bcgov/entity")]

not_bcgov_entity_debt = Data[(
    Data["repo"] != "bcgov/entity")]
bcgov_entity_debt.to_csv("bcgov_entity_debt.csv")
not_bcgov_entity_debt.to_csv("not_bcgov_entity_debt.csv")


In [55]:
bcgov_entity_debt

Unnamed: 0,id,type,created_at,repo,repo_url,action,title,labels,body,class
541,2.025191e+10,IssuesEvent,2022-02-14 18:45:53,bcgov/entity,https://api.github.com/repos/bcgov/entity,closed,Create UI: move new FED component to shared li...,ENTITY techdebt,"The ""Incorporation Date Time"" component was or...",TD
543,2.025204e+10,IssuesEvent,2022-02-14 18:53:59,bcgov/entity,https://api.github.com/repos/bcgov/entity,closed,clean up obsolete items in OpenShift,devops ENTITY techdebt Name Request,Some OpenShift projects have left-over (obsole...,TD
545,2.025204e+10,IssuesEvent,2022-02-14 18:54:24,bcgov/entity,https://api.github.com/repos/bcgov/entity,closed,"Enum Implementation for NR Request, Location a...",ENTITY techdebt Name Request,## What is the problem?\t\n* We currently use...,TD
546,2.025206e+10,IssuesEvent,2022-02-14 18:55:05,bcgov/entity,https://api.github.com/repos/bcgov/entity,closed,NameRequest UI components should have IDs and ...,ENTITY techdebt Name Request,_This ticket is related to testing and could t...,TD
547,2.025210e+10,IssuesEvent,2022-02-14 18:57:45,bcgov/entity,https://api.github.com/repos/bcgov/entity,closed,Reduce the amount of CPU's for the NameX Prod POD,NameX devops ENTITY STORY techdebt,We should reduce the amount of resources we’re...,TD
...,...,...,...,...,...,...,...,...,...,...
79292,1.985739e+10,IssuesEvent,2022-01-21 18:56:15,bcgov/entity,https://api.github.com/repos/bcgov/entity,opened,BCRegistry - logout error + unit tests,ENTITY techdebt Assets,Carried over from #10697:\n\n- [ ] fix error l...,TD
79293,1.985740e+10,IssuesEvent,2022-01-21 18:56:58,bcgov/entity,https://api.github.com/repos/bcgov/entity,opened,BCRegistry - logout error + unit tests,ENTITY techdebt Assets,Carried over from #10697:\n\n- [ ] fix error l...,TD
79310,1.986064e+10,IssuesEvent,2022-01-21 23:09:07,bcgov/entity,https://api.github.com/repos/bcgov/entity,opened,Create one-time job to change state of CP's th...,ENTITY techdebt,CP0001880 was dissolved in COBRS and brought o...,TD
79419,1.987569e+10,IssuesEvent,2022-01-23 21:08:10,bcgov/entity,https://api.github.com/repos/bcgov/entity,closed,BCRegistry - logout error + unit tests,ENTITY techdebt Assets,Carried over from #10697:\n\n- [ ] fix error l...,TD


In [52]:
mattermost_debt = TD[(TD["repo"] == "mattermost/mattermost-server")]

not_mattermost_debt = Data[(
    Data["repo"] != "mattermost/mattermost-server")]
mattermost_debt.to_csv("mattermost_debt.csv")
not_mattermost_debt.to_csv("not_mattermost_debt.csv")


In [53]:
mattermost_debt

Unnamed: 0,id,type,created_at,repo,repo_url,action,title,labels,body,class
1312,2.081671e+10,IssuesEvent,2022-03-18 11:06:18,mattermost/mattermost-server,https://api.github.com/repos/mattermost/matter...,closed,Migrate 'components/edit_post_modal' module an...,Difficulty/1:Easy Hacktoberfest Good First Iss...,We are starting to migrate the mattermost-weba...,TD
1720,2.099463e+10,IssuesEvent,2022-03-29 12:31:01,mattermost/mattermost-server,https://api.github.com/repos/mattermost/matter...,closed,Migrate 'components/admin_console/user_autocom...,Difficulty/1:Easy Hacktoberfest Good First Iss...,We are starting to migrate the mattermost-weba...,TD
1728,2.099638e+10,IssuesEvent,2022-03-29 13:49:53,mattermost/mattermost-server,https://api.github.com/repos/mattermost/matter...,closed,Migrate 'components/admin_console/permission_s...,Difficulty/1:Easy Hacktoberfest Good First Iss...,We are starting to migrate the mattermost-weba...,TD
1946,2.109831e+10,IssuesEvent,2022-04-04 12:28:36,mattermost/mattermost-server,https://api.github.com/repos/mattermost/matter...,closed,Migrate 'components/admin_console/jobs' and as...,Difficulty/1:Easy Hacktoberfest Good First Iss...,We are starting to migrate the mattermost-weba...,TD
2083,2.119420e+10,IssuesEvent,2022-04-08 21:21:39,mattermost/mattermost-server,https://api.github.com/repos/mattermost/matter...,closed,Migrate 'components/admin_console/license_sett...,Difficulty/1:Easy Hacktoberfest Good First Iss...,We are starting to migrate the mattermost-weba...,TD
...,...,...,...,...,...,...,...,...,...,...
74632,1.854317e+10,IssuesEvent,2021-10-21 18:34:03,mattermost/mattermost-server,https://api.github.com/repos/mattermost/matter...,closed,Migrate 'components/mfa' and associated tests ...,Difficulty/1:Easy Hacktoberfest Good First Iss...,We are starting to migrate the mattermost-weba...,TD
74695,1.868744e+10,IssuesEvent,2021-11-01 14:05:19,mattermost/mattermost-server,https://api.github.com/repos/mattermost/matter...,closed,Migrate 'components/admin_console/group_settin...,Difficulty/1:Easy Up For Grabs Hacktoberfest G...,We are starting to migrate the mattermost-weba...,TD
74831,1.872233e+10,IssuesEvent,2021-11-03 13:10:57,mattermost/mattermost-server,https://api.github.com/repos/mattermost/matter...,closed,Migrate 'components/reset_status_modal' module...,Difficulty/1:Easy Hacktoberfest Good First Iss...,We are starting to migrate the mattermost-weba...,TD
75289,1.883700e+10,IssuesEvent,2021-11-11 03:00:37,mattermost/mattermost-server,https://api.github.com/repos/mattermost/matter...,closed,Migrate string-refs to functional ones: this.r...,Difficulty/1:Easy Up For Grabs Hacktoberfest H...,## Context:\n\nString references are deprecate...,TD


In [46]:
UBC_thunder_debt = TD[(TD["repo"] == "UBC-Thunderbots/Software")]

not_UBC_thunder_debt = Data[(
    Data["repo"] != "UBC-Thunderbots/Software")]
UBC_thunder_debt.to_csv("UBC_thunder_debt.csv")
not_UBC_thunder_debt.to_csv("not_UBC_thunder_debt.csv")


In [47]:
UBC_thunder_debt

Unnamed: 0,id,type,created_at,repo,repo_url,action,title,labels,body,class
37333,1.046375e+10,IssuesEvent,2019-09-20 21:43:30,UBC-Thunderbots/Software,https://api.github.com/repos/UBC-Thunderbots/S...,opened,"Seperate ""FreeKickPlay"" into ""DirectFreeKickPl...",Est. Difficulty - 7 G2 - Paying Tech Debt,### Description of the task\r\n- Separate dire...,TD
37334,1.046379e+10,IssuesEvent,2019-09-20 21:52:13,UBC-Thunderbots/Software,https://api.github.com/repos/UBC-Thunderbots/S...,opened,Implement Print Operators For The Timestamp An...,Est. Difficulty - 1 G2 - Paying Tech Debt,### Description of the task\r\nSee title. Gene...,TD
37335,1.046380e+10,IssuesEvent,2019-09-20 21:55:54,UBC-Thunderbots/Software,https://api.github.com/repos/UBC-Thunderbots/S...,opened,Redesign PassGenerator To Be Deterministic,Est. Difficulty - 13 G2 - Paying Tech Debt,"### Description of the task\r\nCurrently, `Pas...",TD
37336,1.046384e+10,IssuesEvent,2019-09-20 22:03:12,UBC-Thunderbots/Software,https://api.github.com/repos/UBC-Thunderbots/S...,opened,"Review All Usages Of ""loop_forever"" in Tactics...",Est. Difficulty - 3 G2 - Paying Tech Debt,### Description of the task\r\nReview all usag...,TD
37337,1.046388e+10,IssuesEvent,2019-09-20 22:13:08,UBC-Thunderbots/Software,https://api.github.com/repos/UBC-Thunderbots/S...,opened,Design A Super Simple Test Framework / Simulat...,Est. Difficulty - 7 G2 - Paying Tech Debt T - ...,### Description of the task\r\nCurrently we ha...,TD
...,...,...,...,...,...,...,...,...,...,...
54549,1.354754e+10,IssuesEvent,2020-09-17 04:24:40,UBC-Thunderbots/Software,https://api.github.com/repos/UBC-Thunderbots/S...,closed,Update GenericFactory To Use A Function To Get...,Difficulty - 7 G2 - Paying Tech Debt,"### Description of the task\r\nCurrently, the ...",TD
54601,1.356137e+10,IssuesEvent,2020-09-18 04:21:45,UBC-Thunderbots/Software,https://api.github.com/repos/UBC-Thunderbots/S...,closed,Add start()/stop() methods to the PassGenerator,Difficulty - 7 G2 - Paying Tech Debt,<!--\r\n Make sure to complete the followin...,TD
54602,1.356147e+10,IssuesEvent,2020-09-18 04:38:26,UBC-Thunderbots/Software,https://api.github.com/repos/UBC-Thunderbots/S...,closed,STP: General Cleanup List,Difficulty - 21 G2 - Paying Tech Debt G9 - Pla...,### Description of the task\r\n\r\n<!--\r\n ...,TD
54669,1.357212e+10,IssuesEvent,2020-09-18 23:09:32,UBC-Thunderbots/Software,https://api.github.com/repos/UBC-Thunderbots/S...,closed,Simulator: Make sure dribbler doesn't affect k...,Difficulty - 3 G2 - Paying Tech Debt T - Maint...,### Description of the task\r\n\r\n<!--\r\n ...,TD


In [48]:
not_UBC_thunder_debt


Unnamed: 0,id,type,created_at,repo,repo_url,action,title,labels,body,class,label
0,2.000892e+10,IssuesEvent,2022-02-01 02:13:09,itchysats/itchysats,https://api.github.com/repos/itchysats/itchysats,opened,Wallet actor does not follow ADR006,tech-debt,- Wallet actor has a connection to electrum vi...,TD,
1,2.000928e+10,IssuesEvent,2022-02-01 02:59:01,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,closed,Denormalize ImportMap into Assets and Ephemera,techdebt,The ImportMap should show a tree structure of ...,TD,
2,2.000929e+10,IssuesEvent,2022-02-01 03:00:25,microsoft/vscode-jupyter,https://api.github.com/repos/microsoft/vscode-...,closed,notebookAndWebview tests failing,debt engineering,![image.png](https://images.zenhubusercontent....,TD,
3,2.000930e+10,IssuesEvent,2022-02-01 03:01:00,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,opened,Revise Ephemera to abstract away from DynamoDB,techdebt,Create utility functions to encapsulate the co...,TD,
4,2.000933e+10,IssuesEvent,2022-02-01 03:03:19,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,opened,Revise controlChannel to abstract away from Dy...,techdebt,Create utility functions to encapsulate the co...,TD,
...,...,...,...,...,...,...,...,...,...,...,...
168049,2.215739e+10,IssuesEvent,2022-06-04 02:11:19,eclipse-vertx/vert.x,https://api.github.com/repos/eclipse-vertx/vert.x,opened,SimpleConnectionPool leaks streams and connect...,bug,### Problem Description\r\nIn case the origina...,Not_TD,0.0
168050,2.025877e+10,IssuesEvent,2022-02-15 03:55:44,Connor2h/pizza-hunt,https://api.github.com/repos/Connor2h/pizza-hunt,closed,"Users can create, read, update, and delete dat...",enhancement,"* As a user, I can create and customize my own...",Not_TD,0.0
168051,2.263855e+10,IssuesEvent,2022-06-30 21:53:14,thexaero/open-parties-and-claims,https://api.github.com/repos/thexaero/open-par...,opened,Protect chunks against lightning bolts caused ...,enhancement,,Not_TD,0.0
168052,2.024838e+10,IssuesEvent,2022-02-14 15:40:30,hivedb/hive,https://api.github.com/repos/hivedb/hive,opened,Make TypeAdapter.typeId a string,enhancement,It looks like there may be a concern of type a...,Not_TD,0.0


In [43]:
apache_traffic_debt = TD[(TD["repo"] == "apache/trafficcontrol")]

not_apache_traffic_debt = Data[(
    Data["repo"] != "apache/trafficcontrol")]
apache_traffic_debt.to_csv("apache_traffic_debt.csv")
not_apache_traffic_debt.to_csv("not_apache_traffic_debt.csv")


In [44]:
apache_traffic_debt

Unnamed: 0,id,type,created_at,repo,repo_url,action,title,labels,body,class
1656,2.097965e+10,IssuesEvent,2022-03-28 18:33:54,apache/trafficcontrol,https://api.github.com/repos/apache/trafficcon...,opened,Remove Traffic Ops APIv2,Traffic Ops tech debt improvement,"## This Improvement request (usability, perfor...",TD
1657,2.097969e+10,IssuesEvent,2022-03-28 18:36:12,apache/trafficcontrol,https://api.github.com/repos/apache/trafficcon...,opened,Squash database migrations,Traffic Ops tech debt database improvement,"## This Improvement request (usability, perfor...",TD
1674,2.098324e+10,IssuesEvent,2022-03-28 22:28:29,apache/trafficcontrol,https://api.github.com/repos/apache/trafficcon...,closed,Reduce Traffic Monitor dependency on CRConfig ...,Traffic Ops Traffic Monitor tech debt medium i...,"## This Improvement request (usability, perfor...",TD
3239,2.194388e+10,IssuesEvent,2022-05-23 21:16:55,apache/trafficcontrol,https://api.github.com/repos/apache/trafficcon...,closed,Remove `user` JSON object wrapper from `user/c...,low impact tech debt Traffic Ops API Next impr...,\r\n<!-- Do not submit security vulnerabilitie...,TD
3939,2.233772e+10,IssuesEvent,2022-06-14 20:17:28,apache/trafficcontrol,https://api.github.com/repos/apache/trafficcon...,opened,Remove infrastructure/docker cruft,low impact tech debt tools low effort,## This tech debt affects these Traffic Contro...,TD
...,...,...,...,...,...,...,...,...,...,...
78605,1.966748e+10,IssuesEvent,2022-01-11 01:01:55,apache/trafficcontrol,https://api.github.com/repos/apache/trafficcon...,opened,Update Cache Stats table to use AG-Grid instea...,Traffic Portal tech debt improvement,"## This Improvement request (usability, perfor...",TD
78606,1.966749e+10,IssuesEvent,2022-01-11 01:02:36,apache/trafficcontrol,https://api.github.com/repos/apache/trafficcon...,opened,Update Delivery Service URL Signature Keys tab...,Traffic Portal tech debt improvement,"## This Improvement request (usability, perfor...",TD
78883,1.974518e+10,IssuesEvent,2022-01-14 18:07:07,apache/trafficcontrol,https://api.github.com/repos/apache/trafficcon...,closed,Deprecate/remove /capabilities TO API endpoint,Traffic Ops documentation tech debt medium imp...,"## This Improvement request (usability, perfor...",TD
79064,1.979683e+10,IssuesEvent,2022-01-18 17:22:36,apache/trafficcontrol,https://api.github.com/repos/apache/trafficcon...,closed,Document Traffic Router API Fully,Traffic Router documentation tech debt medium ...,The TR API has docs: https://traffic-control-c...,TD


In [45]:
not_apache_traffic_debt

Unnamed: 0,id,type,created_at,repo,repo_url,action,title,labels,body,class,label
0,2.000892e+10,IssuesEvent,2022-02-01 02:13:09,itchysats/itchysats,https://api.github.com/repos/itchysats/itchysats,opened,Wallet actor does not follow ADR006,tech-debt,- Wallet actor has a connection to electrum vi...,TD,
1,2.000928e+10,IssuesEvent,2022-02-01 02:59:01,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,closed,Denormalize ImportMap into Assets and Ephemera,techdebt,The ImportMap should show a tree structure of ...,TD,
2,2.000929e+10,IssuesEvent,2022-02-01 03:00:25,microsoft/vscode-jupyter,https://api.github.com/repos/microsoft/vscode-...,closed,notebookAndWebview tests failing,debt engineering,![image.png](https://images.zenhubusercontent....,TD,
3,2.000930e+10,IssuesEvent,2022-02-01 03:01:00,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,opened,Revise Ephemera to abstract away from DynamoDB,techdebt,Create utility functions to encapsulate the co...,TD,
4,2.000933e+10,IssuesEvent,2022-02-01 03:03:19,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,opened,Revise controlChannel to abstract away from Dy...,techdebt,Create utility functions to encapsulate the co...,TD,
...,...,...,...,...,...,...,...,...,...,...,...
168049,2.215739e+10,IssuesEvent,2022-06-04 02:11:19,eclipse-vertx/vert.x,https://api.github.com/repos/eclipse-vertx/vert.x,opened,SimpleConnectionPool leaks streams and connect...,bug,### Problem Description\r\nIn case the origina...,Not_TD,0.0
168050,2.025877e+10,IssuesEvent,2022-02-15 03:55:44,Connor2h/pizza-hunt,https://api.github.com/repos/Connor2h/pizza-hunt,closed,"Users can create, read, update, and delete dat...",enhancement,"* As a user, I can create and customize my own...",Not_TD,0.0
168051,2.263855e+10,IssuesEvent,2022-06-30 21:53:14,thexaero/open-parties-and-claims,https://api.github.com/repos/thexaero/open-par...,opened,Protect chunks against lightning bolts caused ...,enhancement,,Not_TD,0.0
168052,2.024838e+10,IssuesEvent,2022-02-14 15:40:30,hivedb/hive,https://api.github.com/repos/hivedb/hive,opened,Make TypeAdapter.typeId a string,enhancement,It looks like there may be a concern of type a...,Not_TD,0.0


In [38]:
va_gov_debt = TD[(TD["repo"] == "department-of-veterans-affairs/va.gov-team")]

not_va_gov_debt = Data[(
    Data["repo"] != "department-of-veterans-affairs/va.gov-team")]
va_gov_debt.to_csv("va_gov_debt.csv")
not_va_gov_debt.to_csv("not_va_gov_debt.csv")


In [39]:
va_gov_debt

Unnamed: 0,id,type,created_at,repo,repo_url,action,title,labels,body,class
78,2.002538e+10,IssuesEvent,2022-02-01 20:41:03,department-of-veterans-affairs/va.gov-team,https://api.github.com/repos/department-of-vet...,opened,Combined VBA + VHA debt portal from The Debt R...,vsa-debt sitewide content sitewide content-pro...,## What does your team need support for? Check...,TD
218,2.011435e+10,IssuesEvent,2022-02-07 17:54:13,department-of-veterans-affairs/va.gov-team,https://api.github.com/repos/department-of-vet...,reopened,"Remove references to ""content brief"" in Collab...",tech-debt collaboration-cycle governance-team,## Issue Description\nThe Sitewide Content tea...,TD
221,2.011482e+10,IssuesEvent,2022-02-07 18:21:53,department-of-veterans-affairs/va.gov-team,https://api.github.com/repos/department-of-vet...,closed,Analytics Implementation and QA Support for E...,analytics-insights analytics-request vsa-debt ...,# Google Analytics Implementation or QA Reques...,TD
225,2.011531e+10,IssuesEvent,2022-02-07 18:52:23,department-of-veterans-affairs/va.gov-team,https://api.github.com/repos/department-of-vet...,opened,[VBA Debt Portal] Bug - The existing empty sta...,bug frontend vsa vsa-debt Debt Letters,## Issue Description\n\n### Bug explanation\n\...,TD
231,2.011792e+10,IssuesEvent,2022-02-07 21:41:54,department-of-veterans-affairs/va.gov-team,https://api.github.com/repos/department-of-vet...,opened,[Debt Letters] eslint (depricate/import) - Loa...,frontend tech-debt vsa-debt Debt Letters,## Issue Description\nPlatform deprecated `<Lo...,TD
...,...,...,...,...,...,...,...,...,...,...
79991,2.000216e+10,IssuesEvent,2022-01-31 17:41:19,department-of-veterans-affairs/va.gov-team,https://api.github.com/repos/department-of-vet...,opened,[MCP] eslint (import/order),frontend tech-debt vsa-debt MCP,## Issue Description\nReceiving following esli...,TD
79992,2.000235e+10,IssuesEvent,2022-01-31 17:53:04,department-of-veterans-affairs/va.gov-team,https://api.github.com/repos/department-of-vet...,opened,[MCP] eslint (react/prop-types),frontend tech-debt vsa-debt MCP,## Issue Description\nReceiving following esli...,TD
79993,2.000249e+10,IssuesEvent,2022-01-31 18:01:18,department-of-veterans-affairs/va.gov-team,https://api.github.com/repos/department-of-vet...,opened,[MCP] eslint (react/jsx-no-bind),frontend tech-debt vsa-debt MCP,## Issue Description\nReceiving following esli...,TD
79995,2.000304e+10,IssuesEvent,2022-01-31 18:34:05,department-of-veterans-affairs/va.gov-team,https://api.github.com/repos/department-of-vet...,opened,[MCP] eslint (react/jsx-one-expression-per-line),frontend tech-debt vsa-debt MCP,## Issue Description\nReceiving following esli...,TD


In [41]:
not_va_gov_debt

Unnamed: 0,id,type,created_at,repo,repo_url,action,title,labels,body,class,label
0,2.000892e+10,IssuesEvent,2022-02-01 02:13:09,itchysats/itchysats,https://api.github.com/repos/itchysats/itchysats,opened,Wallet actor does not follow ADR006,tech-debt,- Wallet actor has a connection to electrum vi...,TD,
1,2.000928e+10,IssuesEvent,2022-02-01 02:59:01,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,closed,Denormalize ImportMap into Assets and Ephemera,techdebt,The ImportMap should show a tree structure of ...,TD,
2,2.000929e+10,IssuesEvent,2022-02-01 03:00:25,microsoft/vscode-jupyter,https://api.github.com/repos/microsoft/vscode-...,closed,notebookAndWebview tests failing,debt engineering,![image.png](https://images.zenhubusercontent....,TD,
3,2.000930e+10,IssuesEvent,2022-02-01 03:01:00,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,opened,Revise Ephemera to abstract away from DynamoDB,techdebt,Create utility functions to encapsulate the co...,TD,
4,2.000933e+10,IssuesEvent,2022-02-01 03:03:19,TonyLB/maketheworld,https://api.github.com/repos/TonyLB/maketheworld,opened,Revise controlChannel to abstract away from Dy...,techdebt,Create utility functions to encapsulate the co...,TD,
...,...,...,...,...,...,...,...,...,...,...,...
168049,2.215739e+10,IssuesEvent,2022-06-04 02:11:19,eclipse-vertx/vert.x,https://api.github.com/repos/eclipse-vertx/vert.x,opened,SimpleConnectionPool leaks streams and connect...,bug,### Problem Description\r\nIn case the origina...,Not_TD,0.0
168050,2.025877e+10,IssuesEvent,2022-02-15 03:55:44,Connor2h/pizza-hunt,https://api.github.com/repos/Connor2h/pizza-hunt,closed,"Users can create, read, update, and delete dat...",enhancement,"* As a user, I can create and customize my own...",Not_TD,0.0
168051,2.263855e+10,IssuesEvent,2022-06-30 21:53:14,thexaero/open-parties-and-claims,https://api.github.com/repos/thexaero/open-par...,opened,Protect chunks against lightning bolts caused ...,enhancement,,Not_TD,0.0
168052,2.024838e+10,IssuesEvent,2022-02-14 15:40:30,hivedb/hive,https://api.github.com/repos/hivedb/hive,opened,Make TypeAdapter.typeId a string,enhancement,It looks like there may be a concern of type a...,Not_TD,0.0


In [60]:
vscode_debt = Data[(Data["repo"] == "microsoft/vscode") |
     (Data["repo"] == "Microsoft/vscode")]


In [64]:
vscode_debt.to_csv("vscode_debt.csv")

In [62]:
not_vscode = Data[(Data["repo"] != "microsoft/vscode") &
                   (Data["repo"] != "Microsoft/vscode")]


In [65]:
not_vscode.to_csv("not_vscode_debt.csv")
