diff --git a/conf/ambari.yml b/conf/ambari.yml index 405ad4d..a81d84a 100644 --- a/conf/ambari.yml +++ b/conf/ambari.yml @@ -51,28 +51,44 @@ version_control: - branch-2.5 mailing_list: - # Where is the mbox located locally? - mbox: ../../rawdata/mbox/ambari-dev.mbox - # What is the domain of the chosen mailing list archive? - domain: http://mail-archives.apache.org/mod_mbox - # Which lists of the domain will be used? - list_key: - - ambari-dev + mod_mbox: + mail_key_1: + archive_url: http://mail-archives.apache.org/mod_mbox/ambari-dev + mbox: ../../rawdata/ambari/mod_mbox/ambari-dev/ + mailing_list: ambari-dev + archive_type: apache + mail_key_2: + archive_url: http://mail-archives.apache.org/mod_mbox/ambari-user + mbox: ../../rawdata/ambari/mod_mbox/ambari-user/ + mailing_list: ambari-user + archive_type: apache + pipermail: + mail_key_1: + archive_url: http://some/pipermail/url + mbox: ../../rawdata/geronimo/pipermail/geronimo-dev/ issue_tracker: jira: - # Obtained from the project's JIRA URL - domain: https://issues.apache.org/jira - project_key: AMBARI - # Download using `download_jira_data.Rmd` - #issues: ../../rawdata/issue_tracker/ambari_issues.json - #issue_comments: ../../rawdata/issue_tracker/ambari_issue_comments.json + project_key_1: + # Obtained from the project's JIRA URL + domain: https://issues.apache.org/jira + project_key: AMBARI + # Download using `download_jira_data.Rmd` + # issues: ../../rawdata/ambari/jira/issues/ambari/ + # issue_comments: ../../rawdata/ambari/jira/issue_comments/ambari/ github: - # Obtained from the project's GitHub URL - owner: apache - repo: ambari - # Download using `download_github_comments.Rmd` - #replies: ../../rawdata/github/ambari/ + project_key_1: + # Obtained from the project's GitHub URL + owner: apache + repo: ambari + # Download using `download_github_comments.Rmd` + issue_or_pr_comment: ../../rawdata/ambari/github/issue_or_pr_comment/apache_ambari/ + issue: ../../rawdata/ambari/github/issue/apache_ambari/ + 
issue_search: ../../rawdata/ambari/github/issue_search/apache_ambari/ + pull_request: ../../rawdata/ambari/github/pull_request/apache_ambari/ + commit: ../../rawdata/ambari/github/commit/apache_ambari/ + # bugzilla: + # project_key: ambari #vulnerabilities: # Folder path with nvd cve feeds (e.g. nvdcve-1.1-2018.json) diff --git a/conf/apr.yml b/conf/apr.yml index 65892ed..9558d71 100644 --- a/conf/apr.yml +++ b/conf/apr.yml @@ -45,28 +45,39 @@ version_control: - trunk mailing_list: - # Where is the mbox located locally? - mbox: ../../rawdata/mbox/apr-dev_2012_2019.mbox - # What is the domain of the chosen mailing list archive? - domain: http://mail-archives.apache.org/mod_mbox - # Which lists of the domain will be used? - list_key: - - apr-dev + mod_mbox: + mail_key_1: + archive_url: http://mail-archives.apache.org/mod_mbox/apr-dev + mbox: ../../rawdata/apr/mod_mbox/apr-dev/ + mailing_list: apr-dev + archive_type: apache + pipermail: + mail_key_1: + archive_url: http://some/pipermail/url + mbox: ../../rawdata/geronimo/pipermail/geronimo-dev/ issue_tracker: jira: - # Obtained from the project's JIRA URL - domain: https://issues.apache.org/jira - #project_key: HELIX - # Download using `download_jira_data.Rmd` - #issues: ../../rawdata/issue_tracker/helix_issues.json - #issue_comments: ../../rawdata/issue_tracker/helix_issue_comments.json + project_key_1: + # Obtained from the project's JIRA URL + domain: https://issues.apache.org/jira + #project_key: HELIX + # Download using `download_jira_data.Rmd` + # issues: ../../rawdata/apr/jira/issues/helix/ + # issue_comments: ../../rawdata/apr/jira/issue_comments/helix/ github: - # Obtained from the project's GitHub URL - owner: apache - repo: apr - # Download using `download_github_comments.Rmd` - replies: ../../rawdata/github/apr/ + project_key_1: + # Obtained from the project's GitHub URL + owner: apache + repo: apr + # Download using `download_github_comments.Rmd` + issue_or_pr_comment: 
../../rawdata/apr/github/issue_or_pr_comment/apache_apr/ + issue: ../../rawdata/apr/github/issue/apache_apr/ + issue_search: ../../rawdata/apr/github/issue_search/apache_apr/ + pull_request: ../../rawdata/apr/github/pull_request/apache_apr/ + commit: ../../rawdata/apr/github/commit/apache_apr/ + + #vulnerabilities: # Folder path with nvd cve feeds (e.g. nvdcve-1.1-2018.json) diff --git a/conf/calculator.yml b/conf/calculator.yml index 2b95b6f..7184b59 100644 --- a/conf/calculator.yml +++ b/conf/calculator.yml @@ -58,14 +58,32 @@ mailing_list: # domain: https://issues.apache.org/jira #project_key: HELIX # Download using `download_jira_data.Rmd` - #issues: ../../rawdata/issue_tracker/helix_issues.json - #issue_comments: ../../rawdata/issue_tracker/helix_issue_comments.json + #issues: ../../rawdata/helix/jira/issues/ + #issue_comments: ../../rawdata/helix/jira/issue_comments/ github: - # Obtained from the project's GitHub URL - owner: HouariZegai - repo: Calculator - # Download using `download_github_comments.Rmd` - replies: ../../rawdata/github/Calculator/ + + replies: ../../rawdata/Calculator/github/ + +issue_tracker: + jira: + project_key_1: + # Obtained from the project's JIRA URL + # domain: https://issues.apache.org/jira + # project_key: HELIX + # Download using `download_jira_data.Rmd` + # issues: ../../rawdata/helix/jira/issues/helix/ + # issue_comments: ../../rawdata/helix/jira/issue_comments/helix/ + github: + project_key_1: + # Obtained from the project's GitHub URL + owner: HouariZegai + repo: Calculator + # Download using `download_github_comments.Rmd` + issue_or_pr_comment: ../../rawdata/Calculator/github/issue_or_pr_comment/HouariZegai_Calculator/ + issue: ../../rawdata/Calculator/github/issue/HouariZegai_Calculator/ + issue_search: ../../rawdata/Calculator/github/issue_search/HouariZegai_Calculator/ + pull_request: ../../rawdata/Calculator/github/pull_request/HouariZegai_Calculator/ + commit: 
../../rawdata/Calculator/github/commit/HouariZegai_Calculator/ #vulnerabilities: # Folder path with nvd cve feeds (e.g. nvdcve-1.1-2018.json) diff --git a/conf/camel.yml b/conf/camel.yml index 7a14fa7..284dfcf 100644 --- a/conf/camel.yml +++ b/conf/camel.yml @@ -46,14 +46,22 @@ version_control: - camel-3.21.0 - camel-1.0.0 -#mailing_list: - # Where is the mbox located locally? -# mbox: ../../rawdata/mbox/apr-dev_2012_2019.mbox - # What is the domain of the chosen mailing list archive? -# domain: http://mail-archives.apache.org/mod_mbox - # Which lists of the domain will be used? -# list_key: -# - apr-dev +mailing_list: + mod_mbox: + mail_key_1: + archive_url: http://mail-archives.apache.org/mod_mbox/camel-dev + mbox: ../../rawdata/camel/mod_mbox/camel-dev/ + mailing_list: camel-dev + archive_type: apache + mail_key_2: + archive_url: http://mail-archives.apache.org/mod_mbox/camel-users + mbox: ../../rawdata/camel/mod_mbox/camel-users/ + mailing_list: camel-users + archive_type: apache + pipermail: + mail_key_1: + archive_url: http://some/pipermail/url + mbox: ../../rawdata/geronimo/pipermail/geronimo-dev/ issue_tracker: jira: @@ -61,14 +69,37 @@ issue_tracker: # domain: https://issues.apache.org/jira project_key: CAMEL # Download using `download_jira_data.Rmd` - issues: ../../rawdata/issue_tracker/camel_issues.json - issue_comments: ../../rawdata/issue_tracker/camel_issue_comments.json + issues: ../../rawdata/camel/jira/issues/ + issue_comments: ../../rawdata/camel/jira/issue_comments/ # github: # Obtained from the project's GitHub URL # owner: apache # repo: apr # Download using `download_github_comments.Rmd` -# replies: ../../rawdata/github/apr/ +# replies: ../../rawdata/apr/github/ + + +issue_tracker: + jira: + project_key_1: + # Obtained from the project's JIRA URL + # domain: https://issues.apache.org/jira + project_key: CAMEL + # Download using `download_jira_data.Rmd` + issues: ../../rawdata/camel/jira/issues/camel/ + issue_comments: 
../../rawdata/camel/jira/issue_comments/camel/ + github: + project_key_1: + # Obtained from the project's GitHub URL + # owner: apache + # repo: apr + # Download using `download_github_comments.Rmd` + # issue_or_pr_comment: ../../rawdata/apr/github/issue_or_pr_comment/apache_apr/ + # issue: ../../rawdata/apr/github/issue/apache_apr/ + # issue_search: ../../rawdata/apr/github/issue_search/apache_apr/ + # pull_request: ../../rawdata/apr/github/pull_request/apache_apr/ + # commit: ../../rawdata/apr/github/commit/apache_apr/ + #vulnerabilities: # Folder path with nvd cve feeds (e.g. nvdcve-1.1-2018.json) diff --git a/conf/chromium.yml b/conf/chromium.yml index 3d0f128..cafed7a 100644 --- a/conf/chromium.yml +++ b/conf/chromium.yml @@ -54,18 +54,24 @@ mailing_list: issue_tracker: jira: - # Obtained from the project's JIRA URL - #domain: https://issues.apache.org/jira - #project_key: GERONIMO - # Download using `download_jira_data.Rmd` - #issues: ../../rawdata/issue_tracker/geronimo_issues.json - #issue_comments: ../../rawdata/issue_tracker/geronimo_issue_comments.json + project_key_1: + # Obtained from the project's JIRA URL + # domain: https://issues.apache.org/jira + #project_key: HELIX + # Download using `download_jira_data.Rmd` + # issues: ../../rawdata/helix/jira/issues/helix/ + # issue_comments: ../../rawdata/helix/jira/issue_comments/helix/ github: - # Obtained from the project's GitHub URL - #owner: sailuh - #repo: kaiaulu - # Download using `download_github_comments.Rmd` - #replies: ../../rawdata/github/kaiaulu/ + project_key_1: + # Obtained from the project's GitHub URL + # owner: apache + # repo: apr + # # Download using `download_github_comments.Rmd` + # issue_or_pr_comment: ../../rawdata/apr/github/issue_or_pr_comment/apache_apr/ + # issue: ../../rawdata/apr/github/issue/apache_apr/ + # issue_search: ../../rawdata/apr/github/issue_search/apache_apr/ + # pull_request: ../../rawdata/apr/github/pull_request/apache_apr/ + # commit: 
../../rawdata/apr/github/commit/apache_apr/ vulnerabilities: # Folder path with nvd cve feeds (e.g. nvdcve-1.1-2018.json) diff --git a/conf/geronimo.yml b/conf/geronimo.yml index 99ee59a..55161d3 100644 --- a/conf/geronimo.yml +++ b/conf/geronimo.yml @@ -44,28 +44,42 @@ version_control: - trunk mailing_list: - # Where is the mbox located locally? - mbox: ../../rawdata/mbox/geronimo-dev.mbox - # What is the domain of the chosen mailing list archive? - domain: http://mail-archives.apache.org/mod_mbox - # Which lists of the domain will be used? - list_key: - - geronimo-dev + mod_mbox: + mail_key_1: + archive_url: http://mail-archives.apache.org/mod_mbox/geronimo-dev + mbox: ../../rawdata/geronimo/mod_mbox/geronimo-dev/ + mailing_list: geronimo-dev + archive_type: apache + mail_key_2: + archive_url: http://mail-archives.apache.org/mod_mbox/geronimo-user + mbox: ../../rawdata/geronimo/mod_mbox/geronimo-user/ + mailing_list: geronimo-user + archive_type: apache + pipermail: + mail_key_1: + archive_url: http://some/pipermail/url + mbox: ../../rawdata/geronimo/pipermail/geronimo-dev/ issue_tracker: jira: - # Obtained from the project's JIRA URL - domain: https://issues.apache.org/jira - project_key: GERONIMO - # Download using `download_jira_data.Rmd` - issues: ../../rawdata/issue_tracker/geronimo_issues.json - issue_comments: ../../rawdata/issue_tracker/geronimo_issue_comments.json + project_key_1: + # Obtained from the project's JIRA URL + domain: https://issues.apache.org/jira + project_key: GERONIMO + # Download using `download_jira_data.Rmd` + issues: ../../rawdata/geronimo/jira/issues/geronimo + issue_comments: ../../rawdata/geronimo/jira/issue_comments/geronimo github: - # Obtained from the project's GitHub URL - owner: apache - repo: geronimo - # Download using `download_github_comments.Rmd` - replies: ../../rawdata/github/geronimo/ + project_key_1: + # Obtained from the project's GitHub URL + owner: apache + repo: geronimo + # Download using 
`download_github_comments.Rmd` + issue_or_pr_comment: ../../rawdata/geronimo/github/issue_or_pr_comment/apache_geronimo/ + issue: ../../rawdata/geronimo/github/issue/apache_geronimo/ + issue_search: ../../rawdata/geronimo/github/issue_search/apache_geronimo/ + pull_request: ../../rawdata/geronimo/github/pull_request/apache_geronimo/ + commit: ../../rawdata/geronimo/github/commit/apache_geronimo/ #vulnerabilities: # Folder path with nvd cve feeds (e.g. nvdcve-1.1-2018.json) diff --git a/conf/helix.yml b/conf/helix.yml index 2effc52..fa48ad5 100644 --- a/conf/helix.yml +++ b/conf/helix.yml @@ -48,30 +48,44 @@ version_control: - revert-1685-master mailing_list: - # Where is the mbox located locally? - # This is the path to the .git of the project repository you are analyzing. - # The .git is hidden, so you can see it using `ls -a` - mbox: ../../rawdata/mbox/helix_mbox - # What is the domain of the chosen mailing list archive? - domain: http://mail-archives.apache.org/mod_mbox - # Which lists of the domain will be used? 
- list_key: - - helix-dev + mod_mbox: + mail_key_1: + archive_url: http://mail-archives.apache.org/mod_mbox/helix-dev + mbox: ../../rawdata/helix/mod_mbox/helix-dev/ + mailing_list: helix-dev + archive_type: apache + mail_key_2: + archive_url: http://mail-archives.apache.org/mod_mbox/helix-user + mbox: ../../rawdata/helix/mod_mbox/helix-user/ + mailing_list: helix-user + archive_type: apache + pipermail: + mail_key_1: + archive_url: http://some/pipermail/url + mbox: ../../rawdata/geronimo/pipermail/geronimo-dev/ issue_tracker: jira: - # Obtained from the project's JIRA URL - domain: https://issues.apache.org/jira - project_key: HELIX - # Download using `download_jira_data.Rmd` - issues: ../../rawdata/issue_tracker/helix_issues.json - issue_comments: ../../rawdata/issue_tracker/helix_issue_comments.json + project_key_1: + # Obtained from the project's JIRA URL + domain: https://issues.apache.org/jira + project_key: HELIX + # Download using `download_jira_data.Rmd` + issues: ../../rawdata/helix/jira/issues/helix + issue_comments: ../../rawdata/helix/jira/issue_comments/helix github: - # Obtained from the project's GitHub URL - owner: apache - repo: helix - # Download using `download_github_comments.Rmd` - replies: ../../rawdata/github/helix/ + project_key_1: + # Obtained from the project's GitHub URL + owner: apache + repo: helix + # Download using `download_github_comments.Rmd` + issue_or_pr_comment: ../../rawdata/helix/github/issue_or_pr_comment/apache_helix/ + issue: ../../rawdata/helix/github/issue/apache_helix/ + issue_search: ../../rawdata/helix/github/issue_search/apache_helix/ + pull_request: ../../rawdata/helix/github/pull_request/apache_helix/ + commit: ../../rawdata/helix/github/commit/apache_helix/ + #bugzilla: + #project_key: helix #vulnerabilities: # Folder path with nvd cve feeds (e.g. 
nvdcve-1.1-2018.json) diff --git a/conf/junit5.yml b/conf/junit5.yml index cdf0a33..25c4cb6 100644 --- a/conf/junit5.yml +++ b/conf/junit5.yml @@ -52,20 +52,26 @@ version_control: # list_key: # - apr-dev -#issue_tracker: -# jira: - # Obtained from the project's JIRA URL -# domain: https://issues.apache.org/jira - #project_key: HELIX - # Download using `download_jira_data.Rmd` - #issues: ../../rawdata/issue_tracker/helix_issues.json - #issue_comments: ../../rawdata/issue_tracker/helix_issue_comments.json -# github: - # Obtained from the project's GitHub URL -# owner: apache -# repo: apr - # Download using `download_github_comments.Rmd` -# replies: ../../rawdata/github/apr/ +# issue_tracker: +# jira: +# project_key_1: +# # Obtained from the project's JIRA URL +# domain: https://issues.apache.org/jira +# #project_key: HELIX +# # Download using `download_jira_data.Rmd` +# # issues: ../../rawdata/helix/jira/issues/helix/ +# # issue_comments: ../../rawdata/helix/jira/issue_comments/helix/ +# github: +# project_key_1: +# # Obtained from the project's GitHub URL +# owner: apache +# repo: apr +# # Download using `download_github_comments.Rmd` +# issue_or_pr_comment: ../../rawdata/apr/github/issue_or_pr_comment/apache_apr/ +# issue: ../../rawdata/apr/github/issue/apache_apr/ +# issue_search: ../../rawdata/apr/github/issue_search/apache_apr/ +# pull_request: ../../rawdata/apr/github/pull_request/apache_apr/ +# commit: ../../rawdata/apr/github/commit/apache_apr/ #vulnerabilities: # Folder path with nvd cve feeds (e.g. 
nvdcve-1.1-2018.json) diff --git a/conf/kaiaulu.yml b/conf/kaiaulu.yml index a5f007c..fc26a92 100644 --- a/conf/kaiaulu.yml +++ b/conf/kaiaulu.yml @@ -54,18 +54,37 @@ mailing_list: issue_tracker: jira: - # Obtained from the project's JIRA URL - #domain: https://issues.apache.org/jira - #project_key: GERONIMO - # Download using `download_jira_data.Rmd` - #issues: ../../rawdata/issue_tracker/geronimo_issues.json - #issue_comments: ../../rawdata/issue_tracker/geronimo_issue_comments.json + project_key_1: + # Obtained from the project's JIRA URL + domain: https://sailuh.atlassian.net + project_key: SAILUH + # Download using `download_jira_data.Rmd` + issues: ../../rawdata/kaiaulu/jira/issues/sailuh/ + issue_comments: ../../rawdata/kaiaulu/jira/issue_comments/sailuh/ github: - # Obtained from the project's GitHub URL - owner: sailuh - repo: kaiaulu - # Download using `download_github_comments.Rmd` - replies: ../../rawdata/github/kaiaulu + project_key_1: + # Obtained from the project's GitHub URL + owner: sailuh + repo: kaiaulu + # Download using `download_github_comments.Rmd` + issue_or_pr_comment: ../../rawdata/kaiaulu/github/issue_or_pr_comment/sailuh_kaiaulu/ + issue: ../../rawdata/kaiaulu/github/issue/sailuh_kaiaulu/ + issue_search: ../../rawdata/kaiaulu/github/issue_search/sailuh_kaiaulu/ + pull_request: ../../rawdata/kaiaulu/github/pull_request/sailuh_kaiaulu/ + commit: ../../rawdata/kaiaulu/github/commit/sailuh_kaiaulu/ + # project_key_2: + # # Obtained from the project's GitHub URL + # owner: ssunoo2 + # repo: kaiaulu + # # Download using `download_github_comments.Rmd` + # issue_or_pr_comment: ../../rawdata/kaiaulu/github/issue_or_pr_comment/ssunoo2_kaiaulu/ + # issue: ../../rawdata/kaiaulu/github/issue/ssunoo2_kaiaulu/ + # refresh_issues: ../../rawdata/kaiaulu/github/refresh_issues/ssunoo2_kaiaulu + # pull_request: ../../rawdata/kaiaulu/github/pull_request/ssunoo2_kaiaulu/ + # commit: ../../rawdata/kaiaulu/github/commit/ssunoo2_kaiaulu/ + #bugzilla: + #project_key: kaiaulu + 
#vulnerabilities: # Folder path with nvd cve feeds (e.g. nvdcve-1.1-2018.json) diff --git a/conf/openssl.yml b/conf/openssl.yml index aa7b225..6f88a9b 100644 --- a/conf/openssl.yml +++ b/conf/openssl.yml @@ -45,29 +45,46 @@ version_control: - master mailing_list: - # Where is the mbox located locally? - #mbox: ../../rawdata/mbox/openssl_dev_mbox # 2004-2008 fields are complete - mbox: ../../rawdata/mbox/openssl-dev.mbx # 2002-2019 gmail field is redacted due to google groups - # What is the domain of the chosen mailing list archive? - #domain: http://mail-archives.apache.org/mod_mbox - # Which lists of the domain will be used? - #list_key: - # - apr-dev + mod_mbox: + mail_key_1: + archive_url: http://mail-archives.apache.org/mod_mbox/apr-dev + mbox: ../../rawdata/apr/mod_mbox/apr-dev/ + mailing_list: apr-dev + archive_type: apache + pipermail: + mail_key_1: + archive_url: https://mta.openssl.org/pipermail/openssl-dev/ + mbox: ../../rawdata/openssl/pipermail/openssl-dev/ + mailing_list: openssl-dev + archive_type: mta + mail_key_2: + archive_url: https://mta.openssl.org/pipermail/openssl-users/ + mbox: ../../rawdata/openssl/pipermail/openssl-users/ + mailing_list: openssl-users + archive_type: mta -#issue_tracker: - #jira: - # Obtained from the project's JIRA URL - #domain: https://issues.apache.org/jira - #project_key: HELIX - # Download using `download_jira_data.Rmd` - #issues: ../../rawdata/issue_tracker/helix_issues.json - #issue_comments: ../../rawdata/issue_tracker/helix_issue_comments.json - #github: - # Obtained from the project's GitHub URL - #owner: apache - #repo: apr - # Download using `download_github_comments.Rmd` - #replies: ../../rawdata/github/apr/ +# issue_tracker: +# jira: +# project_key_1: +# # Obtained from the project's JIRA URL +# domain: https://issues.apache.org/jira +# #project_key: HELIX +# # Download using `download_jira_data.Rmd` +# # issues: ../../rawdata/helix/jira/issues/helix/ +# # issue_comments: 
../../rawdata/helix/jira/issue_comments/helix/ +# github: +# project_key_1: +# # Obtained from the project's GitHub URL +# owner: apache +# repo: apr +# # Download using `download_github_comments.Rmd` +# issue_or_pr_comment: ../../rawdata/apr/github/issue_or_pr_comment/apache_apr/ +# issue: ../../rawdata/apr/github/issue/apache_apr/ +# issue_search: ../../rawdata/apr/github/issue_search/apache_apr/ +# pull_request: ../../rawdata/apr/github/pull_request/apache_apr/ +# commit: ../../rawdata/apr/github/commit/apache_apr/ +# bugzilla: +# project_key: openssl vulnerabilities: # Folder path with nvd cve feeds (e.g. nvdcve-1.1-2018.json) diff --git a/conf/redhat.yml b/conf/redhat.yml new file mode 100644 index 0000000..611ef93 --- /dev/null +++ b/conf/redhat.yml @@ -0,0 +1,172 @@ +# -*- yaml -*- +# https://github.com/sailuh/kaiaulu +# +# Copying and distribution of this file, with or without modification, +# are permitted in any medium without royalty provided the copyright +# notice and this notice are preserved. This file is offered as-is, +# without any warranty. + +# Project Configuration File # +# +# To perform analysis on open source projects, you need to manually +# collect some information from the project's website. As there is +# no standardized website format, this file serves to distill +# important data source information so it can be reused by others +# and understood by Kaiaulu. +# +# Please check https://github.com/sailuh/kaiaulu/tree/master/conf to +# see if a project configuration file already exists. Otherwise, we +# would appreciate if you share your curated file with us by sending a +# Pull Request: https://github.com/sailuh/kaiaulu/pulls +# +# Note, you do NOT need to specify this entire file to conduct analysis. +# Each R Notebook uses a different portion of this file. To know what +# information is used, see the project configuration file section at +# the start of each R Notebook. 
+# +# Please comment unused parameters instead of deleting them for clarity. +# If you have questions, please open a discussion: +# https://github.com/sailuh/kaiaulu/discussions + +project: + website: http://itm0.shidler.hawaii.edu/kaiaulu + openhub: https://www.openhub.net/p/kaiaulu + +version_control: + # Where is the git log located locally? + # This is the path to the .git of the project repository you are analyzing. + # The .git is hidden, so you can see it using `ls -a` + log: ../../rawdata/git_repo/kaiaulu/.git + # From where the git log was downloaded? + log_url: https://github.com/sailuh/kaiaulu + # List of branches used for analysis + branch: + - master + +mailing_list: + # Where is the mbox located locally? + #mbox: ../../rawdata/mbox/geronimo-dev.mbox + # What is the domain of the chosen mailing list archive? + #domain: http://mail-archives.apache.org/mod_mbox + # Which lists of the domain will be used? + #list_key: + # - geronimo-dev + +issue_tracker: + jira: + project_key_1: + # Obtained from the project's JIRA URL + domain: https://sailuh.atlassian.net + project_key: SAILUH + # Download using `download_jira_data.Rmd` + issues: ../../rawdata/kaiaulu/jira/issues/sailuh/ + issue_comments: ../../rawdata/kaiaulu/jira/issue_comments/sailuh/ + github: + project_key_1: + # Obtained from the project's GitHub URL + owner: sailuh + repo: kaiaulu + # Download using `download_github_comments.Rmd` + issue_or_pr_comment: ../../rawdata/kaiaulu/github/issue_or_pr_comment/sailuh_kaiaulu/ + issue: ../../rawdata/kaiaulu/github/issue/sailuh_kaiaulu/ + issue_search: ../../rawdata/kaiaulu/github/issue_search/sailuh_kaiaulu/ + pull_request: ../../rawdata/kaiaulu/github/pull_request/sailuh_kaiaulu/ + commit: ../../rawdata/kaiaulu/github/commit/sailuh_kaiaulu/ + # project_key_2: + # # Obtained from the project's GitHub URL + # owner: ssunoo2 + # repo: kaiaulu + # # Download using `download_github_comments.Rmd` + # issue_or_pr_comment: 
../../rawdata/kaiaulu/github/issue_or_pr_comment/ssunoo2_kaiaulu/ + # issue: ../../rawdata/kaiaulu/github/issue/ssunoo2_kaiaulu/ + # refresh_issues: ../../rawdata/kaiaulu/github/refresh_issues/ssunoo2_kaiaulu + # pull_request: ../../rawdata/kaiaulu/github/pull_request/ssunoo2_kaiaulu/ + # commit: ../../rawdata/kaiaulu/github/commit/ssunoo2_kaiaulu/ + bugzilla: + project_key: redhat + + +#vulnerabilities: + # Folder path with nvd cve feeds (e.g. nvdcve-1.1-2018.json) + # Download at: https://nvd.nist.gov/vuln/data-feeds + #nvd_feed: rawdata/nvdfeed + +# Commit message CVE or Issue Regular Expression (regex) +# See project's commit message for examples to create the regex +commit_message_id_regex: + issue_id: \#[0-9]+ + #cve_id: ? + +filter: + keep_filepaths_ending_with: + - R + remove_filepaths_containing: + - test + + +# Third Party Tools Configuration # +# +# See Kaiaulu's README.md for details on how to set up these tools. +tool: + # Depends allows parsing file-file static dependencies. + depends: + # accepts one language at a time: cpp, java, ruby, python, pom + # You can obtain this information on OpenHub or the project GitHub page right pane. + code_language: java + # Specify which types of Dependencies to keep - see the Depends tool README.md for details. + keep_dependencies_type: + - Cast + - Call + - Import + - Return + - Set + - Use + - Implement + - ImplLink + - Extend + - Create + - Throw + - Parameter + - Contain + # Uctags allows finer file-file dependency parsing (e.g. functions, classes, structs) + uctags: + # See https://github.com/sailuh/kaiaulu/wiki/Universal-Ctags for details + # What types of file-file dependencies should be considered? If all + # dependencies are specified, Kaiaulu will use all of them if available. 
+ keep_lines_type: + c: + - f # function definition + cpp: + - c # classes + - f # function definition + java: + - c # classes + - m # methods + python: + - c # classes + - f # functions + r: + - f # functions + +# Analysis Configuration # +analysis: + # You can specify the intervals in 2 ways: window, or enumeration + window: + # If using gitlog, use start_commit and end_commit. Timestamp is inferred from gitlog + start_commit: 224a729f44f554af311ca52cf01b105ded87499b + end_commit: 74cd4d4835a02e01e310476c6776192ad0d97173 + # Use datetime only if no gitlog is used in the analysis. + #start_datetime: 2013-05-01 00:00:00 + #end_datetime: 2013-11-01 00:00:00 + size_days: 30 +# enumeration: + # If using gitlog, specify the commits +# commit: +# - 9eae9e96f15e1f216162810cef4271a439a74223 +# - f1d2d568776b3708dd6a3077376e2331f9268b04 +# - c33a2ce74c84f0d435bfa2dd8953d132ebf7a77a + # Use datetime only if no gitlog is used in the analysis. Timestamp is inferred from gitlog +# datetime: +# - 2013-05-01 00:00:00 +# - 2013-08-01 00:00:00 +# - 2013-11-01 00:00:00 diff --git a/conf/spark.yml b/conf/spark.yml index bafca66..d861e80 100644 --- a/conf/spark.yml +++ b/conf/spark.yml @@ -42,28 +42,42 @@ version_control: - master mailing_list: - # Where is the mbox located locally? - #mbox: ../rawdata/mbox/spark-dev.mbox - # What is the domain of the chosen mailing list archive? - #domain: http://mail-archives.apache.org/mod_mbox - # Which lists of the domain will be used? 
- #list_key: - # - spark-dev + mod_mbox: + mail_key_1: + archive_url: http://mail-archives.apache.org/mod_mbox/spark-dev + mbox: ../../rawdata/spark/mod_mbox/spark-dev/ + mailing_list: spark-dev + archive_type: apache + mail_key_2: + archive_url: http://mail-archives.apache.org/mod_mbox/spark-user + mbox: ../../rawdata/spark/mod_mbox/spark-user/ + mailing_list: spark-user + archive_type: apache + pipermail: + mail_key_1: + archive_url: http://some/pipermail/url + mbox: ../../rawdata/geronimo/pipermail/geronimo-dev/ -issue_tracker: - jira: - # Obtained from the project's JIRA URL - #domain: https://issues.apache.org/jira - #project_key: SPARK - # Download using `download_jira_data.Rmd` - #issues: ../../rawdata/issue_tracker/spark_issues.json - #issue_comments: ../../rawdata/issue_tracker/sparj_issue_comments.json - github: - # Obtained from the project's GitHub URL - #owner: apache - #repo: spark - # Download using `download_github_comments.Rmd` - #replies: ../../rawdata/github/spark/ +# issue_tracker: +# jira: +# project_key_1: +# # Obtained from the project's JIRA URL +# domain: https://issues.apache.org/jira +# #project_key: HELIX +# # Download using `download_jira_data.Rmd` +# # issues: ../../rawdata/helix/jira/issues/helix/ +# # issue_comments: ../../rawdata/helix/jira/issue_comments/helix/ +# github: +# project_key_1: +# # Obtained from the project's GitHub URL +# owner: apache +# repo: apr +# # Download using `download_github_comments.Rmd` +# issue_or_pr_comment: ../../rawdata/apr/github/issue_or_pr_comment/apache_apr/ +# issue: ../../rawdata/apr/github/issue/apache_apr/ +# issue_search: ../../rawdata/apr/github/issue_search/apache_apr/ +# pull_request: ../../rawdata/apr/github/pull_request/apache_apr/ +# commit: ../../rawdata/apr/github/commit/apache_apr/ #vulnerabilities: # Folder path with nvd cve feeds (e.g. 
nvdcve-1.1-2018.json) diff --git a/conf/thrift.yml b/conf/thrift.yml index f47062b..25959b3 100644 --- a/conf/thrift.yml +++ b/conf/thrift.yml @@ -42,28 +42,42 @@ version_control: - master mailing_list: - # Where is the mbox located locally? - mbox: ../../rawdata/mbox/thrift-dev.mbox # Download here: https://cdn.lfdr.de/stmc/ieee_tse_data/mail/thrift-dev.mbox - # What is the domain of the chosen mailing list archive? - domain: http://mail-archives.apache.org/mod_mbox - # Which lists of the domain will be used? - list_key: - - thrift-dev + mod_mbox: + mail_key_1: + archive_url: http://mail-archives.apache.org/mod_mbox/thrift-dev + mbox: ../../rawdata/thrift/mod_mbox/thrift-dev/ + mailing_list: thrift-dev + archive_type: apache + mail_key_2: + archive_url: http://mail-archives.apache.org/mod_mbox/thrift-user + mbox: ../../rawdata/thrift/mod_mbox/thrift-user/ + mailing_list: thrift-user + archive_type: apache + pipermail: + mail_key_1: + archive_url: http://some/pipermail/url + mbox: ../../rawdata/geronimo/pipermail/geronimo-dev/ issue_tracker: jira: - # Obtained from the project's JIRA URL - domain: https://issues.apache.org/jira - project_key: THRIFT - # Download using `download_jira_data.Rmd` - issues: ../../rawdata/issue_tracker/thrift_issues.json - issue_comments: ../../rawdata/issue_tracker/thrift_issue_comments.json + project_key_1: + # Obtained from the project's JIRA URL + domain: https://issues.apache.org/jira + project_key: THRIFT + # Download using `download_jira_data.Rmd` + issues: ../../rawdata/thrift/jira/issues/thrift/ + issue_comments: ../../rawdata/thrift/jira/issue_comments/thrift/ github: - # Obtained from the project's GitHub URL - owner: apache - repo: thrift - # Download using `download_github_comments.Rmd` - replies: ../../rawdata/github/thrift/ + project_key_1: + # Obtained from the project's GitHub URL + owner: apache + repo: thrift + # Download using `download_github_comments.Rmd` + issue_or_pr_comment: 
../../rawdata/thrift/github/issue_or_pr_comment/apache_thrift/ + issue: ../../rawdata/thrift/github/issue/apache_thrift/ + issue_search: ../../rawdata/thrift/github/issue_search/apache_thrift/ + pull_request: ../../rawdata/thrift/github/pull_request/apache_thrift/ + commit: ../../rawdata/thrift/github/commit/apache_thrift/ #vulnerabilities: # Folder path with nvd cve feeds (e.g. nvdcve-1.1-2018.json) diff --git a/conf/tomcat.yml b/conf/tomcat.yml index 33884ba..5d1c131 100644 --- a/conf/tomcat.yml +++ b/conf/tomcat.yml @@ -44,31 +44,42 @@ version_control: - master mailing_list: - # Where is the mbox located locally? - #mbox: ../../rawdata/mbox/tomcat-dev_2013_2019.mbox - # What is the domain of the chosen mailing list archive? - domain: http://mail-archives.apache.org/mod_mbox - # Which lists of the domain will be used? - list_key: - - tomcat-dev + mod_mbox: + mail_key_1: + archive_url: http://mail-archives.apache.org/mod_mbox/tomcat-dev + mbox: ../../rawdata/tomcat/mod_mbox/tomcat-dev/ + mailing_list: tomcat-dev + archive_type: apache + mail_key_2: + archive_url: http://mail-archives.apache.org/mod_mbox/tomcat-users + mbox: ../../rawdata/tomcat/mod_mbox/tomcat-users/ + mailing_list: tomcat-users + archive_type: apache + pipermail: + mail_key_1: + archive_url: http://some/pipermail/url + mbox: ../../rawdata/geronimo/pipermail/geronimo-dev/ -issue_tracker: - jira: - # Obtained from the project's JIRA URL - #domain: https://issues.apache.org/jira - #project_key: GERONIMO - # Download using `download_jira_data.Rmd` - #issues: ../../rawdata/issue_tracker/geronimo_issues.json - #issue_comments: ../../rawdata/issue_tracker/geronimo_issue_comments.json - github: - # Obtained from the project's GitHub URL - #owner: apache - #repo: geronimo - # Download using `download_github_comments.Rmd` - #replies: ../../rawdata/github/geronimo/ - # Currently not supported - #bugzilla: - #url: 
https://bz.apache.org/bugzilla/buglist.cgi?bug_status=__open__&no_redirect=1&order=Importance&product=Tomcat%209&query_format=specific +# issue_tracker: +# jira: +# project_key_1: +# # Obtained from the project's JIRA URL +# domain: https://issues.apache.org/jira +# #project_key: HELIX +# # Download using `download_jira_data.Rmd` +# # issues: ../../rawdata/helix/jira/issues/helix/ +# # issue_comments: ../../rawdata/helix/jira/issue_comments/helix/ +# github: +# project_key_1: +# # Obtained from the project's GitHub URL +# owner: apache +# repo: apr +# # Download using `download_github_comments.Rmd` +# issue_or_pr_comment: ../../rawdata/apr/github/issue_or_pr_comment/apache_apr/ +# issue: ../../rawdata/apr/github/issue/apache_apr/ +# issue_search: ../../rawdata/apr/github/issue_search/apache_apr/ +# pull_request: ../../rawdata/apr/github/pull_request/apache_apr/ +# commit: ../../rawdata/apr/github/commit/apache_apr/ #vulnerabilities: # Folder path with nvd cve feeds (e.g. nvdcve-1.1-2018.json) diff --git a/conf/tse_apex.yml b/conf/tse_apex.yml index 46841ce..1a41a6b 100644 --- a/conf/tse_apex.yml +++ b/conf/tse_apex.yml @@ -52,20 +52,26 @@ mailing_list: # list_key: # - geronimo-dev -issue_tracker: +issue_tracker: jira: - # Obtained from the project's JIRA URL - domain: https://issues.apache.org/jira - project_key: APEXCORE - # Download using `download_jira_data.Rmd` - issues: ../../../../tse_motif_2021/dataset/jira/apex - #issue_comments: ../../rawdata/issue_tracker/geronimo_issue_comments.json - #github: - # Obtained from the project's GitHub URL - #owner: apache - #repo: geronimo - # Download using `download_github_comments.Rmd` - #replies: ../../rawdata/github/geronimo/ + project_key_1: + # Obtained from the project's JIRA URL + domain: https://issues.apache.org/jira + project_key: APEXCORE + # Download using `download_jira_data.Rmd` + issues: ../../rawdata/apex/jira/issues/apexcore/ + issue_comments: ../../rawdata/apex/jira/issue_comments/apexcore/ +# github: 
+# project_key_1: +# # Obtained from the project's GitHub URL +# owner: apache +# repo: apr +# # Download using `download_github_comments.Rmd` +# issue_or_pr_comment: ../../rawdata/apr/github/issue_or_pr_comment/apache_apr/ +# issue: ../../rawdata/apr/github/issue/apache_apr/ +# issue_search: ../../rawdata/apr/github/issue_search/apache_apr/ +# pull_request: ../../rawdata/apr/github/pull_request/apache_apr/ +# commit: ../../rawdata/apr/github/commit/apache_apr/ #vulnerabilities: # Folder path with nvd cve feeds (e.g. nvdcve-1.1-2018.json)