-
Notifications
You must be signed in to change notification settings - Fork 0
/
filter.R
36 lines (29 loc) · 1.38 KB
/
filter.R
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
library("dplyr")
# Load the two raw inputs from the working directory.
deps <- read.csv("react_deps.csv")
repos <- read.csv("repos.csv")

# Keep only dependency rows that have a matching row in `repos`.
# No `by` is supplied, so the join uses every column name the tables share.
tidy_repos <- inner_join(deps, repos)

# One-column table holding every `dependency` value under the name `name`.
temp <- select(tidy_repos, name = dependency)

# Drop the rows of `tidy_repos` that match `temp` on their shared columns
# (presumably just `name`, i.e. repos that are themselves listed as a
# dependency -- TODO confirm against the CSV schemas), then remove duplicates.
tidy_repos <- unique(anti_join(tidy_repos, temp))
library("tidyr")
# Per-repository dependency counts, one row per repo, with the counts for the
# two `isDev` values laid out side by side.
num_of_deps <- tidy_repos %>%
  select(repo, isDev) %>%
  group_by(repo, isDev) %>%
  count() %>%
  # Widen: one column per `isDev` value; a repo with no rows of a given kind
  # gets 0 rather than NA.
  spread(key = isDev, value = n, fill = 0) %>%
  ungroup() %>%
  # The widened columns are literally named `0` and `1`; give them
  # descriptive names.
  rename(dependencies = `0`, devDependencies = `1`)
# Box-plot summary of the per-repository counts. boxplot.stats() returns a
# list whose `stats` element holds, in order: lower whisker, lower hinge,
# median, upper hinge, upper whisker. The element name is written out in full
# instead of relying on `$` partial matching of an abbreviated name.
# NOTE(review): the commented vectors below look like output captured from an
# earlier run -- re-check them against the current CSV files.
boxplot.stats(num_of_deps$dependencies)$stats
# [1] 1 5 10 20 42
boxplot.stats(num_of_deps$devDependencies)$stats
# [1] 0 5 13 24 52
# The 20 repositories with the largest combined dependency count
# (dependencies + devDependencies), reported as GitHub links with both counts.
outliers <- num_of_deps %>%
  # Sort on the combined total directly; the total itself is not kept.
  arrange(desc(dependencies + devDependencies)) %>%
  head(20) %>%
  mutate(link = paste("https://github.com", repo, sep = "/")) %>%
  select(link, dependencies, devDependencies)
# The 100 most frequent dependencies among rows with isDev == 0, with `n`
# giving the number of rows in which each one appears.
runtime_deps <- tidy_repos %>%
  filter(isDev == 0) %>%
  select(dependency) %>%
  count(dependency, sort = TRUE) %>%
  head(100) %>%
  # Turn `dependency` into a factor whose levels are ordered by `n`
  # (presumably so that plots list packages by frequency).
  mutate(dependency = reorder(dependency, n))
# The 100 most frequent dependencies among rows with isDev == 1, with `n`
# giving the number of rows in which each one appears.
design_time_deps_top_100 <- tidy_repos %>%
  filter(isDev == 1) %>%
  select(dependency) %>%
  count(dependency, sort = TRUE) %>%
  head(100) %>%
  # Turn `dependency` into a factor whose levels are ordered by `n`
  # (presumably so that plots list packages by frequency).
  mutate(dependency = reorder(dependency, n))
# The 100 repositories with the highest `stars` value, as GitHub URLs.
samples <- tidy_repos %>%
  select(repo, stars) %>%
  # Collapse to one row per (repo, stars) pair; the count is only a means of
  # de-duplicating, so its `n` column is dropped straight away.
  group_by(repo, stars) %>%
  count() %>%
  ungroup() %>%
  select(-n) %>%
  arrange(desc(stars)) %>%
  head(100) %>%
  mutate(repo = paste("https://github.com", repo, sep = "/"))