Skip to content

Commit

Permalink
add blog notes
Browse files Browse the repository at this point in the history
  • Loading branch information
hpiwowar committed Oct 1, 2015
1 parent f0de55e commit 164cdcc
Show file tree
Hide file tree
Showing 2 changed files with 47 additions and 0 deletions.
38 changes: 38 additions & 0 deletions blog_notes.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,38 @@



Things that have lots of downloads, but not much pagerank
--------------
-- PyPI packages ranked by the ratio of scaled pagerank to scaled downloads,
-- smallest ratio first (i.e. many downloads relative to pagerank).
-- The divisors 0.0203305158035518609 and 14940006.0 are hard-coded scaling
-- constants; presumably the maximum pagerank and maximum num_downloads at the
-- time these notes were written (TODO confirm, and refresh if the data changes).
select
    id,
    pagerank / 0.0203305158035518609 as pagerank_scaled,
    num_downloads / 14940006.0 as num_downloads_scaled,
    num_downloads,
    -- the tiny epsilon keeps the division defined when num_downloads is 0
    (pagerank / 0.0203305158035518609)
        / (0.00000000001 + (num_downloads / 14940006.0)) as r,
    import_name,
    summary
from package
where host = 'pypi'
    and pagerank > 0
    -- optional extra filter, left disabled in the original notes:
    -- and num_downloads_percentile > 0.1
-- id breaks ties on r so the rows kept by LIMIT are stable between runs
-- (assumes id is unique per package; confirm against the schema)
order by r asc, id asc
limit 100



PageRank benefits 1:
if people import ONLY you, you get more love than if they import loads of things
-------------------
-- CRAN packages with num_downloads_percentile above 0.5 and a
-- pagerank_percentile strictly between 0.6 and 0.99999999, listed from the
-- lowest pagerank upwards.
select
    id,
    summary,
    -- epsilon avoids division by zero (redundant given the > 0.5 filter
    -- below, but harmless)
    pagerank_percentile / (0.00000000001 + num_downloads_percentile) as r,
    -- NOTE: this alias shadows the pagerank column. In WHERE, "pagerank" is
    -- the raw table column; in ORDER BY, PostgreSQL resolves a bare name to
    -- the output column first, i.e. this scaled value.
    pagerank * 1000000 as pagerank,
    pagerank_percentile,
    num_downloads_percentile,
    num_downloads,
    neighborhood_size,
    indegree
from package
where host = 'cran'
    and pagerank > 0
    and num_downloads_percentile > 0.5
    and pagerank_percentile > .6
    and pagerank_percentile < .99999999
-- id breaks ties on pagerank so the rows kept by LIMIT are stable between
-- runs (assumes id is unique per package; confirm against the schema)
order by pagerank asc, id asc
limit 1000
9 changes: 9 additions & 0 deletions sql/set_unique_import_name.sql
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
-- Flag import names as non-unique when more than one host='pypi' row in
-- package shares the same import_name.
-- NOTE(review): duplicates are counted among host='pypi' rows only, but the
-- update itself is not restricted by host, so rows from other hosts with a
-- matching import_name are updated too. Confirm that this is intended.
update package
set unique_import_name = false
where import_name in (
    select import_name
    from package
    where host = 'pypi'
    group by import_name
    having count(id) > 1
)

0 comments on commit 164cdcc

Please sign in to comment.