In [1]:
import pickle
from datetime import datetime, timedelta, date
import matplotlib.pyplot as plt
from collections import defaultdict
from crossref.restful import Works
import pandas as pd
pd.set_option('max_colwidth', 40)

with open('downloads_per_doi.pkl', 'rb') as pkl:
    doi_count = pickle.load(pkl)

In [2]:
works = Works()
doi = doi_count[1][0]
record = works.doi(doi)
record['author']

[{'name': 'The Cancer Genome Atlas Research Network',
  'sequence': 'first',
  'affiliation': []}]

In [3]:
def citation_generator(doi):

    article = ''
    record = works.doi(doi)

    # Author information
    try:
        at_el = False
        for a in record['author']:
            if a['sequence'] == 'first':
                article += '{} {}, '.format(a['given'],a['family'])
            else:
                at_el = True
        article = article[:-2]
        if at_el:
            article = article + ', at el '
    except:
        pass
    
    # Date and Title
    try:
        year = record['indexed']['date-time'][:4]
        title = record['title'][0]
        article += '({}) {}. '.format(year, title)
    except:
        pass
    
    # Publication
    try:
        article += '{} ({}):'.format(record['publisher'], record['issue'])
        article += '{}'.format(record['page'])
    except:
        pass   
    return article



In [4]:
table = []
for i in range(10):
    doi = doi_count[i][0]
    cnt = doi_count[i][1]
    table.append([cnt, doi, citation_generator(doi)])


In [5]:
pd.set_option('max_colwidth', 200)
pd_table = pd.DataFrame(table, columns=['Count', 'DOI', 'Article'])
pd_table

Unnamed: 0,Count,DOI,Article
0,7988,10.1007/978-1-4419-9716-6_11,"Richard Osgood, at el (2019) Full-scale modal wind turbine tests: comparing shaker excitation with wind excitation."
1,6117,10.1056/NEJMoa1402121,"(2020) Comprehensive, Integrative Genomic Analysis of Diffuse Lower-Grade Gliomas. Massachusetts Medical Society (26):2481-2498"
2,2991,10.1116/1.4904970,"Padmashree D. Joshi, at el (2019) Photosensitive field emission study of SnS2 nanosheets. American Vacuum Society (3):03C106"
3,2890,10.1103/PhysRevB.63.224204,"Olexei Motrunich, at el (2020) Griffiths effects and quantum critical points in dirty superconductors without spin-rotation invariance: One-dimensional examples. American Physical Society (APS) (22):"
4,2528,10.1182/asheducation-2015.1.8,Clara Camaschella(2020) Iron deficiency: new insights into diagnosis and treatment. American Society of Hematology (1):8-13
5,2266,10.4028/www.scientific.net/AMM.7-8.159,"M.A. Garcia-Romeu-Martinez, at el (2019) Monitoring the Evolution of Fatigue in Corrugated Paperboard under Random Loads."
6,2241,10.1111/j.1365-277X.2004.00520.x,"J. J. Lara, at el (2019) Intentional mis-reporting of food consumption and its relationship with body mass index and psychological scores in women. Wiley (3):209-218"
7,2168,10.1002/pmic.200600525,"Dustin Lippert, at el (2019) Conifer defense against insects: Proteome analysis of Sitka spruce (Picea sitchensis) bark induced by mechanical wounding or feeding by white pine weevils (Pissodes st..."
8,2001,10.1161/CIRCRESAHA.117.306290,"Parwiz Abrahimi, at el (2019) Efficient Gene Disruption in Cultured Primary Human Endothelial Cells by CRISPR/Cas9. Ovid Technologies (Wolters Kluwer Health) (2):121-128"
9,1806,10.1002/smll.201002009,"Xiao Huang, at el (2020) Graphene-Based Materials: Synthesis, Characterization, Properties, and Applications. Wiley (14):1876-1902"


In [6]:
for i in range(10):
    print(table[i])
    print('')

[7988, '10.1007/978-1-4419-9716-6_11', 'Richard Osgood, at el (2019) Full-scale modal wind turbine tests: comparing shaker excitation with wind excitation. ']

[6117, '10.1056/NEJMoa1402121', '(2020) Comprehensive, Integrative Genomic Analysis of Diffuse Lower-Grade Gliomas. Massachusetts Medical Society (26):2481-2498']

[2991, '10.1116/1.4904970', 'Padmashree D. Joshi, at el (2019) Photosensitive field emission study of SnS2 nanosheets. American Vacuum Society (3):03C106']

[2890, '10.1103/PhysRevB.63.224204', 'Olexei Motrunich, at el (2020) Griffiths effects and quantum critical points in dirty superconductors without spin-rotation invariance: One-dimensional examples. American Physical Society (APS) (22):']

[2528, '10.1182/asheducation-2015.1.8', 'Clara Camaschella(2020) Iron deficiency: new insights into diagnosis and treatment. American Society of Hematology (1):8-13']

[2266, '10.4028/www.scientific.net/AMM.7-8.159', 'M.A. Garcia-Romeu-Martinez, at el (2019) Monitoring the Evol