In [18]:
import pybliometrics.scopus as scopus
import numpy as np
import pandas as pd
import random
import time

In [19]:
year='2017'
query = f'title-abs-key("engineering" AND "research" AND "innovation") AND PUBYEAR = {year}'
labels = 'ABCDEFGHIJKLMNOPQRSTUVWXYZ'

In [20]:
scopus.init()
papers = scopus.ScopusSearch(query, subscriber=True, verbose=True, view='COMPLETE')
print(papers.results[3])

Downloading results for query "title-abs-key("engineering" AND "research" AND "innovation") AND PUBYEAR = 2017":


100%|██████████| 47/47 [00:44<00:00,  1.04it/s]

Document(eid='2-s2.0-85041456600', doi='10.1080/20964471.2017.1403062', pii=None, pubmed_id=None, title='Big Earth data: A new frontier in Earth and information sciences', subtype='ar', subtypeDescription='Article', creator='Guo H.', afid='60019499', affilname='Chinese Academy of Sciences', affiliation_city='Beijing', affiliation_country='China', author_count='1', author_names='Guo, Huadong', author_ids='56415384100', author_afids='60019499', coverDate='2017-12-22', coverDisplayDate='22 December 2017', publicationName='Big Earth Data', issn='20964471', source_id='21101020024', eIssn='25745417', aggregationType='Journal', volume='1', issueIdentifier='1-2', article_number=None, pageRange='4-20', description='Big data is a revolutionary innovation that has allowed the development of many new methods in scientific research. This new way of thinking has encouraged the pursuit of new discoveries. Big data occupies the strategic high ground in the era of knowledge economies and also constitut




In [21]:
df = pd.DataFrame(papers.results)

In [22]:
# สร้าง DataFrame เพื่อบันทึกเป็น CSV
data = []

for paper in papers.results:
    # Format the author names
    if hasattr(paper, 'author_names') and paper.author_names:
        # Split the author names by ';' and remove leading/trailing spaces
        authors = paper.author_names.split(';')
        authors = [author.strip() for author in authors]  # Strip extra spaces

        formatted_authors = []
        for author in authors:
            name_parts = author.split(',')
            if len(name_parts) == 2:  # If the name has both Lastname and Firstname
                last_name = name_parts[0].strip()
                first_name = name_parts[1].strip()
                # Only append the initial if there is a first name
                if first_name:
                    formatted_authors.append(f"{last_name} {first_name[0]}.")
                else:
                    formatted_authors.append(f"{last_name}.")  # In case of missing first name
            else:  # If the name is a single part (like just Lastname)
                formatted_authors.append(f"{name_parts[0].strip()}.")

        # Join formatted authors with "; "
        formatted_authors = "; ".join(formatted_authors)
    else:
        formatted_authors = ""

    paper_dict = {
        "Title": paper.title,
        "Abstract": paper.description if hasattr(paper, 'description') else "",
        "Author": formatted_authors,
        "Aggregation_Type": paper.aggregationType if hasattr(paper, 'aggregationType') else "",
        "Publisher": paper.publicationName if hasattr(paper, 'publicationName') else "",
        "Publication_Date": paper.coverDate if hasattr(paper, 'coverDate') else "",
        "Institutions": "; ".join(paper.affilname.split('; ')) if hasattr(paper, 'affilname') and paper.affilname else "",
        "Keywords": "; ".join(paper.authkeywords.split('|')) if hasattr(paper, 'authkeywords') and paper.authkeywords else "",
    }
    data.append(paper_dict)



df = pd.DataFrame(data)

output_file = f"../../ExtractedData/Scopus/scopus_papers_{year}.csv"
df.to_csv(output_file, index=False, encoding="utf-8")

In [23]:
df = pd.read_csv(output_file)

In [24]:
df.head(10)

Unnamed: 0,Title,Abstract,Author,Aggregation_Type,Publisher,Publication_Date,Institutions,Keywords
0,Research on development status and innovation ...,"In the paper, patent literatures of giant magn...",Yan H.; Tan R.; Yang Z.; Hao H.,Journal,Gongneng Cailiao/Journal of Functional Materials,2017-12-30,Inner Mongolia University of Science and Techn...,Dynamic of technology ; Giant magnetostrictiv...
1,ACM International Conference Proceeding Series,The proceedings contain 24 papers. The topics ...,,Conference Proceeding,ACM International Conference Proceeding Series,2017-12-28,,
2,3D printed braille maps - Texas A&M,This report explores the practical application...,Wilson J.; Wooten T.,Conference Proceeding,GHTC 2017 - IEEE Global Humanitarian Technolog...,2017-12-22,Texas A&M University,
3,Big Earth data: A new frontier in Earth and in...,Big data is a revolutionary innovation that ha...,Guo H.,Journal,Big Earth Data,2017-12-22,Chinese Academy of Sciences,Big data ; big Earth data ; decision support...
4,A smart place to work,,Davis B.,Journal,Nature,2017-12-21,,
5,Study on Social Responsibility Learning Needs ...,The advent of digital era and the growing comp...,Fleacǎ E.,Conference Proceeding,Balkan Region Conference on Engineering and Bu...,2017-12-20,University Politehnica of Bucharest,quality and innovation in higher education ; ...
6,Emerging Scientific and Engineering Opportunit...,Energy and water resources are deeply intercon...,Urban J.,Journal,Joule,2017-12-20,Lawrence Berkeley National Laboratory,energy ; membranes ; pretreatment ; thermal...
7,Research on reform plan of civil engineering a...,As for civil engineering adult education gradu...,Su Z.; Sun S.; Cui S.,Conference Proceeding,IOP Conference Series: Earth and Environmental...,2017-12-20,Liaocheng University,
8,A user-friendly college recommending system us...,Currently in India college ranking is the issu...,Girase S.; Powar V.; Mukhopadhyay D.,Conference Proceeding,Proceeding - IEEE International Conference on ...,2017-12-19,Dr. Vishwanath Karad MIT World Peace University,Matrix Factorization ; Recommendation System ...
9,Handbook of Research on Biomimetics and Biomed...,Biomimetic research is an emerging field that ...,Habib M.,Book,Handbook of Research on Biomimetics and Biomed...,2017-12-15,The American University in Cairo,
