# Find Top Related Topics

In [1]:
import os
import re
from io import StringIO

import pandas as pd
from dotenv import load_dotenv
from pybliometrics.scival import PublicationLookup, init

from utils import get_content, split_lines

# Load the variables defined in the local .env file, then initialise pybliometrics.
load_dotenv()
init()

# SET COOKIE in .env file
COOKIE = os.getenv('COOKIE')
if not COOKIE:
    # os.getenv returns None for an unset variable; stop here with a clear
    # message instead of handing a missing cookie to get_content later on.
    raise RuntimeError("COOKIE is not set; add a COOKIE=<value> line to your .env file")

In [2]:
# EID of the pybliometrics paper whose topic we want to explore
PYBLIOMETRICS_EID = '85068268027'

# Look the publication up and read its topic ID
pl = PublicationLookup(PYBLIOMETRICS_EID)
topic_id = pl.topic_id

In [3]:
# Request page 1 of the "related_topics" content for the topic
res_text = get_content(
    topic_id,
    api="related_topics",
    cookie=COOKIE,
    page=1,
)

In [None]:
intro_lines, table_text = split_lines(res_text, api="related_topics")

# Show the first three intro lines that are parsed below
print("\n".join(intro_lines[:3]))


def _header_value(pattern, line):
    """Return the first capture group of ``pattern`` found in ``line``.

    Args:
        pattern: Regular expression containing exactly one capture group.
        line: The intro line to search.

    Returns:
        The text captured by the group for the first match.

    Raises:
        ValueError: If ``line`` does not match ``pattern``, so a changed
            header format is reported with the offending line instead of
            a bare IndexError.
    """
    found = re.search(pattern, line)
    if found is None:
        raise ValueError(f"Intro line {line!r} does not match pattern {pattern!r}")
    return found.group(1)


# Match: Data set,""<to_match>""
data_set = _header_value(r'Data set,?""(.*)""', intro_lines[0])
# Match: Entity,"<to_match>"
entity = _header_value(r'Entity,?"(.*)"', intro_lines[1])
# Match: Year range,<to_match>
year_range = _header_value(r'Year range,?(.*)', intro_lines[2])

# Display the parsed values as the cell result
data_set, entity, year_range

Data set,""Top 50 related Topics, by keyphrase match""
Entity,"Impact of Citation Metrics on Scientific Evaluation (T.192)"
Year range,2020 to >2025


('Top 50 related Topics, by keyphrase match',
 'Impact of Citation Metrics on Scientific Evaluation (T.192)',
 '2020 to >2025')

In [None]:
# Number of related topics the table is expected to contain
n = 50

# Drop the last 3 lines of the table text: they are footer lines, not data rows
all_table_lines = table_text.splitlines()[:-3]
table_csv = "\n".join(all_table_lines)

# Parse the remaining lines as CSV and check the row count
df = pd.read_csv(StringIO(table_csv))
assert len(df) == n, f"Expected {n} rows, got {df.shape[0]}"

In [19]:
# Preview the first five rows (head() defaults to n=5)
df.head()

Unnamed: 0,Topics,Topic Number,Topic Cluster,Relatedness rank,Scholarly Output,Prominence percentile
0,Sleeping Beauties in Citation Dynamics,T.35998,Peer Review Dynamics in Biomedical Research Ne...,1,149,73.702
1,Bibliometric Insights into Global Research Trends,T.79084,Peer Review Dynamics in Biomedical Research Ne...,2,378,91.342
2,International Scientific Publication Trends an...,T.74396,Peer Review Dynamics in Biomedical Research Ne...,3,51,53.541
3,Impact of Social Media on Research Visibility,T.5737,Peer Review Dynamics in Biomedical Research Ne...,4,1311,94.375
4,Research Output and Citation Trends in India,T.57117,Peer Review Dynamics in Biomedical Research Ne...,5,115,40.347


In [1]:
from dotenv import dotenv_values

from pybliometrics.scival import PublicationLookup, init
from scival_search import RelatedTopics

# Initialise pybliometrics before any lookup is made
init()

# Read the cookie from the values returned by dotenv_values()
env_vars = dotenv_values()
COOKIE = env_vars['COOKIE']

# Look up the publication and take its topic ID
pl = PublicationLookup('85068268027')
topic_id = pl.topic_id

# Build the related-topics object from the topic ID and cookie
topics = RelatedTopics(
    topic_id=topic_id,
    cookie=COOKIE,
    show_progress=True,
)

# Display the results as the cell output
topics.results

Data for topic ID 192: Top 50 related Topics, by keyphrase match
Entity: Impact of Citation Metrics on Scientific Evaluation (T.192)
Year range: 2020 to >2025


Unnamed: 0,Topics,Topic Number,Topic Cluster,Relatedness rank,Scholarly Output,Prominence percentile
0,Sleeping Beauties in Citation Dynamics,T.35998,Peer Review Dynamics in Biomedical Research Ne...,1,149,73.702
1,Bibliometric Insights into Global Research Trends,T.79084,Peer Review Dynamics in Biomedical Research Ne...,2,384,91.342
2,International Scientific Publication Trends an...,T.74396,Peer Review Dynamics in Biomedical Research Ne...,3,50,53.541
3,Impact of Social Media on Research Visibility,T.5737,Peer Review Dynamics in Biomedical Research Ne...,4,1315,94.375
4,Research Output and Citation Trends in India,T.57117,Peer Review Dynamics in Biomedical Research Ne...,5,115,40.347
5,Acknowledgment Patterns in Scientific Research...,T.56003,Peer Review Dynamics in Biomedical Research Ne...,6,140,71.897
6,Trends in Library and Information Science Publ...,T.31758,Peer Review Dynamics in Biomedical Research Ne...,7,193,73.24
7,Scientometric Insights into Research Publicati...,T.77088,Peer Review Dynamics in Biomedical Research Ne...,8,34,13.772
8,Patterns of Scientific Productivity and Distri...,T.25965,Peer Review Dynamics in Biomedical Research Ne...,9,81,61.392
9,Nobel Prize Influence on Scientific Collaboration,T.36387,Peer Review Dynamics in Biomedical Research Ne...,10,157,72.449
