In [1]:
# Input data: ten article records under the "articles" key, each a dict with
# string fields "articleId", "title", and "abstract".
# The trailing backslash continues the assignment onto the dict literal below.
articles_data = \
{
  "articles": [
    {
      "articleId": "1",
      "title": "Adaptive Frequency Hopping in 5G Networks for Enhanced QoS",
      "abstract": "This paper explores the implementation of adaptive frequency hopping techniques in 5G networks to improve Quality of Service (QoS). We discuss the challenges of interference management and propose a novel algorithm that dynamically adjusts hopping patterns based on real-time network conditions. Simulation results show a significant enhancement in both latency and throughput."
    },
    {
      "articleId": "2",
      "title": "Energy-Efficient Routing Protocols for IoT Networks",
      "abstract": "With the proliferation of IoT devices, energy efficiency in wireless networks has become crucial. This article introduces new routing protocols designed to minimize energy consumption while maintaining network connectivity. Through extensive simulations, we demonstrate that our protocols extend battery life by up to 30% compared to existing solutions."
    },
    {
      "articleId": "3",
      "title": "Millimeter Wave Communication: Challenges and Opportunities",
      "abstract": "Millimeter wave (mmWave) technology offers significant bandwidth for high data rates but comes with unique challenges like high path loss and sensitivity to blockages. This review examines the state-of-the-art in mmWave communication, focusing on propagation characteristics, beamforming techniques, and practical deployment issues."
    },
    {
      "articleId": "4",
      "title": "Secure Data Transmission in Ad Hoc Networks via Blockchain",
      "abstract": "Security remains a pivotal concern in ad hoc networks due to their dynamic nature. This study proposes integrating blockchain technology to ensure secure data transmission. The approach leverages distributed ledgers for transaction verification, providing a robust security framework against tampering and denial-of-service attacks."
    },
    {
      "articleId": "5",
      "title": "Network Slicing for Next-Generation Wireless Systems",
      "abstract": "Network slicing is pivotal for tailoring network services to specific applications in 5G and beyond. This paper discusses various slicing strategies, their implementation complexities, and performance benefits. We present a case study using a simulated urban environment to illustrate how slicing can optimize resource allocation for different service classes."
    },
    {
      "articleId": "6",
      "title": "Impact of UAVs on Wireless Network Performance",
      "abstract": "Unmanned Aerial Vehicles (UAVs) are increasingly used for extending network coverage and capacity. This article quantifies the impact of UAV-assisted networks on traditional wireless infrastructure. We analyze aspects like signal shadowing, interference, and mobility, providing insights into optimizing UAV deployment for maximum network efficiency."
    },
    {
      "articleId": "7",
      "title": "Machine Learning for Predictive Channel Modeling in Wireless Networks",
      "abstract": "Channel modeling is central to wireless network performance. This paper applies machine learning techniques to predict channel characteristics in dynamic environments. Our models, trained on real-world data, show superior prediction accuracy, which can lead to more efficient resource management and reduced interference."
    },
    {
      "articleId": "8",
      "title": "Latency Optimization in Wireless Sensor Networks",
      "abstract": "Latency in wireless sensor networks can critically affect data timeliness, especially in applications requiring real-time responses. This research introduces a method to optimize latency through adaptive sleep/wake cycles and dynamic data aggregation. Field tests demonstrate significant latency reductions without compromising energy efficiency."
    },
    {
      "articleId": "9",
      "title": "Cross-Layer Design for Enhancing Throughput in Wi-Fi 6 Networks",
      "abstract": "Wi-Fi 6 introduces several enhancements, yet challenges in throughput persist. This study investigates a cross-layer approach to optimize data transmission in Wi-Fi 6 environments, focusing on MAC and PHY layer interactions. Our findings suggest that such designs can increase throughput by adapting to network conditions more effectively."
    },
    {
      "articleId": "10",
      "title": "Interference Management in Dense Wireless Networks",
      "abstract": "In dense deployments, interference becomes a major issue. Here, we propose and evaluate an interference management strategy based on cooperative MIMO and cognitive radio techniques. The results from our experimental network setup show a marked improvement in signal quality and user experience in high-density scenarios."
    }
  ]
}

In [6]:
import pandas as pd
import sqlite3
from sklearn.feature_extraction.text import TfidfVectorizer
import re

In [7]:
# Build the article frame and, in the same expression, derive a combined
# "text" column of the form "<title>. <abstract>" for vectorisation.
df = pd.DataFrame(articles_data["articles"]).assign(
    text=lambda frame: frame["title"] + ". " + frame["abstract"]
)


In [15]:
# TF-IDF over 2- and 3-word n-grams with English stop words removed,
# capped at 10 features for the whole corpus.
vectorizer = TfidfVectorizer(
    stop_words="english",
    ngram_range=(2, 3),
    max_features=10,
)

# Fit on the combined title + abstract text; X is the document-term matrix.
X = vectorizer.fit_transform(df["text"])

# The n-gram strings selected as features; used below as candidate terms.
terms = vectorizer.get_feature_names_out()

In [16]:
def split_sentences(text):
    """Split ``text`` into sentences on whitespace that follows ``.``, ``?`` or ``!``.

    The terminating punctuation stays attached to its sentence. Surrounding
    whitespace is stripped first and empty fragments are dropped, so an empty
    or whitespace-only string yields ``[]`` rather than ``['']``.

    Args:
        text: The text to split. Non-string values (e.g. ``None`` or a NaN
            from a missing DataFrame cell) are treated as having no sentences.

    Returns:
        list[str]: The sentences in their original order.

    Note:
        The split is purely punctuation-based, so abbreviations such as
        "e.g. this" are split after the period as well.
    """
    if not isinstance(text, str):
        return []
    # Strip first so trailing whitespace after the last terminator does not
    # produce a spurious empty final "sentence".
    fragments = re.split(r'(?<=[.?!])\s+', text.strip())
    return [fragment for fragment in fragments if fragment]

In [17]:
# Accumulators filled by the term-linking loop.
# term_defs: (term_id, term, definition sentence) tuples.
# article_term_links: (article_id, term_id) pairs.
term_defs, article_term_links = [], []

# Maps each term string to the integer id assigned to it.
term_id_map = dict()

# Next id to hand out; ids start at 1.
term_counter = 1

In [18]:
# Link every article to each extracted term that occurs in its abstract, and
# record a "definition" for a term the first time it is seen: the first
# abstract sentence (in article order) that contains it.
#
# Matching is a plain, case-insensitive substring test against each sentence.
#
# NOTE: this cell appends to term_defs / article_term_links and advances
# term_counter, so re-running it without re-running the initialisation cell
# first will duplicate the links.
for article_id, abstract in zip(df["articleId"], df["abstract"]):
    sentences = split_sentences(abstract)
    # Lowercase each sentence once per article instead of once per term.
    lowered_sentences = [sentence.lower() for sentence in sentences]
    for term in terms:
        # Index of the first sentence containing the term, or None if absent.
        first_hit = next(
            (idx for idx, lowered in enumerate(lowered_sentences) if term in lowered),
            None,
        )
        if first_hit is None:
            continue
        if term not in term_id_map:
            # First occurrence overall: assign the next id and keep the
            # original-case sentence as the term's definition.
            term_id_map[term] = term_counter
            term_defs.append((term_counter, term, sentences[first_hit]))
            term_counter += 1
        article_term_links.append((article_id, term_id_map[term]))

In [19]:
# Display the collected (term_id, term, definition sentence) tuples.
term_defs 

[(1,
  'frequency hopping',
  'This paper explores the implementation of adaptive frequency hopping techniques in 5G networks to improve Quality of Service (QoS).'),
 (2,
  'interference management',
  'We discuss the challenges of interference management and propose a novel algorithm that dynamically adjusts hopping patterns based on real-time network conditions.'),
 (3,
  'energy efficiency',
  'With the proliferation of IoT devices, energy efficiency in wireless networks has become crucial.'),
 (4,
  'wireless networks',
  'With the proliferation of IoT devices, energy efficiency in wireless networks has become crucial.'),
 (5,
  'data transmission',
  'This study proposes integrating blockchain technology to ensure secure data transmission.'),
 (6,
  'secure data',
  'This study proposes integrating blockchain technology to ensure secure data transmission.'),
 (7,
  'secure data transmission',
  'This study proposes integrating blockchain technology to ensure secure data transmissi