In [16]:
from tqdm import tqdm
import pandas as pd
from sentence_transformers import SentenceTransformer, util
import torch
import ast

In [3]:
# Load the raw table and parse every "topics" cell with ast.literal_eval
# (presumably list literals such as "['docker', 'python']" -- verify against the CSV).
# NOTE(review): the path is absolute and machine-specific; the notebook will not
# run elsewhere until it is pointed at a configurable data directory.
df = pd.read_csv('C:/Users/29400/Desktop/data/original_data.csv').assign(
    topics=lambda frame: frame["topics"].apply(ast.literal_eval)
)

# Sentence-embedding model used by the following cells to encode topic strings.
model = SentenceTransformer("all-MiniLM-L6-v2")

In [18]:
# Candidate labels; each repository is assigned exactly one of these.
predefined_topics = [
    "artificial-intelligence",
    "computer-vision",
    "web-development",
    "cybersecurity",
    "cloud-computing",
    "blockchain",
    "data-science",
    "education",
    "system",
]

# Encode the labels once here so the per-repository matching can reuse the tensor.
predefined_embeddings = model.encode(predefined_topics, convert_to_tensor=True)

# Register tqdm's pandas integration (adds the progress_apply method used below).
tqdm.pandas()
def match_topic(repo_topics):
    """Pick the predefined topic that best matches a repository's topics.

    Each entry of ``repo_topics`` is embedded with the module-level ``model``,
    the embeddings are averaged into a single vector, and that vector is
    compared by cosine similarity against ``predefined_embeddings``.

    Args:
        repo_topics: The topics of one repository (one cell of ``df["topics"]``).

    Returns:
        ``"Unknown"`` when ``repo_topics`` is falsy (for example an empty
        list); otherwise the entry of ``predefined_topics`` with the highest
        similarity. No minimum similarity is enforced, so a label is returned
        however weak the best match is.
    """
    # Nothing to embed: report the repository as unclassified.
    if not repo_topics:
        return "Unknown"

    # Embed every topic, then average them into one representative vector;
    # keepdim=True keeps the leading dimension for the similarity call.
    topic_vectors = model.encode(repo_topics, convert_to_tensor=True)
    repo_vector = topic_vectors.mean(dim=0, keepdim=True)

    # Cosine similarity between the averaged vector and every predefined topic.
    scores = util.pytorch_cos_sim(repo_vector, predefined_embeddings)

    # argmax without a dim argument indexes the flattened score tensor; the
    # resulting index selects the winning label.
    return predefined_topics[scores.argmax()]

# Classify every repository: run match_topic on each "topics" entry (with a
# tqdm progress bar) and store the resulting label in "classified_topic".
df["classified_topic"] = df["topics"].progress_apply(match_topic)

  0%|          | 17/185876 [00:00<36:29, 84.89it/s] 

['docker', 'miui', 'python', 'xiaomi'] -> system (Similarity: 0.3459)
['android', 'game', 'game-development', 'ios', 'java', 'libgdx'] -> system (Similarity: 0.4498)
['camera', 'embedded-project', 'esp32', 'esp32-cam', 'esp8266', 'espressif', 'firebase', 'firebase-database', 'firebase-realtime-database', 'flutter', 'gfx', 'gui', 'iot-project', 'lvgl', 'mcu', 'mqtt', 'tutorial'] -> system (Similarity: 0.4562)
['diskstation', 'dsm', 'rackstation', 'synology', 'synology-disk-station', 'synology-dsm', 'synology-nas'] -> data-science (Similarity: 0.4143)
['diskstation', 'dsm', 'rackstation', 'synology', 'synology-disk-station', 'synology-dsm', 'synology-nas'] -> data-science (Similarity: 0.4143)
['ajp', 'cnvd-2020-10487', 'cve-2020-1938', 'exp', 'ghostcat'] -> system (Similarity: 0.4268)
['flask', 'jieba', 'news', 'search-engine'] -> data-science (Similarity: 0.4253)
['jq', 'json', 'query', 'rust'] -> system (Similarity: 0.3921)
['arsenal', 'exploitation', 'faraday', 'kali', 'metasploit', '

  0%|          | 45/185876 [00:00<18:12, 170.16it/s]

['nodejs'] -> web-development (Similarity: 0.3863)
['asyncio', 'mysql', 'orm', 'peewee', 'postgresql', 'python'] -> system (Similarity: 0.4284)
['attack-defense-ctf', 'awd', 'awd-platform', 'cardinal', 'ctf', 'ctf-awd', 'ctf-awd-platform', 'ctf-platform', 'golang', 'lsif-enabled'] -> system (Similarity: 0.3525)
['css', 'css-in-js', 'preprocessor', 'style'] -> system (Similarity: 0.4505)
['icons', 'react', 'vue'] -> system (Similarity: 0.3384)
['create2', 'ethereum', 'factory', 'metamorphic', 'mutable', 'smart-contracts'] -> blockchain (Similarity: 0.6037)
['education', 'rust', 'video'] -> education (Similarity: 0.7246)
['captcha-solving', 'gan', 'generative-adversarial-network', 'keras', 'neural-network', 'simgan'] -> artificial-intelligence (Similarity: 0.4922)
['cryptocurrency', 'hft', 'high-frequency-trading', 'orderbook', 'trading'] -> blockchain (Similarity: 0.5472)
['3d', 'graphics', 'realism', 'shaders', 'threejs'] -> computer-vision (Similarity: 0.5436)
['antialiasing', 'global

  0%|          | 139/185876 [00:00<08:59, 344.43it/s]

['cpp', 'cpp11', 'cpp14', 'cpp17', 'cpp20', 'cpp98'] -> system (Similarity: 0.2950)
['boost', 'cpp', 'libevent', 'mongodb', 'nginx', 'ntyco', 'openmp'] -> blockchain (Similarity: 0.4307)
['c', 'dpdk', 'linux-kernel', 'openvswitch', 'vpp'] -> system (Similarity: 0.4717)
['c', 'ffmpeg', 'webrtc'] -> computer-vision (Similarity: 0.4131)
['cpu', 'high-performance', 'interview', 'mongodb', 'mysql', 'network', 'nginx', 'redis', 'storage', 'zookeeper'] -> system (Similarity: 0.5229)
['docker', 'go', 'golang', 'k8s', 'kubernetes'] -> system (Similarity: 0.4153)
['ceph', 'fuse', 'kvm', 'linux-kernel'] -> system (Similarity: 0.4750)
['c', 'kernel', 'linux', 'memory-management'] -> system (Similarity: 0.5660)
['ceph', 'ebpf', 'fuse', 'iouring', 'kvm', 'linux-kernel'] -> system (Similarity: 0.4440)
['cpp', 'kubernetes', 'linux', 'tcp-ip'] -> system (Similarity: 0.4427)
['cassandra', 'couchdb', 'mariadb', 'mongodb', 'mysql', 'oceanbase', 'percona-server', 'redis', 'rocksdb', 'tidb', 'tokudb'] -> da

  0%|          | 281/185876 [00:00<07:18, 423.11it/s]

['linux', 'linux-insides', 'linux-kernel'] -> system (Similarity: 0.4288)
['binary', 'ctf', 'ctf-tools', 'database', 'exploitation', 'libc', 'libc-database', 'libc-db', 'libcdb', 'pwn', 'reverse-engineering', 'wargame'] -> data-science (Similarity: 0.4853)
['ctf', 'ctf-tools', 'exploitation', 'ghidra', 'ghidra-scripts', 'pwn', 'reverse-engineering'] -> cybersecurity (Similarity: 0.4374)
['boilerplate', 'cqrs', 'ddd', 'eventsourcing', 'eventstore', 'graphql', 'hacktoberfest', 'microservice', 'nestjs', 'nodejs', 'saga', 'typescript'] -> web-development (Similarity: 0.4259)
['binary-exploitation', 'php-internals', 'zend-engine'] -> system (Similarity: 0.3317)
['attack-surface-management', 'biu', 'biu-asm', 'easm', 'security'] -> cybersecurity (Similarity: 0.5581)
['github', 'leakage', 'security'] -> cybersecurity (Similarity: 0.5348)
['autoscan', 'scanner', 'security', 'security-audit', 'security-vulnerability', 'sqlmap', 'sqlmap-webui', 'sqlmapapi'] -> cybersecurity (Similarity: 0.5043)


  0%|          | 324/185876 [00:00<07:43, 400.12it/s]

['cfmm', 'mathematics', 'mev', 'research', 'resources', 'smt', 'solidity'] -> data-science (Similarity: 0.5596)
['amm', 'awesome-list'] -> artificial-intelligence (Similarity: 0.3006)
['awesome-list', 'derivatives'] -> artificial-intelligence (Similarity: 0.2693)
['blockchain', 'ethereum', 'protocol'] -> blockchain (Similarity: 0.8425)
['css', 'demo', 'geeks', 'hackers', 'html', 'javascript', 'portfolio', 'portfolio-template', 'programmer', 'resume', 'website'] -> web-development (Similarity: 0.5088)
['deprecated'] -> education (Similarity: 0.2878)
['0x', 'ethereum'] -> blockchain (Similarity: 0.5548)
['0x', 'dapp', 'ethereum', 'golang', 'libp2p', 'webassembly', 'webrtc'] -> blockchain (Similarity: 0.4827)
['0x', 'erc20', 'erc721', 'ethereum', 'exchange'] -> system (Similarity: 0.5021)
['bruteforce', 'bugbounty', 'dirsearch', 'ffuf', 'fuzz', 'fuzz4bounty', 'wordlist'] -> system (Similarity: 0.3648)
['bug-bounty', 'bugbounty', 'enumeration', 'onliner-scripts', 'subdomain-enumeration'] -

  0%|          | 418/185876 [00:01<07:11, 429.59it/s]

['django', 'django-admin', 'django-api', 'django-application', 'django-apps', 'django-rest', 'django-rest-framework', 'django-user', 'django-user-management', 'django2', 'hacktoberfest', 'otp', 'otp-verification', 'python', 'registration-system', 'rest-api', 'signup-flow', 'user-management'] -> blockchain (Similarity: 0.2842)
['ant-design-vue', 'codegenerator', 'composition-api', 'element-plus', 'element-ui', 'java', 'low-code', 'smart', 'spring-boot', 'spring-cloud', 'springboot', 'typescript', 'vue', 'vue3'] -> system (Similarity: 0.4508)
['chai', 'circleci', 'cypress', 'docker', 'emberjs', 'hacktoberfest', 'hapijs', 'knexjs', 'mocha', 'nock', 'nodejs', 'npm', 'postgresql', 'scalingo', 'sinonjs'] -> system (Similarity: 0.4198)
['glcm', 'histogram', 'image', 'image-processing', 'lbp', 'py-lbp', 'python', 'python-glcm-lbp', 'rgb', 'rgb-histogram'] -> computer-vision (Similarity: 0.5623)
['beego', 'redis', 'rpcx', 'shiro'] -> system (Similarity: 0.4007)
['prometheus-chinese', 'prometheu

  0%|          | 538/185876 [00:01<06:05, 507.00it/s]

['es6', 'javascript', 'tutorial'] -> web-development (Similarity: 0.4302)
['2d-game-framework', 'game-development', 'game-engine', 'game-frameworks', 'gamedev', 'rust'] -> web-development (Similarity: 0.4217)
['irt', 'psychometrics', 'python'] -> artificial-intelligence (Similarity: 0.4902)
['android', 'call', 'car', 'didi', 'java', 'map', 'mobile', 'nfc', 'ocr', 'rfid', 'uber'] -> system (Similarity: 0.4883)
['frontend', 'javascript', 'library', 'web', 'webdev'] -> web-development (Similarity: 0.6867)
['a11y', 'accessibility', 'best-practices'] -> computer-vision (Similarity: 0.3769)
['analytics', 'analytics-dashboard', 'dap', 'statistics', 'traffic'] -> data-science (Similarity: 0.5500)
['18f', 'css', 'frontend', 'guide', 'guild', 'html', 'javascript'] -> web-development (Similarity: 0.4866)
['civic-tech', 'identity', 'identity-provider', 'oidc', 'rails'] -> system (Similarity: 0.4442)
['cropper', 'image', 'imagecropper', 'mpvue', 'shear', 'uni-app', 'wechat', 'wepy'] -> computer-vis

  0%|          | 634/185876 [00:01<07:15, 425.28it/s]

['app', 'editor', 'guitar', 'html5', 'javascript', 'midi', 'music', 'scales', 'synth', 'synthesizer', 'tablature', 'tablature-parser', 'tabs', 'toy', 'tuna', 'web-app'] -> system (Similarity: 0.4514)
['app', 'canvas', 'drawing', 'editor', 'html5', 'image', 'image-editing', 'image-editor', 'image-manipulation', 'javascript', 'jspaint', 'ms-paint', 'mspaint', 'online', 'paint', 'painting', 'remake', 'retro', 'web-app', 'web-application'] -> computer-vision (Similarity: 0.5205)
['cli', 'command', 'command-history', 'command-line', 'command-line-app', 'console', 'console-substitute', 'html', 'html5', 'javascript', 'log', 'web'] -> web-development (Similarity: 0.4572)
['ansi-art', 'ansi-editor', 'artscene', 'ascii-art', 'bbs', 'drawing', 'image', 'image-editor', 'irc', 'mirc', 'mspaint', 'paint', 'pixel-art', 'pixel-editor', 'terminal', 'text-art', 'textual', 'tui'] -> computer-vision (Similarity: 0.5281)
['openrazer', 'razer', 'razer-macos'] -> system (Similarity: 0.3354)
['beta-vae', 'cel

  0%|          | 740/185876 [00:01<06:34, 469.80it/s]

['github', 'github-api', 'github-extension'] -> web-development (Similarity: 0.2611)
['blog-engine', 'haskell', 'jekyll', 'latex', 'static-site-generator'] -> web-development (Similarity: 0.4350)
['vm', 'vmware', 'vmwareworkstation', 'workstation', 'workstation16'] -> system (Similarity: 0.3503)
['cop', 'cops', 'copwatch', 'justice', 'police', 'police-brutality', 'police-reports'] -> cybersecurity (Similarity: 0.4294)
['chrome-extension', 'hacktoberfest'] -> web-development (Similarity: 0.2490)
['binary', 'binary-exploitation', 'c', 'cpp', 'ghidra', 'ghidra-decompiler', 'ghidra-extension', 'python', 'reverse-engineering', 'vulnerability'] -> cybersecurity (Similarity: 0.4846)
['css', 'html', 'java', 'java8', 'javascript', 'mongodb', 'mysql', 'nodejs', 'vue'] -> web-development (Similarity: 0.5338)
['alpinejs', 'postcss', 'snowpack', 'tailwindcss'] -> system (Similarity: 0.3973)
['android', 'animation', 'compose-animation', 'jetpack-compose', 'kotlin'] -> computer-vision (Similarity: 0.

  0%|          | 812/185876 [00:01<05:45, 535.86it/s]

['authentication', 'ruby', 'security', 'two-factor', 'twofactorauth'] -> cybersecurity (Similarity: 0.4960)
['android-app', 'authentication', 'authenticator', 'c-sharp', 'ios-app', 'linux-app', 'password', 'totp', 'uwp-apps', 'windows-10'] -> system (Similarity: 0.3633)
['documentation', 'documentation-generator', 'documentation-tool', 'graphql'] -> web-development (Similarity: 0.3451)
['audio', 'html5', 'javascript', 'lu-yin', 'mp3', 'pcm', 'recorder', 'typescript', 'wav', 'web', 'webaudio'] -> web-development (Similarity: 0.4738)
['javascript', 'leaflet', 'map', 'webmaps'] -> web-development (Similarity: 0.4585)
['automation', 'webdriver', 'windows', 'winium'] -> system (Similarity: 0.3991)
['tvbox'] -> system (Similarity: 0.3162)
['devicons', 'github', 'portfolio', 'projects-list', 'showcase', 'vanilla-js', 'website'] -> web-development (Similarity: 0.4500)
['chroot', 'container', 'cross-architecture'] -> system (Similarity: 0.4511)
['command-line', 'console-application', 'haskell',

  0%|          | 919/185876 [00:02<06:34, 469.24it/s]

['components', 'mobile-ui', 'react', 'react-mobile', 'ui-library', 'vant'] -> system (Similarity: 0.3586)
['live', 'react', 'redux', 'tv', 'webpack'] -> education (Similarity: 0.4170)
['javascript', 'lizmap', 'openlayers', 'php', 'qgis', 'qgis-server'] -> web-development (Similarity: 0.4862)
['recordview', 'slide-to-cancel', 'swipe', 'whatsapp'] -> computer-vision (Similarity: 0.2867)
['core-data', 'coredata', 'nspersistentcontainer'] -> data-science (Similarity: 0.3637)
['alamofire', 'carthage', 'cocoapods', 'mocking', 'moya', 'networking', 'nsurlsession', 'stubbing', 'swift'] -> education (Similarity: 0.4187)
['carthage', 'cocoapods', 'core-data', 'coredata', 'json', 'restkit', 'swift', 'sync'] -> cloud-computing (Similarity: 0.4067)
['imageviewer', 'ios', 'lightbox', 'swift', 'viewer'] -> computer-vision (Similarity: 0.4230)
['book', 'mysql', 'php', 'study'] -> data-science (Similarity: 0.5271)
['eternal-blue-exploits', 'hacking', 'hacktoberfest', 'python', 'security'] -> cybersecur

  1%|          | 967/185876 [00:02<06:43, 458.04it/s]

['kubelet', 'kubernetes', 'security'] -> cybersecurity (Similarity: 0.4557)
['react', 'redux', 'router'] -> blockchain (Similarity: 0.3855)
['frida'] -> cybersecurity (Similarity: 0.1830)
['debug', 'lldb', 'reverse-engineering'] -> data-science (Similarity: 0.4382)
['bev-perception', 'bird-eye-view', 'deep-learning', 'transformer', 'vision-transformer'] -> computer-vision (Similarity: 0.6844)
['breathecode', 'exercise', 'exercises', 'gitpod', 'practice', 'python', 'python-autograded', 'python-beginners', 'python-exercises', 'python-interactive', 'python-interactive-exercises', 'python-interactive-tutorial', 'python-programming-exercises', 'python-tutorial', 'python-tutorials', 'tutorial', 'tutorial-code', 'tutorial-exercises', 'tutoriales', 'tutorials'] -> artificial-intelligence (Similarity: 0.3415)
['exercise', 'learn-reactjs', 'learn-to-code', 'react-autograded', 'react-exercise', 'react-interactive-tutorial', 'react-tutorial', 'reactjs', 'reactjs-exercises', 'reactjs-tutorial'] -> 

  1%|          | 1057/185876 [00:02<07:34, 406.94it/s]

['cocoapods', 'greedo-layout', 'ios', 'layout', 'library', 'objective-c', 'uicollectionview'] -> computer-vision (Similarity: 0.3622)
['docx', 'docx-preview', 'excel', 'pdf', 'pdf-preview', 'pdf-viewer', 'vue', 'xlsx', 'xlsx-preview'] -> computer-vision (Similarity: 0.3105)
['braille', 'dithering', 'greyscale', 'image-processing', 'javascript', 'webapp', 'website'] -> computer-vision (Similarity: 0.5848)
['3d-printing', 'keyboard', 'openscad'] -> computer-vision (Similarity: 0.4198)
['cloud-native', 'cloud-native-platform', 'devops', 'dhorse', 'istio', 'jenkins', 'k8s', 'kubernetes', 'kubesphere', 'multi-cluster', 'rainbond', 'service-mesh'] -> cloud-computing (Similarity: 0.5546)
['51bitquant', 'algorithmic-trading', 'ccxt', 'cryptocurrency', 'gekko', 'high-frequency-trading', 'klines', 'marketmaker', 'python', 'quant', 'quantitative-finance', 'trading', 'trading-bot', 'trading-strategies', 'tradingview', 'vnpy'] -> blockchain (Similarity: 0.5233)
['51bitquant', 'algo-trading', 'algor

  1%|          | 1146/185876 [00:02<07:27, 412.49it/s]

['acpi', 'acpi-hotpatches', 'asl', 'hackintosh', 'hotpach', 'macos', 'oclp', 'opencore', 'sequoia-hackintosh', 'sleep', 'sonoma-hackintosh', 'ssdt', 'ventura-hackintosh', 'wake'] -> system (Similarity: 0.4363)
['11ty', '11ty-template', 'eleventy', 'eleventy-template', 'sass', 'sass-boilerplate'] -> system (Similarity: 0.3474)
['css'] -> system (Similarity: 0.4102)
['11ty', 'community', 'css', 'design', 'hacktoberfest', 'modern-css', 'style-stage'] -> system (Similarity: 0.4968)
['browser-support', 'css', 'css-support', 'feature-detection', 'modern-css', 'styles', 'testing'] -> computer-vision (Similarity: 0.4405)
['dark-theme', 'darktheme', 'pyqt', 'pyqt5', 'pyqt6', 'pyside', 'pyside2', 'pyside6', 'python', 'qdarkstyle', 'qt', 'style', 'stylesheet', 'theme'] -> system (Similarity: 0.4037)
['express-middleware', 'expressjs', 'hmr', 'hot-reloading', 'isomorphic', 'javascript', 'node', 'nodejs', 'react', 'reactjs', 'server-rendered', 'ssr', 'universal-applications', 'webpack', 'webpack-bu

  1%|          | 1232/185876 [00:02<07:39, 402.12it/s]

['360', 'css', 'w3c', 'web'] -> system (Similarity: 0.5220)
['dht', 'dhtspider', 'magnet', 'nodejs', 'torrent'] -> blockchain (Similarity: 0.4937)
['chat', 'chatbot', 'chatgpt', 'openai', 'react'] -> artificial-intelligence (Similarity: 0.3528)
['ctf', 'dict', 'fuzz', 'scan', 'scanner'] -> system (Similarity: 0.4432)
['masscan', 'nmap'] -> data-science (Similarity: 0.3285)
['client', 'data-analytics', 'druid', 'nodejs'] -> data-science (Similarity: 0.4956)
['cheatsheet', 'malware-analysis', 'malware-research', 'reverse-engineering', 'syscalls', 'systems-programming', 'win32-api', 'windows', 'windows-10', 'windows-11', 'windows-api', 'windows-internals'] -> system (Similarity: 0.4683)
['radiogroup', 'segmentcontrol', 'selector'] -> system (Similarity: 0.3790)
['android', 'ios', 'react-native', 'stock', 'yahoo-finance'] -> blockchain (Similarity: 0.4041)
['cats-effect', 'config', 'dependency-injection', 'distage-testkit', 'fp-testing', 'framework', 'generative', 'izumi', 'logger', 'loggi

  1%|          | 1322/185876 [00:03<07:15, 424.25it/s]

['autotitle', 'bert', 'crf', 'gpt2', 'ner', 'pytorch', 'roberta', 'seq2seq', 't5-model', 'text-classification', 'unilm'] -> artificial-intelligence (Similarity: 0.4944)
['android', 'whatsapp', 'whatsapp-web'] -> cloud-computing (Similarity: 0.2936)
['md'] -> system (Similarity: 0.2460)
['cloudmusic', 'music', 'music-player', 'pc', 'ui', 'wpf'] -> system (Similarity: 0.4929)
['dmskin', 'mvvm', 'ui', 'wpf', 'wpf-controls', 'wpf-styles', 'wpf-ui', 'wpfstyle', 'wpfui'] -> system (Similarity: 0.2757)
['desktop', 'dmskin', 'dynamicwallpaper', 'livewallpaper', 'ui', 'video', 'vlc', 'wallpaper', 'wallpapers', 'wpf'] -> computer-vision (Similarity: 0.4195)
['blog', 'java', 'mysql', 'simplewebserver'] -> web-development (Similarity: 0.5461)
['kaiyan', 'kotlin', 'mvp', 'retorfit', 'rxjava'] -> system (Similarity: 0.3425)
['96boards', 'documentation', 'jekyll'] -> system (Similarity: 0.4256)
['gdnative', 'gdnative-plugin', 'gdscript', 'godot', 'godot-engine', 'godotengine', 'linux', 'native-dialog

  1%|          | 1414/185876 [00:03<07:38, 402.40it/s]

['curses', 'ncurses', 'terminal', 'terminal-colors', 'tui', 'user-interface', 'widgets', 'xterm'] -> system (Similarity: 0.4820)
['adventure', 'dungeon-crawler', 'game', 'ocaml', 'open-world', 'opengl', 'procedural', 'roguelike'] -> artificial-intelligence (Similarity: 0.4386)
['android', 'android-application', 'android-platform', 'ed2k', 'emule', 'java', 'kad', 'peer-to-peer'] -> system (Similarity: 0.4168)
['cheatsheet', 'cybersecurity', 'enumeration', 'hacking', 'linux', 'mitre-attack', 'payload', 'penetration-testing', 'pentest', 'pentest-tools', 'red-team', 'red-team-tools', 'redteam', 'resources', 'security-tools', 'tools', 'windows'] -> cybersecurity (Similarity: 0.6021)
['bioinformatics', 'computational-biology', 'deep-learning', 'dgl', 'drug-discovery', 'gene-regulatory-networks', 'geometric-deep-learning', 'graph-neural-networks', 'interactome', 'interactomics', 'ppi-networks', 'protein', 'protein-data-bank', 'protein-design', 'protein-structure', 'python', 'pytorch', 'pytorc

  1%|          | 1496/185876 [00:03<07:53, 389.05it/s]

['bard-api', 'chatgpt', 'google', 'midjourney-api', 'spark', 'stable-diffusion'] -> data-science (Similarity: 0.3898)
['java', 'javascript'] -> web-development (Similarity: 0.4615)
['buider', 'drag', 'element-ui', 'h5editor', 'javascript', 'plugins', 'poster', 'vue', 'vuejs2'] -> system (Similarity: 0.4271)
['ip-czipdata', 'ip-mysql', 'ip-sql', 'python'] -> cybersecurity (Similarity: 0.3459)
['android', 'ios', 'ml', 'ml-kit', 'ml-kit-vision', 'react-native'] -> computer-vision (Similarity: 0.4422)
['development', 'esbuild', 'esbuild-node', 'nodejs', 'openlibrary', 'ts-node', 'tsnode'] -> web-development (Similarity: 0.4247)
['bug', 'error', 'exception-handler', 'openlibrary', 'react', 'react-native'] -> system (Similarity: 0.3474)
['angular', 'angular-filters', 'filter', 'ng-pipes'] -> computer-vision (Similarity: 0.2280)
['cheat-sheets', 'cheatsheet', 'go', 'golang'] -> artificial-intelligence (Similarity: 0.3170)
['go', 'markdown', 'markdown-processor', 'processor'] -> system (Simila

  1%|          | 1578/185876 [00:03<07:43, 397.46it/s]

['awesome', 'awesome-list', 'books', 'compiler', 'interpreter', 'list', 'programming-language', 'resources', 'runtime', 'virtual-machine'] -> artificial-intelligence (Similarity: 0.5087)
['api', 'chatgpt', 'client', 'coroutines', 'dall-e', 'gpt', 'kotlin', 'llm', 'multiplatform', 'openai', 'whisper'] -> system (Similarity: 0.4224)
['approximate-bayesian-inference', 'gaussian-processes', 'jax', 'machine-learning', 'markov-gps', 'signal-processing', 'sparse-gps', 'state-space-models'] -> artificial-intelligence (Similarity: 0.5579)
['cnn', 'computer-vision', 'deep-learning', 'image-matching', 'python', 'pytorch'] -> computer-vision (Similarity: 0.7683)
['confidence', 'deep-learning', 'evidence', 'neural-network', 'neurips-2020', 'pytorch', 'tensorflow', 'uncertainty'] -> artificial-intelligence (Similarity: 0.6589)
['animation', 'css', 'css3-support', 'javascript', 'jquery', 'jquery-plugin', 'marquee'] -> computer-vision (Similarity: 0.3697)
['ai', 'chatbot', 'chatgpt', 'cli', 'go', 'gol

  1%|          | 1688/185876 [00:04<06:35, 465.76it/s]

['authentication', 'authorization', 'django', 'django-rest-framework', 'passwordless', 'python3'] -> cybersecurity (Similarity: 0.3994)
['android', 'cross-platform', 'dart', 'flutter', 'ios'] -> system (Similarity: 0.3406)
['analytics', 'endpoint-manager', 'intune', 'macos', 'mdm', 'microsoft', 'powershell', 'powershell-script', 'windows'] -> system (Similarity: 0.5146)
['data-science', 'data-visualization', 'python3', 'visualization'] -> data-science (Similarity: 0.7533)
['database', 'gps', 'gps-tracker', 'indieweb', 'p3k'] -> data-science (Similarity: 0.3779)
['indieauth', 'indieweb', 'oauth'] -> blockchain (Similarity: 0.3594)
['corelocation', 'gps', 'gps-tracker', 'gpslogger', 'hacktoberfest', 'ios', 'trip'] -> computer-vision (Similarity: 0.3585)
['indieweb', 'instagram', 'micropub', 'photos'] -> data-science (Similarity: 0.3779)
['indieweb', 'micropub', 'p3k'] -> blockchain (Similarity: 0.3646)
['authentication', 'phoenix'] -> cybersecurity (Similarity: 0.3599)
['aws', 'dynamodb'

  1%|          | 1792/185876 [00:04<06:37, 463.40it/s]

['ascii-game', 'battleship', 'bsdgames', 'c', 'checkers', 'curses', 'fifteen-puzzle', 'game', 'games', 'maze', 'minesweeper', 'minimal', 'plan9', 'portable', 'public-domain', 'puzzle-game', 'reversi', 'sudoku', 'terminal', 'terminal-game'] -> system (Similarity: 0.5505)
['bot', 'discord', 'discord-api', 'eris', 'nodejs'] -> artificial-intelligence (Similarity: 0.3848)
['leaks-test', 'pytest-plugin', 'trace-resource-leaks'] -> cybersecurity (Similarity: 0.1961)
['lane-detection', 'lanenet', 'ros'] -> system (Similarity: 0.4611)
['abap', 'backend', 'erp', 'excel', 'excel-export', 'excel-import', 'excelgenerator', 'excelreader', 'excelwriter', 'hacktoberfest', 'open-source', 'sap', 'sap-netweaver'] -> data-science (Similarity: 0.4059)
['abap', 'abapgit', 'git-client', 'hacktoberfest', 'platform', 'sap', 'sap-gui'] -> cybersecurity (Similarity: 0.4270)
['abap', 'abaplint', 'code-quality-analyzer', 'hacktoberfest', 'linter', 'static-analysis', 'static-code-analysis'] -> data-science (Simila

  1%|          | 1886/185876 [00:04<07:26, 411.62it/s]

['forensic-examinations', 'forensics', 'investigation', 'windows'] -> data-science (Similarity: 0.4433)
['abell', 'abelljs', 'hacktoberfest', 'javascript', 'static-site-generator'] -> web-development (Similarity: 0.3853)
['inference', 'nlp', 'nlp-machine-learning', 'onnx', 'onnxruntime', 'sentiment-analysis', 'summarization', 'text-classification', 'text-generation', 'transformer', 'transformers', 'translation'] -> artificial-intelligence (Similarity: 0.5968)
['fmp4', 'go', 'golang', 'mp4', 'mp4box'] -> system (Similarity: 0.3152)
['curl', 'encryption', 'friends', 'gpg', 'hacktoberfest', 'shell', 'storage', 'transfer', 'wsend-gpg'] -> system (Similarity: 0.4537)
['mpvue', 'uni-app', 'vue'] -> education (Similarity: 0.3440)
['llvm', 'llvm-pass', 'tutorial'] -> artificial-intelligence (Similarity: 0.3013)
['disassembler', 'elf', 'reverse-engineering'] -> artificial-intelligence (Similarity: 0.3985)
['distillation', 'kd', 'kd-methods', 'knowledge-distillation', 'knowledge-transfer', 'mode

  1%|          | 1970/185876 [00:04<07:41, 398.43it/s]

['crawler', 'fuzzing', 'hacking', 'hacking-tool', 'information-gathering', 'lfi', 'networking', 'offensive-security', 'osint', 'pentesting', 'port-scanner', 'python', 'rfi', 'scanner', 'scrapy', 'security', 'sqlite', 'ssl-inspection', 'vault', 'xss-vulnerability'] -> cybersecurity (Similarity: 0.6225)
['airflow', 'data-engineering', 'datascience', 'devops', 'infrastructure', 'machine-learning', 'mlops', 'spark'] -> data-science (Similarity: 0.7117)
['client', 'gmail', 'gmail-api', 'gmail-client', 'gmail-login', 'google-api-client-library', 'python', 'python3'] -> blockchain (Similarity: 0.3155)
['deep-learning', 'deep-neural-networks', 'neural-networks', 'pytorch', 'tez'] -> artificial-intelligence (Similarity: 0.6412)
['awesome', 'awesome-list', 'github', 'github-profile-readme', 'github-readme', 'portfolio', 'profile-readme'] -> cloud-computing (Similarity: 0.2793)
['classification', 'deeplearning', 'fashion', 'keras', 'regression', 'vgg16'] -> data-science (Similarity: 0.5328)
['dee

  1%|          | 2062/185876 [00:04<07:19, 417.95it/s]

['completion', 'counsel', 'emacs', 'ivy', 'search', 'swiper'] -> system (Similarity: 0.4678)
['jquery', 'json'] -> blockchain (Similarity: 0.3396)
['compressed-data', 'crawler', 'html', 'java', 'json', 'jsoup', 'tw', 'vfs', 'xml'] -> data-science (Similarity: 0.4771)
['crates', 'http', 'multipart', 'rust'] -> system (Similarity: 0.4476)
['fast-multipole-method', 'hierarchical-matrices', 'meshless', 'molecular-dynamics', 'neighbour-search', 'particles', 'radial-basis-function', 'smoothed-particle-hydrodynamics'] -> computer-vision (Similarity: 0.3587)
['bower', 'javascript', 'jquery', 'jquery-plugin', 'performance-sticky-sidebars', 'scrolling', 'sticky-sidebar'] -> blockchain (Similarity: 0.2929)
['cpe', 'cve', 'cvss', 'nvd', 'ossindex', 'osv', 'package-url', 'purl', 'security', 'security-tools', 'snyk', 'vulndb', 'vulnerability', 'vulnerability-database', 'vulnerability-databases', 'vulnerability-detection', 'vulnerability-identification', 'vulnerability-scanners'] -> cybersecurity (Si

  1%|          | 2180/185876 [00:05<06:31, 469.67it/s]

['amazon-elasticsearch', 'aws', 'elasticsearch', 'iam-role', 'proxy', 'sign'] -> cloud-computing (Similarity: 0.4110)
['c', 'diablo', 'diablo2', 'game-engine'] -> system (Similarity: 0.4493)
['diablo', 'diablo2', 'diablo2lod', 'lua'] -> system (Similarity: 0.3093)
['lua', 'lunarvim', 'lvim', 'neovim', 'nvim', 'vim'] -> system (Similarity: 0.2987)
['android-application', 'dynamic-analysis', 'security-analysis', 'xposed'] -> cybersecurity (Similarity: 0.4393)
['dnslog', 'hyuga', 'out-of-band'] -> blockchain (Similarity: 0.3046)
['devtools', 'github', 'github-api', 'laravel', 'laravel-5-package', 'llum', 'php'] -> web-development (Similarity: 0.4227)
['analytics', 'awesome-list', 'data-mining', 'data-science', 'data-scientists', 'data-visualization', 'deep-learning', 'hacktoberfest', 'machine-learning', 'science'] -> data-science (Similarity: 0.8523)
['autobot', 'onmyoji', 'python'] -> artificial-intelligence (Similarity: 0.4816)
['web-development'] -> web-development (Similarity: 1.0000)

  1%|          | 2284/185876 [00:05<06:31, 468.85it/s]

['android', 'appstore', 'jetpack-compose', 'kotlin', 'material-design', 'material3', 'privacy', 'security'] -> cybersecurity (Similarity: 0.4482)
['book', 'chinese', 'computer-vision', 'deep-learning', 'jupyter-notebook', 'machine-learning', 'natural-language-processing', 'notebook', 'python'] -> artificial-intelligence (Similarity: 0.6960)
['ace', 'ace-editor', 'diff', 'diffing', 'rich-text-editor'] -> artificial-intelligence (Similarity: 0.3016)
['dice-coefficient', 'javascript', 'string-comparison', 'string-similarity', 'strings'] -> artificial-intelligence (Similarity: 0.3552)
['leetcode', 'leetcode-solutions'] -> artificial-intelligence (Similarity: 0.2228)
['arp-scan', 'arp-scanner', 'intrusion-detection', 'monitoring', 'network-security', 'self-hosted', 'selfhosted'] -> cybersecurity (Similarity: 0.5250)
['4a-gigabit', 'firmware', 'miwifi-3c', 'openwrt', 'router', 'routers', 'xiaomi', 'xiaomi-routers'] -> system (Similarity: 0.3049)
['arrow', 'crossovers', 'episodes', 'python', 

  1%|▏         | 2407/185876 [00:05<05:46, 529.07it/s]

['voodooinput', 'voodoops2'] -> system (Similarity: 0.3015)
['whatevergreen'] -> education (Similarity: 0.2568)
['angular', 'angularjs', 'component-library', 'hybrid-apps', 'ionic', 'ionic-plugin', 'javascript', 'javascript-library', 'jquery', 'mobile-web', 'mobiscroll', 'react', 'ui-components', 'ui-kit'] -> web-development (Similarity: 0.3996)
['ai', 'audio', 'deep-learning', 'generative-model', 'neural-network'] -> artificial-intelligence (Similarity: 0.7168)
['icons', 'world-of-warcraft'] -> artificial-intelligence (Similarity: 0.3564)
['cli-addon-updater', 'world-of-warcraft'] -> cybersecurity (Similarity: 0.2232)
['bitcoin', 'scala'] -> blockchain (Similarity: 0.5749)
['android', 'bitcoin', 'blockchain', 'cryptocurrency', 'eclair', 'lightning', 'lightning-network', 'payments'] -> blockchain (Similarity: 0.7725)
['bitcoin', 'blockchain', 'cryptocurrency', 'eclair', 'lightning', 'lightning-network', 'payments'] -> blockchain (Similarity: 0.7857)
['bitcoin', 'kotlin', 'lightning', '

  1%|▏         | 2525/185876 [00:05<05:39, 540.00it/s]

['cli-app', 'expressjs', 'graphql', 'graphql-server', 'javascript', 'proxy', 'rest-api', 'typescript'] -> web-development (Similarity: 0.4405)
['graphql', 'javascript', 'javascript-library', 'typescript'] -> web-development (Similarity: 0.4062)
['api', 'mexico', 'zip-codes'] -> education (Similarity: 0.3208)
['terrain', 'unity', 'unity-terrain', 'virtual-textures'] -> computer-vision (Similarity: 0.3817)
['directx12', 'flow-map', 'fluid-simulation', 'imgui', 'river', 'river-renderer', 'water', 'wave-particles'] -> computer-vision (Similarity: 0.4285)
['atomic-css', 'atomizer', 'css', 'functional-css', 'utility-css'] -> system (Similarity: 0.3446)
['w3c', 'wcag'] -> system (Similarity: 0.3205)
['actframework', 'ebean', 'hot-reload', 'java', 'java-web', 'mongodb', 'morphia', 'mvc', 'mvc-framework', 'mvc-frameworks', 'restful', 'restful-framework', 'web-framework', 'webframework'] -> web-development (Similarity: 0.5880)
['engine', 'gamification', 'gamification-engine', 'gamification-frame

  1%|▏         | 2638/185876 [00:06<05:54, 516.34it/s]

['actor-model', 'actors', 'async', 'caf', 'pattern-matching'] -> artificial-intelligence (Similarity: 0.5230)
['actorcloud', 'aep', 'dmp', 'flask', 'iot', 'iot-platform', 'lora', 'lwm2m', 'modbus', 'mqtt', 'rules-engine', 'vue'] -> system (Similarity: 0.4733)
['generic', 'gui-toolkit', 'immediate-gui', 'sdl2', 'simple'] -> system (Similarity: 0.4513)
['budgeting', 'finance', 'money', 'personal-finance'] -> education (Similarity: 0.4791)
['amqp', 'background', 'background-jobs', 'celery', 'celery-client', 'celery-protocol', 'celery-workers', 'job-queue', 'queue', 'queue-workers', 'queued-jobs', 'task-manager', 'task-queue', 'task-runner', 'worker', 'worker-queue', 'workers'] -> system (Similarity: 0.3844)
['docker', 'docker-compose', 'mapping', 'openstreetmap', 'openstreetmap-data', 'tile-server'] -> cloud-computing (Similarity: 0.3908)
['deep-reinforcement-learning', 'drl', 'gazebo', 'gym', 'reinforcement-learning', 'rl', 'robotics', 'ros', 'ros2'] -> artificial-intelligence (Similarit

  1%|▏         | 2745/185876 [00:06<05:55, 515.30it/s]

['arduino', 'arduino-library', 'ina219', 'library', 'power'] -> system (Similarity: 0.4976)
['adafruit-io', 'iot', 'python', 'raspberry-pi'] -> cloud-computing (Similarity: 0.4617)
['arduino-library'] -> computer-vision (Similarity: 0.2041)
['arduino-library'] -> computer-vision (Similarity: 0.2041)
['arduino-library'] -> computer-vision (Similarity: 0.2041)
['arduino-library'] -> computer-vision (Similarity: 0.2041)
['arduino', 'arduino-library', 'library', 'sensor'] -> system (Similarity: 0.4544)
['arduino-library'] -> computer-vision (Similarity: 0.2041)
['arduino-library'] -> computer-vision (Similarity: 0.2041)
['arduino-library'] -> computer-vision (Similarity: 0.2041)
['adafruit', 'arduino', 'arduino-library', 'tinyusb', 'usb'] -> system (Similarity: 0.4224)
['arduino-library'] -> computer-vision (Similarity: 0.2041)
['arduino-library'] -> computer-vision (Similarity: 0.2041)
['adafruit', 'awesome', 'awesome-list', 'circuitpython', 'embedded', 'iot', 'micropython', 'python'] -> 

  2%|▏         | 2865/185876 [00:06<05:30, 553.55it/s]

['anchor', 'keras', 'keras-yolov3-mobilenet', 'mobilenet', 'object-detection', 'tensorflow', 'vgg16', 'yolo', 'yolov3'] -> computer-vision (Similarity: 0.4863)
['powershell', 'selenium', 'web-testing'] -> web-development (Similarity: 0.4983)
['hacktoberfest', 'powershell', 'python'] -> cybersecurity (Similarity: 0.4376)
['dataframe', 'gui', 'pandas', 'viewer'] -> system (Similarity: 0.4532)
['captive', 'captive-portal', 'esp-12', 'esp8266', 'hack', 'nodemcu', 'nodemcu-arduino', 'password', 'phishing', 'portal', 'wifi', 'wifi-hacking', 'wifi-password'] -> cybersecurity (Similarity: 0.4387)
['esp8266', 'fake', 'node-mcu', 'sign-in', 'wifi-captive-portal'] -> cybersecurity (Similarity: 0.3159)
['aireplay', 'automatic', 'deauth', 'deauthentication', 'deauthentication-attack', 'deauthentication-script', 'deauther', 'hack', 'macchanger', 'mdk', 'mdk3', 'script'] -> cybersecurity (Similarity: 0.4398)
['ios', 'ios15', 'swift', 'swiftui', 'uikit'] -> computer-vision (Similarity: 0.2632)
['azure

  2%|▏         | 2929/185876 [00:06<05:19, 572.75it/s]

['arduino', 'arduino-sketch', 'arduino-uno'] -> computer-vision (Similarity: 0.3534)
['arduino', 'can', 'can-bus', 'car-hacking', 'pyqt5', 'python'] -> system (Similarity: 0.4720)
['behavioral-code-analysis', 'code-analysis-tool', 'repository-mining', 'technical-debt'] -> data-science (Similarity: 0.4548)
['hammerspoon', 'stacks', 'tabbed-layout', 'window-manager', 'yabai'] -> cloud-computing (Similarity: 0.3534)
['ios', 'swift', 'validation', 'validation-library', 'validators'] -> artificial-intelligence (Similarity: 0.3837)
['admin', 'openvpn', 'webapp'] -> web-development (Similarity: 0.4593)
['big-sur', 'firefox', 'firefox-theme', 'macos', 'macos-big-sur', 'safari', 'whitesur-theme', 'windows'] -> system (Similarity: 0.3870)
['cpp14', 'cpp17', 'embedded-string-literals', 'header-only', 'obfuscate', 'obfuscate-strings', 'obfuscation', 'string', 'string-literals', 'string-obfuscation'] -> cybersecurity (Similarity: 0.2986)
['peer-to-peer', 'screencast', 'screensharing', 'webrtc', 'we

  2%|▏         | 3056/185876 [00:06<05:16, 577.17it/s]

['data', 'finance', 'pandas', 'stock-data', 'stock-prices', 'stocks-api'] -> data-science (Similarity: 0.5556)
['audio-recorder', 'getusermedia', 'javascript', 'pcm', 'record-audio', 'wav'] -> computer-vision (Similarity: 0.3908)
['bukkit-plugin', 'discord', 'moss', 'spigot'] -> system (Similarity: 0.3865)
['java'] -> system (Similarity: 0.3842)
['debian', 'dotfiles', 'fluxbox', 'openbox', 'rice', 'theme'] -> system (Similarity: 0.4989)
['debian', 'dotfiles', 'i3', 'rice'] -> system (Similarity: 0.4726)
['critical-css', 'critical-path-css', 'critical-path-styles', 'css', 'inline-css', 'inline-styles'] -> web-development (Similarity: 0.2425)
['auditing-predictive-models', 'discrimination', 'fairness', 'model-criticism', 'prediction-model', 'toolbox'] -> artificial-intelligence (Similarity: 0.4825)
['deep-learning', 'information-retrieval', 'neural-network'] -> artificial-intelligence (Similarity: 0.7009)
['android', 'automation', 'autoreply', 'chatbot', 'facebook', 'facebook-bot', 'mess

  2%|▏         | 3167/185876 [00:07<06:24, 474.66it/s]

['adi1090x', 'arch-linux', 'archcraft', 'bash', 'bash-scripts', 'cron', 'cronjob', 'crontab', 'dynamic-wallpaper', 'linux', 'live-wallpapers', 'pywal', 'timed-wallpaper', 'ubuntu', 'unixporn', 'wallpaper', 'wallpaper-manager', 'wallpaper-set', 'wallpaperengine', 'wallpapers'] -> system (Similarity: 0.3768)
['adi1090x', 'arch-linux', 'archcraft', 'color-schemes', 'debian', 'kitty', 'kitty-cat', 'kitty-terminal', 'linux', 'linux-terminal', 'linux-terminal-emulator', 'terminal', 'terminal-colours', 'terminal-emulator', 'terminal-theme', 'ubuntu', 'unixporn'] -> system (Similarity: 0.4277)
['adi1090x', 'archlinux', 'bootanimation', 'bootsplash', 'bootsplash-theme', 'debian', 'fedora', 'linux', 'plymouth', 'plymouth-bootsplash', 'plymouth-theme', 'plymouth-themes', 'ubuntu', 'unixporn'] -> system (Similarity: 0.4075)
['adi1090x', 'archlinux', 'debian', 'display-manager', 'gdm', 'greeter', 'lightdm', 'linux', 'login-manager', 'lxdm', 'sddm', 'slim', 'slim-themes', 'themes', 'ubuntu', 'unixpo

  2%|▏         | 3221/185876 [00:07<06:12, 490.87it/s]

['travel'] -> education (Similarity: 0.3562)
['adldap', 'auth', 'driver', 'laravel', 'ldap', 'ldap-authentication'] -> blockchain (Similarity: 0.3639)
['active-record', 'ldap', 'php', 'php-ldap', 'query-builder'] -> web-development (Similarity: 0.3222)
['b3log', 'blog', 'bolo', 'bolo-solo', 'docker', 'java', 'solo', 'tomcat'] -> system (Similarity: 0.4995)
['csdn', 'tampermonkey', 'userscript'] -> cybersecurity (Similarity: 0.4494)
['compiler', 'deep-learning', 'docker-images', 'inference', 'inference-engine', 'model-optimizer', 'openvino', 'tensorflow-serving', 'tensorrt'] -> artificial-intelligence (Similarity: 0.5666)
['xapi'] -> artificial-intelligence (Similarity: 0.2528)
['xapi'] -> artificial-intelligence (Similarity: 0.2528)
['c', 'edges', 'facets', 'meshes', 'repair', 'three-d-printing', 'vertices'] -> computer-vision (Similarity: 0.4746)
['admidio', 'club-management', 'documents-manager', 'event-management', 'lists', 'members', 'membership', 'membership-management', 'organiza

  2%|▏         | 3320/185876 [00:07<06:40, 455.35it/s]

['cplusplus', 'documentation-tool', 'jekyll', 'libtooling'] -> artificial-intelligence (Similarity: 0.3339)
['a11y', 'color', 'color-generator', 'color-palette', 'color-palette-generator', 'color-picker', 'color-theme', 'color-theme-switcher', 'color-themes', 'colors', 'colorscheme', 'colorscheme-generator', 'contrast', 'contrast-ratio', 'dark'] -> computer-vision (Similarity: 0.4047)
['lit-element', 'mixin', 'mobx', 'web-components'] -> system (Similarity: 0.3508)
['aem', 'aem64'] -> cybersecurity (Similarity: 0.2841)
['ansible', 'aws', 'azure', 'eks', 'helm', 'helmfile', 'jinja2', 'kubernetes', 'kubernetes-cluster', 'kubernetes-deployment', 'ops', 'packer', 'terraform', 'terraform-files', 'vault'] -> cloud-computing (Similarity: 0.4952)
['accessibility', 'design-systems', 'react', 'react-components', 'ui-components', 'wai-aria'] -> system (Similarity: 0.4198)
['computer-vision', 'customization', 'diffusion-models', 'few-shot', 'fine-tuning', 'pytorch', 'text-to-image-generation'] -> 

  2%|▏         | 3412/185876 [00:07<07:02, 431.70it/s]

['cacert', 'docker-commands', 'docker-container', 'docker-group', 'hacktoberfest', 'shell-script', 'temurin'] -> system (Similarity: 0.3002)
['hacktoberfest', 'homebrew', 'homebrew-tap'] -> cybersecurity (Similarity: 0.3016)
['escape-analysis', 'hotspot', 'hotspot-jit-compiler', 'java', 'javafx', 'jit-compiler', 'jitwatch', 'log-analyser'] -> web-development (Similarity: 0.3327)
['docker-image', 'dockerfile', 'hacktoberfest', 'unofficial-images'] -> cloud-computing (Similarity: 0.2112)
['automation', 'configuration-as-code', 'configuration-management', 'continuous-integration', 'export', 'import', 'jboss', 'json', 'keycloak', 'keycloak-config-cli', 'oauth2', 'rest', 'spring-boot'] -> system (Similarity: 0.4392)
['bash', 'bash-script', 'bashrc', 'linux', 'shell', 'shell-script', 'utility'] -> system (Similarity: 0.3884)
['checklist', 'development-tools', 'docker', 'frontend-web', 'linux', 'nodejs', 'shell', 'toolkits', 'tools'] -> web-development (Similarity: 0.5300)
['adlib', 'adlibemu

  2%|▏         | 3496/185876 [00:07<08:11, 370.88it/s]

['nextjs'] -> web-development (Similarity: 0.2579)
['next14', 'nextjs', 'nextjs14'] -> system (Similarity: 0.2615)
['ai', 'chatgpt'] -> artificial-intelligence (Similarity: 0.5944)
['framer-motion', 'reactjs', 'sanity-io'] -> computer-vision (Similarity: 0.3174)
['react', 'reactjs', 'sanity', 'sanity-io'] -> system (Similarity: 0.3091)
['react', 'reactjs', 'syncfusion', 'syncfusion-ej2'] -> blockchain (Similarity: 0.2733)
['reactjs'] -> blockchain (Similarity: 0.2362)
['nextjs', 'reactjs', 'sanity', 'typescript'] -> web-development (Similarity: 0.2944)
['api', 'javascript', 'rapidapi', 'reactjs'] -> web-development (Similarity: 0.4112)
['react', 'react-project', 'reactjs', 'webrtc'] -> web-development (Similarity: 0.3799)
['smart-contracts', 'solidity', 'web3'] -> blockchain (Similarity: 0.5606)
['avalanche', 'blockchain', 'nft', 'solidity', 'web3'] -> blockchain (Similarity: 0.6862)
['blockchain', 'cranq', 'smart-contracts', 'uniswap-v2', 'web3'] -> blockchain (Similarity: 0.6938)
['m

  2%|▏         | 3536/185876 [00:08<08:03, 376.94it/s]

['hacktoberfest', 'irc', 'irc-client', 'irc-gateway', 'ircd', 'slack', 'slack-gateway'] -> cybersecurity (Similarity: 0.3342)
['c', 'console', 'editor', 'hacktoberfest', 'terminal', 'text', 'text-editor'] -> system (Similarity: 0.4576)
['hacktoberfest', 'performance', 'php', 'profiler'] -> system (Similarity: 0.3913)
['bash', 'command-line', 'developer-tools', 'linux', 'shell', 'zsh'] -> system (Similarity: 0.4232)
['c', 'filesystem', 'linux', 'sandbox'] -> system (Similarity: 0.5877)
['aarch64', 'arm64', 'ghidra', 'java', 'nintendo', 'nintendo-switch', 'nx', 'reverse-engineering', 'switch'] -> system (Similarity: 0.5105)
['jekyll', 'jekyll-site', 'jekyll-theme', 'minimalist'] -> artificial-intelligence (Similarity: 0.3420)
['ja3', 'ja3-signature-creation', 'network-analysis', 'network-monitoring', 'ssldump', 'sslv3', 'tls', 'tls-traffic', 'tls13'] -> cybersecurity (Similarity: 0.3733)
['game-dev', 'game-development', 'gamedev', 'graphics', 'material', 'shader', 'shaders', 'unity', 'un

  2%|▏         | 3627/185876 [00:08<07:35, 400.26it/s]

['2fa', 'android', 'icons', 'svg', 'vector'] -> computer-vision (Similarity: 0.4837)
['encryption-tool', 'filesystem', 'golang', 'secure-storage'] -> cloud-computing (Similarity: 0.4346)
['activitypub', 'android-app', 'fediverse', 'ionic', 'ios-app', 'lemmy', 'link-aggregator', 'pwa', 'universal-app', 'wefwef'] -> blockchain (Similarity: 0.4004)
['angular', 'angular-bindings', 'angular-extension', 'angular-performance', 'javascript'] -> web-development (Similarity: 0.2417)
['aws', 'aws-cdk', 'aws-textract', 'cdk', 'cloudformation', 'data-pipeline', 'dynamodb', 'jest', 'lambda', 'pdf', 'puppeteer', 's3', 'serverless', 'sns', 'textract', 'typescript', 'webscraping'] -> cloud-computing (Similarity: 0.5332)
['brave', 'chrome-extension', 'eslint', 'extension-popup', 'google-chrome', 'jest', 'microsoft-edge-extension', 'mozilla-firefox', 'opera-extension', 'prettier', 'react', 'storybook', 'tailwindcss', 'typescript', 'webpack'] -> web-development (Similarity: 0.3908)
['3d', '3d-designing', 

  2%|▏         | 3710/185876 [00:08<07:34, 400.44it/s]

['aerospike', 'database-driver', 'javascript', 'nodejs', 'nosql'] -> web-development (Similarity: 0.4216)
['element-ui', 'koa2', 'nodejs', 'sequelize', 'vue'] -> web-development (Similarity: 0.3596)
['angular', 'full-stack', 'full-stack-development', 'full-stack-web-developer', 'interview-practice', 'interview-preparation', 'interview-questions', 'interview-test', 'react', 'vuejs'] -> web-development (Similarity: 0.4273)
['html', 'markdown', 'markdown-convertor', 'server'] -> system (Similarity: 0.3922)
['gene-regulatory-network', 'single-cell', 'transcription-factors', 'transcriptomics'] -> data-science (Similarity: 0.3395)
['ci', 'git', 'github', 'gitlab', 'package-manager', 'rust'] -> cybersecurity (Similarity: 0.3561)
['aesara', 'automatic-differentiation', 'optimizing-compiler', 'optimizing-compilers', 'symbolic-computation', 'tensors', 'term-rewriting-system', 'theano', 'transpiler'] -> artificial-intelligence (Similarity: 0.4436)
['admin', 'dashboard', 'ecto', 'elixir', 'phoenix

  2%|▏         | 3809/185876 [00:08<06:51, 442.02it/s]

['flutter', 'flutter-animation', 'flutter-design', 'flutter-login', 'flutter-signup', 'flutter-ui', 'login-page'] -> cloud-computing (Similarity: 0.1516)
['artificial-intelligence', 'deep-learning', 'diffusion', 'image-generation', 'multimodal', 'multimodality', 'openai', 'openai-clip', 'text-to-image', 'text-to-image-synthesis'] -> artificial-intelligence (Similarity: 0.6091)
['c', 'file-manager', 'filemanager', 'sfm', 'simple', 'suckless', 'terminal', 'tty', 'tui'] -> system (Similarity: 0.5050)
['afip', 'afip-api', 'afip-facturas', 'afip-php', 'afip-sdk', 'argentina', 'ayuda', 'cae', 'clase', 'contribuyente', 'ejemplos', 'facturacion-electronica', 'libreria', 'padron', 'php', 'programacion', 'soap', 'webservice', 'wsaa'] -> system (Similarity: 0.4533)
['oled', 'ssd1306', 'ssd1309', 'stm32'] -> system (Similarity: 0.2973)
['beginner-friendly', 'contributions-welcome', 'datascience', 'good-first-issue', 'good-first-pr', 'hacktoberfest', 'machinelearning', 'opensource', 'python'] -> da

  2%|▏         | 3971/185876 [00:08<06:00, 504.21it/s]

['api', 'graphql', 'graphql-api', 'rest-api', 'rick-and-morty', 'rickandmorty'] -> web-development (Similarity: 0.3202)
['angular', 'angular-grid', 'angular-table', 'charting', 'datagrid', 'datatable', 'excel', 'filtering', 'grid', 'grouping', 'javascript-table', 'pagination', 'pivoting', 'react', 'react-grid', 'react-table', 'sorting', 'table', 'vue-table', 'vuejs'] -> data-science (Similarity: 0.4504)
['exploit', 'ldap-authentication', 'nginx', 'nginxday', 'zero-day'] -> blockchain (Similarity: 0.3775)
['aria2', 'bittorrent', 'bt', 'download', 'download-manager', 'electron', 'linux', 'mac', 'macos', 'magnet', 'motrix', 'torrent', 'windows'] -> system (Similarity: 0.4784)
['bird-detection', 'bird-recognition', 'bird-songs', 'bird-species', 'classification', 'convolutional-neural-network', 'datasets', 'review', 'survey'] -> computer-vision (Similarity: 0.5595)
['audio-augmentation', 'augmentation-policies', 'autoaugment', 'data-augmentation', 'data-augmentations', 'data-generation', 'd

  2%|▏         | 4037/185876 [00:09<05:33, 545.16it/s]

['background-jobs', 'ios', 'location', 'tracking'] -> computer-vision (Similarity: 0.4902)
['audio-effect', 'audio-files', 'displayers-audio-visualizers', 'equalizer', 'objective-c', 'objective-c-library', 'pod', 'swift'] -> computer-vision (Similarity: 0.3887)
['agi', 'llm', 'opensource'] -> artificial-intelligence (Similarity: 0.4100)
['bioinformatics', 'pseudotime-algorithms', 'rna-seq', 'single-cell'] -> data-science (Similarity: 0.4817)
['async', 'asynchronous', 'conda', 'cygwin', 'git', 'git-prompt', 'macintosh', 'macos', 'msys2', 'osx', 'prompt', 'shell', 'virtualenv', 'zsh', 'zsh-prompt', 'zsh-theme'] -> system (Similarity: 0.5036)
['autojump', 'command-line-tool', 'filesystem', 'z', 'zsh', 'zsh-plugin'] -> system (Similarity: 0.4303)
['eloquent', 'laravel', 'orm', 'php'] -> system (Similarity: 0.3294)
['async', 'asynchronous', 'fsm', 'go', 'golang', 'networking', 'non-blocking', 'select', 'state-machine', 'websocket'] -> system (Similarity: 0.5161)
['3d', '3d-models', 'awesome

  2%|▏         | 4151/185876 [00:09<05:43, 528.35it/s]

['admin-ui', 'blazor-webassembly', 'docker-cloud', 'dotnet', 'duende-identityserver', 'iam', 'oauth', 'oauth2', 'oauth2-server', 'oidc', 'oidc-server', 'openid', 'openid-connect', 'saml', 'sponsor', 'sso', 'sso-authentication', 'ws-federation'] -> blockchain (Similarity: 0.3786)
['arduino', 'awesome', 'awesome-list', 'awesome-lists', 'esp', 'esp32', 'esp8266', 'espressif', 'iot', 'micropython', 'nodemcu'] -> system (Similarity: 0.4413)
['codeigniter', 'environment', 'htaccess-files', 'nginx', 'php'] -> web-development (Similarity: 0.4122)
['convolutional-neural-networks', 'deep-learning', 'error-level-analysis', 'fake-image-detection', 'image-classification', 'image-tampering-detection'] -> computer-vision (Similarity: 0.6632)
['android', 'animation', 'dashboard-concept', 'transition-animation', 'ui-design', 'ux-design'] -> computer-vision (Similarity: 0.4371)
['grub', 'iso', 'iso-files', 'multiboot', 'usb'] -> system (Similarity: 0.3753)
['github-pages', 'jekyll', 'jekyll-theme'] -> a

  2%|▏         | 4255/185876 [00:09<07:05, 426.85it/s]

['hacktoberfest', 'purple', 'shades-of-purple', 'visual-studio', 'vscode', 'vscode-extension', 'vscode-theme'] -> web-development (Similarity: 0.3028)
['database', 'geographic', 'iran'] -> data-science (Similarity: 0.4555)
['ai-engine', 'bots', 'chatbot', 'chatbotai', 'chatbots', 'python', 'python-chatbot'] -> artificial-intelligence (Similarity: 0.4576)
['blog-theme', 'bootstrap4', 'css', 'multipurpose-ecommerce-template', 'scss'] -> web-development (Similarity: 0.3871)
['assets', 'downloader', 'offline-web-pages', 'scraper'] -> web-development (Similarity: 0.3633)
['action', 'dependabot', 'github'] -> system (Similarity: 0.3986)
['android', 'android-library', 'material-design', 'pressure', 'pressure-status', 'weather-wind', 'wind'] -> system (Similarity: 0.3803)
['api', 'goinsta', 'instagram', 'instagram-api', 'iranian'] -> education (Similarity: 0.3342)
['aws', 'aws-lambda', 'cartoongan', 'cartoonify', 'computer-vision', 'deployment', 'gan', 'machine-learning-production', 'netlify',

  2%|▏         | 4340/185876 [00:09<06:48, 444.39it/s]


['automation', 'gmail', 'script'] -> artificial-intelligence (Similarity: 0.4851)
['animated-gif', 'booru-browser', 'c-plus-plus', 'image-viewer', 'mangareader', 'webm'] -> computer-vision (Similarity: 0.4778)
['animations', 'css-grid', 'transitions'] -> computer-vision (Similarity: 0.4066)
['bundle-analyzer', 'developer-tools', 'javascript', 'performance'] -> web-development (Similarity: 0.4535)
['animation', 'gestures', 'mobile-first', 'mobile-web', 'reactjs'] -> computer-vision (Similarity: 0.4459)
['animation', 'animation-library', 'animejs', 'beginner-friendly', 'comparison', 'popmotion', 'react', 'react-spring'] -> artificial-intelligence (Similarity: 0.3821)
['animation', 'demo', 'flip', 'popmotion', 'react', 'stripe', 'styled-components', 'ui'] -> system (Similarity: 0.4403)
['aqara', 'home-automation', 'mi-home', 'miio', 'miio-protocol', 'mijia', 'xiaomi', 'yeelight'] -> system (Similarity: 0.3736)
['hexo', 'hexo-theme'] -> cybersecurity (Similarity: 0.2323)
['one', 'weapp'] -

KeyboardInterrupt: 