In [2]:
# Search terms for the paper crawl: each entry is sent as one query to the
# search endpoint by the fetch loop, in the order listed here.
cvpr_keywords = [
    # 1. Fundamental vision techniques
    "image classification", "object detection", "bounding box", "YOLO", "Faster R-CNN",
    "semantic segmentation", "instance segmentation", "panoptic segmentation", "DeepLab", "Mask R-CNN",
    "pose estimation", "human keypoints", "2D pose", "3D pose", "OpenPose",
    "object tracking", "multi-object tracking", "MOT", "SORT", "DeepSORT",
    "depth estimation", "monocular depth", "stereo matching",
    "optical flow", "scene flow",

    # 2. 3D and spatial information processing
    "3D reconstruction", "point cloud", "mesh generation", "3D shape", "NeRF",
    "SLAM", "visual SLAM", "RGB-D", "depth sensors", "LiDAR", "ToF",

    # 3. Deep learning and models
    "convolutional neural networks", "ResNet", "VGG", "EfficientNet",
    "Vision Transformer", "ViT", "Swin Transformer", "DETR", "attention",
    "model compression", "network pruning", "quantization", "distillation",
    "self-supervised learning", "contrastive learning", "SimCLR", "MoCo",
    "zero-shot learning", "few-shot learning", "meta-learning",
    "multimodal learning", "vision-language", "CLIP", "VLP", "BLIP",

    # 4. Generation / image processing / synthesis
    "image generation", "GAN", "StyleGAN", "Diffusion model", "image-to-image translation",
    "style transfer", "image enhancement", "super resolution",
    "synthetic data", "domain adaptation", "Sim2Real", "CycleGAN", "domain generalization",

    # 5. Datasets / benchmarks
    "ImageNet", "COCO", "Pascal VOC", "OpenImages",
    "YouTube-VOS", "Kinetics", "AVA", "Charades",
    "ScanNet", "ShapeNet", "KITTI", "Waymo Open Dataset", "nuScenes",

    # 6. Application areas
    "autonomous driving", "ADAS", "lane detection", "BEV", "bird's-eye view",
    "medical imaging", "CT segmentation", "MRI analysis",
    "robot vision", "grasp detection", "manipulation",
    "action recognition", "gesture recognition", "video understanding",
    "VQA", "video captioning", "image captioning",
    "face detection", "face recognition", "facial landmarks", "deepfake detection"
]

In [3]:
# Venue whitelist: a paper is kept only when one of these strings occurs
# as a substring of its reported venue.
venue_name = [
    "Computer Vision and Pattern Recognition",
    "International Conference on Computer Vision",
    "European Conference on Computer Vision",
]

In [4]:
import requests
import time

url = "https://api.semanticscholar.org/graph/v1/paper/search"

RETRY_WAIT_SECONDS = 5        # pause between attempts for one keyword
MAX_RETRIES = 30              # stop retrying a keyword after this many attempts
REQUEST_TIMEOUT_SECONDS = 30  # do not let a stalled connection hang the cell
MIN_CITATIONS = 5             # keep only papers with strictly more citations than this

# Every field read while building a record below must be requested here;
# "authors" was previously missing, which made paper["authors"] raise KeyError.
SEARCH_FIELDS = "paperId,title,authors,abstract,citationCount,year,venue,fieldsOfStudy"


def _fetch_search_results(keyword):
    """Return the list of paper dicts the search endpoint yields for `keyword`.

    Retries on HTTP 429, on 5xx responses and on transport errors, waiting
    RETRY_WAIT_SECONDS between attempts, for at most MAX_RETRIES attempts.
    Any other non-200 status is treated as permanent. In every failure case a
    message is printed and an empty list is returned, so the caller simply
    moves on to the next keyword instead of looping forever or crashing.
    """
    params = {
        "query": keyword,
        "limit": 100,
        "fields": SEARCH_FIELDS,
    }
    for _ in range(MAX_RETRIES):
        try:
            response = requests.get(url, params=params, timeout=REQUEST_TIMEOUT_SECONDS)
        except requests.RequestException as exc:
            print(f"Request failed ({exc}). Retrying in {RETRY_WAIT_SECONDS} seconds...")
        else:
            status = response.status_code
            if status == 200:
                # Fall back to an empty list if the payload carries no "data" entry.
                return response.json().get("data") or []
            if status == 429:  # Too many requests
                print(f"Rate limit exceeded. Retrying in {RETRY_WAIT_SECONDS} seconds...")
            elif status >= 500:
                print(f"Server error (HTTP {status}). Retrying in {RETRY_WAIT_SECONDS} seconds...")
            else:
                # Other client errors will not go away by retrying.
                print(f"Request for {keyword!r} rejected with HTTP {status}; skipping.")
                return []
        time.sleep(RETRY_WAIT_SECONDS)

    print(f"Giving up on {keyword!r} after {MAX_RETRIES} attempts; skipping.")
    return []


filtered_papers = []  # one record per accepted paper, in discovery order
paper_ids = set()     # ids of accepted papers, used to drop duplicates across keywords

for keyword in cvpr_keywords:
    print("🔍 Searching for:", keyword)

    for paper in _fetch_search_results(keyword):
        paper_id = paper.get("paperId")
        if paper_id is None or paper_id in paper_ids:
            continue
        # Treat a missing/null citation count as zero.
        if (paper.get("citationCount") or 0) <= MIN_CITATIONS:
            continue
        # Treat a missing/null venue as an empty string so the substring test is safe.
        venue = paper.get("venue") or ""
        if not any(v in venue for v in venue_name):
            continue

        paper_ids.add(paper_id)
        filtered_papers.append({
            "title": paper.get("title"),
            "authors": paper.get("authors"),
            "abstract": paper.get("abstract"),
            "citationCount": paper.get("citationCount"),
            "year": paper.get("year"),
            "venue": paper.get("venue"),
            "fieldsOfStudy": paper.get("fieldsOfStudy"),
        })

    print("Total num of paper: ", len(filtered_papers))

print("Total unique papers found:", len(filtered_papers))


🔍 Searching for: image classification
Rate limit exceeded. Retrying in 5 seconds...
Total num of paper:  18
🔍 Searching for: object detection
Total num of paper:  72
🔍 Searching for: bounding box
Rate limit exceeded. Retrying in 5 seconds...
Rate limit exceeded. Retrying in 5 seconds...
Rate limit exceeded. Retrying in 5 seconds...
Rate limit exceeded. Retrying in 5 seconds...
Rate limit exceeded. Retrying in 5 seconds...
Rate limit exceeded. Retrying in 5 seconds...
Total num of paper:  91
🔍 Searching for: YOLO
Total num of paper:  93
🔍 Searching for: Faster R-CNN
Rate limit exceeded. Retrying in 5 seconds...
Rate limit exceeded. Retrying in 5 seconds...
Total num of paper:  99
🔍 Searching for: semantic segmentation
Rate limit exceeded. Retrying in 5 seconds...
Total num of paper:  161
🔍 Searching for: instance segmentation
Total num of paper:  215
🔍 Searching for: panoptic segmentation
Rate limit exceeded. Retrying in 5 seconds...
Rate limit exceeded. Retrying in 5 seconds...
Rate li

In [5]:
# Sanity check: print the main fields of the first collected paper.
if filtered_papers:
    paper = filtered_papers[0]
    print("Title:", paper["title"])
    print("Year:", paper["year"])
    print("Venue:", paper["venue"])
    #print("Authors:", [a["name"] for a in paper["authors"]])
    print("Citation count", paper["citationCount"])
    # The abstract may be None, so substitute an empty string before slicing.
    print("Abstract:", (paper["abstract"] or "")[:300], "...\n")
else:
    # Nothing passed the filters (or the crawl has not been run yet).
    print("No papers were collected; nothing to preview.")

Title: Residual Attention Network for Image Classification
Year: 2017
Venue: Computer Vision and Pattern Recognition
Citation count 3288
Abstract: In this work, we propose Residual Attention Network, a convolutional neural network using attention mechanism which can incorporate with state-of-art feed forward network architecture in an end-to-end training fashion. Our Residual Attention Network is built by stacking Attention Modules which gener ...



In [6]:
import json
# Serialise the collected records as pretty-printed JSON (non-ASCII kept as-is)
# and store them in filtered_papers.json.
papers_json = json.dumps(filtered_papers, ensure_ascii=False, indent=4)
with open("filtered_papers.json", "w", encoding="utf-8") as out_file:
    out_file.write(papers_json)

In [7]:
# Save the accepted paper ids, one per line, to paper_ids.txt.
with open("paper_ids.txt", "w", encoding="utf-8") as ids_file:
    ids_file.writelines(pid + "\n" for pid in paper_ids)