# gemini 확인

Step 1 (재현 로직 디버깅):
gemini-2.5-flash-lite (빠르고 저렴 → 코드 안정화에 집중)

Step 2 (논문 구조 제대로 테스트):
gemini-2.5-flash (성능 + 속도 균형)

Step 3 (최종 보고·비교):
gemini-2.5-pro (최고 성능, 결과 품질 강조할 때)

In [1]:
import os

import google.generativeai as genai
from dotenv import load_dotenv

# Load variables from a local .env file (if any) into the process environment.
load_dotenv()

g_token = os.getenv("GEMINI_API_KEY")
if not g_token:
    # Stop here with an actionable message instead of handing None to the SDK.
    raise RuntimeError(
        "GEMINI_API_KEY is not set; add it to .env or export it before running this cell."
    )

# Configure the SDK with the API key.
genai.configure(api_key=g_token)

# List every model visible to this key together with the generation methods it
# supports, so the model used in each step can be picked from real availability.
models = genai.list_models()
for m in models:
    print(m.name, m.display_name, m.supported_generation_methods)


models/embedding-gecko-001 Embedding Gecko ['embedText', 'countTextTokens']
models/gemini-2.5-pro-preview-03-25 Gemini 2.5 Pro Preview 03-25 ['generateContent', 'countTokens', 'createCachedContent', 'batchGenerateContent']
models/gemini-2.5-flash-preview-05-20 Gemini 2.5 Flash Preview 05-20 ['generateContent', 'countTokens', 'createCachedContent', 'batchGenerateContent']
models/gemini-2.5-flash Gemini 2.5 Flash ['generateContent', 'countTokens', 'createCachedContent', 'batchGenerateContent']
models/gemini-2.5-flash-lite-preview-06-17 Gemini 2.5 Flash-Lite Preview 06-17 ['generateContent', 'countTokens', 'createCachedContent', 'batchGenerateContent']
models/gemini-2.5-pro-preview-05-06 Gemini 2.5 Pro Preview 05-06 ['generateContent', 'countTokens', 'createCachedContent', 'batchGenerateContent']
models/gemini-2.5-pro-preview-06-05 Gemini 2.5 Pro Preview ['generateContent', 'countTokens', 'createCachedContent', 'batchGenerateContent']
models/gemini-2.5-pro Gemini 2.5 Pro ['generateContent

# 허깅페이스 확인

In [2]:
import os
from dotenv import load_dotenv
from huggingface_hub import HfApi

# Load variables from a local .env file (if any), then read the Hub token.
load_dotenv()
HF_TOKEN = os.getenv("HF_TOKEN")

# Hub client created with that token, and the repository to probe.
api = HfApi(token=HF_TOKEN)
model_id = "mistralai/Mistral-7B-Instruct-v0.3"

# Request the repository metadata; any failure is reported instead of raised.
try:
    model_info = api.model_info(model_id)
    status_message = f"모델 접근 성공! 모델 이름: {model_info.modelId}"
except Exception as e:
    status_message = f"모델 접근 실패: {e}"

print(status_message)

모델 접근 성공! 모델 이름: mistralai/Mistral-7B-Instruct-v0.3


# 모델 다운로드

In [5]:
import os

# Root directory for the Hugging Face caches.
os.environ["HF_HOME"] = "/home/dibaeck/hf_cache"

from transformers import AutoModel, AutoTokenizer

model_name = "mistralai/Mistral-7B-Instruct-v0.3"

# huggingface_hub resolves HF_HOME when it is first imported, so the assignment
# above has no effect if an earlier cell in this kernel already imported it.
# Passing cache_dir explicitly makes the download location independent of
# import order; "<HF_HOME>/hub" is the hub cache location under HF_HOME.
hub_cache_dir = os.path.join(os.environ["HF_HOME"], "hub")

# NOTE(review): AutoModel loads the bare transformer without a language-model
# head; switch to AutoModelForCausalLM if this object is meant for generate().
model = AutoModel.from_pretrained(
    model_name,
    device_map="auto",
    cache_dir=hub_cache_dir,
)
tokenizer = AutoTokenizer.from_pretrained(model_name, cache_dir=hub_cache_dir)


config.json:   0%|          | 0.00/601 [00:00<?, ?B/s]

2025-09-30 22:49:30.367236: I tensorflow/core/util/port.cc:153] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2025-09-30 22:49:30.373909: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:485] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
2025-09-30 22:49:30.381013: E external/local_xla/xla/stream_executor/cuda/cuda_dnn.cc:8454] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
2025-09-30 22:49:30.383563: E external/local_xla/xla/stream_executor/cuda/cuda_blas.cc:1452] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
2025-09-30 22:49:30.389941: I tensorflow/core/platform/cpu_feature_guar

model.safetensors.index.json:   0%|          | 0.00/23.9k [00:00<?, ?B/s]

Fetching 3 files:   0%|          | 0/3 [00:00<?, ?it/s]

model-00001-of-00003.safetensors:   0%|          | 0.00/4.95G [00:00<?, ?B/s]

model-00002-of-00003.safetensors:   0%|          | 0.00/5.00G [00:00<?, ?B/s]

model-00003-of-00003.safetensors:   0%|          | 0.00/4.55G [00:00<?, ?B/s]

Loading checkpoint shards:   0%|          | 0/3 [00:00<?, ?it/s]

tokenizer_config.json:   0%|          | 0.00/141k [00:00<?, ?B/s]

tokenizer.model:   0%|          | 0.00/587k [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/1.96M [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/414 [00:00<?, ?B/s]

In [None]:
import torch

# Query availability first; these two calls are safe on CPU-only machines.
cuda_available = torch.cuda.is_available()
gpu_count = torch.cuda.device_count()

print("CUDA 사용 가능:", cuda_available)
print("GPU 개수:", gpu_count)

# get_device_name(0) raises when no CUDA device is usable, so the per-device
# report only runs when device 0 actually exists.
if cuda_available and gpu_count > 0:
    print("현재 GPU 이름:", torch.cuda.get_device_name(0))
    # Both memory figures are reported by PyTorch in bytes for device 0.
    print("GPU 메모리 할당:", torch.cuda.memory_allocated(0))
    print("GPU 메모리 예약:", torch.cuda.memory_reserved(0))


In [None]:
import os

from huggingface_hub import try_to_load_from_cache

model_name = "mistralai/Mistral-7B-Instruct-v0.3"

# First weight shard, named as it appears in the download log for this repo
# ("model-0000x-of-00003.safetensors", not "pytorch_model-...").
weights_file = "model-00001-of-00003.safetensors"

# `transformers.cached_path` is not exported by current transformers releases
# and expected a URL or local path, not "repo/filename". Look the file up in
# the hub cache instead; try_to_load_from_cache never triggers a download.
hf_home = os.environ.get("HF_HOME")
cache_dirs = [os.path.join(hf_home, "hub")] if hf_home else []
cache_dirs.append(None)  # None -> huggingface_hub's default cache location

# Print the on-disk path of the cached shard, or None if it is not cached.
path = None
for cache_dir in cache_dirs:
    hit = try_to_load_from_cache(
        repo_id=model_name,
        filename=weights_file,
        cache_dir=cache_dir,
    )
    # A non-string result means "not cached" (None or a sentinel object).
    if isinstance(hit, str):
        path = hit
        break
print(path)


: 