In [1]:
import pandas as pd
import torch
import torchvision.transforms as transforms
from torchvision.models import vit_b_16, ViT_B_16_Weights
from torch.utils.data import DataLoader 
from torchvision.datasets import ImageFolder 
import numpy as np
from sklearn.metrics import normalized_mutual_info_score
from tqdm import tqdm
from finch import FINCH
from sklearn.cluster import KMeans
from scipy.optimize import linear_sum_assignment

def clustering_accuracy(y_true, y_pred):
    y_true = np.asarray(y_true)
    y_pred = np.asarray(y_pred)

    D = max(y_pred.max(), y_true.max()) + 1
    w = np.zeros((D, D), dtype=np.int64)
    
    for i in range(y_pred.size):
        w[y_pred[i], y_true[i]] += 1

    row_ind, col_ind = linear_sum_assignment(w.max() - w)
    acc = w[row_ind, col_ind].sum() / y_pred.size
    return acc


def train_model(model, train_loader, epochs=10):
    model.to(device)

    for epoch in range(epochs):
        model.train()
        running_loss = 0.0
        
        for images, labels in tqdm(train_loader, desc=f"Training Epoch {epoch+1}/{epochs}"):
            images, labels = images.to(device), labels.to(device)

            optimizer.zero_grad()
            outputs = model(images)
            loss = criterion(outputs, labels)
            loss.backward()
            optimizer.step()

            running_loss += loss.item()
            
        train_loss = running_loss / len(train_loader)
        print(f"\nEpoch {epoch+1} | Train Loss: {train_loss:.4f}")

def extract_features(loader, model):
    features = []
    labels = []
    model.eval()
    with torch.no_grad():
        for images, targets in tqdm(loader, desc="Extracting features"):
            images = images.to(device)
            feat = model(images)
            print("Output shape:", feat.shape)
            features.append(feat.cpu().numpy())
            labels.append(targets.numpy())
    return np.concatenate(features), np.concatenate(labels)

results = []
all_image_info = []

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
print(f"Using device: {device}")

Using device: cuda


In [None]:
for trial in range(5):
    labeled_transform = transforms.Compose([
    transforms.RandAugment(),
    transforms.ToTensor(),
    transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]),])

    labeled_folder = fr"C:\Users\HP\novelty\split_datasets\trial_{trial}\32labeled_20unlabeled\labeled"

    labeled_dataset = ImageFolder(root=labeled_folder, 
    transform=labeled_transform) 
    print(f"Total gambar dalam labeled dataset: {len(labeled_dataset)} {len(labeled_dataset.classes)}")

    batch_size = 16

    labeled_loader = DataLoader(labeled_dataset, batch_size=batch_size, shuffle=True) 
    print(f"Total loader gambar dalam labeled dataset: {len(labeled_loader)}")
    
    model = vit_b_16(weights=ViT_B_16_Weights.IMAGENET1K_V1)

    model.heads = torch.nn.Linear(model.heads.head.in_features, len(labeled_dataset.classes))
    model = model.to(device)

    criterion = torch.nn.CrossEntropyLoss()
    optimizer = torch.optim.Adam(model.parameters(), lr=0.0001)
    print(model.encoder.layers[0].mlp[1])
    
    train_model(model, labeled_loader, epochs=5)

    torch.save(model.state_dict(), "vit_b16_finetuned_32labeled_20unlabeled_trial_" + str(trial) + ".pth")

In [None]:
for trial in range(5):

    unlabeled_transform = transforms.Compose([ 
    transforms.ToTensor(), 
    transforms.Normalize([0.485, 0.456, 0.406], [0.229, 0.224, 0.225]) ])

    unlabeled_folder = fr"C:\Users\HP\novelty\split_datasets\trial_{trial}\32labeled_20unlabeled\unlabeled"

    unlabeled_dataset = ImageFolder(root=unlabeled_folder, transform=unlabeled_transform) 
    print(f"Total gambar dalam unlabeled dataset: {len(unlabeled_dataset)}  {len(unlabeled_dataset.classes)}")

    batch_size = 16

    unlabeled_loader = DataLoader(unlabeled_dataset, batch_size=batch_size, shuffle=False)
    print(f"Total loader gambar dalam unlabeled dataset: {len(unlabeled_loader)}")
    
    model = vit_b_16(weights=None)
    model.heads = torch.nn.Identity()
    model.load_state_dict(torch.load("vit_b_16_finetuned_32labeled_20unlabeled_trial_" + str(trial) + ".pth"),strict=False)
    model = model.to(device)
    model.eval()
    
    unlabeled_features, unlabeled_true_labels = extract_features(unlabeled_loader, model)
    
    c, num_clust, req_c = FINCH(unlabeled_features, use_ann_above_samples=1000, verbose=True)
    finch_clusters = c[:,2]

    finch_nmi = normalized_mutual_info_score(unlabeled_true_labels, finch_clusters)
    finch_acc = clustering_accuracy(unlabeled_true_labels, finch_clusters)

    print(f"\nFINCH Clustering Performance:")
    print(f"Clustering Accuracy (ACC): {finch_acc:.4f}")
    print(f"Normalized Mutual Information (NMI): {finch_nmi:.4f}")
    print(f"Number of clusters found: {len(np.unique(finch_clusters))}")
    
    num_clusters = len(np.unique(unlabeled_true_labels))
    kmeans = KMeans(n_clusters=num_clusters, random_state=42)
    kmeans_clusters = kmeans.fit_predict(unlabeled_features)

    # ----- Evaluasi -----
    kmeans_nmi = normalized_mutual_info_score(unlabeled_true_labels, kmeans_clusters)
    kmeans_acc = clustering_accuracy(unlabeled_true_labels, kmeans_clusters)

    print(f"\nK-Means Clustering Performance: {num_clusters} Clusters")
    print(f"Clustering Accuracy (ACC): {kmeans_acc:.4f}")
    print(f"Normalized Mutual Information (NMI): {kmeans_nmi:.4f}")
    print(f"Number of clusters found: {len(np.unique(kmeans_clusters))}")
    
    # Simpan hasil trial ini
    results.append({
        'trial': trial,
        'FINCH_ACC': finch_acc,
        'FINCH_NMI': finch_nmi,
        'FINCH_Num_Clusters': len(np.unique(finch_clusters)),
        'KMeans_ACC': kmeans_acc,
        'KMeans_NMI': kmeans_nmi,
        'KMeans_Num_Clusters': len(np.unique(kmeans_clusters)),
    })
    
    # Simpan hasil per gambar
    for i in range(len(unlabeled_dataset)):
        path, true_label = unlabeled_dataset.samples[i]
        image_info = {
            'trial': trial,
            'image_path': path,
            'true_label': true_label,
            'finch_cluster': int(finch_clusters[i]),
            'kmeans_cluster': int(kmeans_clusters[i])
        }
        all_image_info.append(image_info)

    # Simpan file CSV per trial
    df_trial_detail = pd.DataFrame(all_image_info[-len(unlabeled_dataset):])  # ambil data dari trial ini saja
    df_trial_detail.to_csv(f'vit_b_16_finetuned_32labeled_20unlabeled_trial_{trial}_image_clustering.csv', index=False)

# Konversi ke DataFrame dan simpan ke CSV
df_results = pd.DataFrame(results)
mean_values = df_results.select_dtypes(include=np.number).mean()

mean_row = pd.DataFrame({
    'trial': ['Average'],
    'FINCH_ACC': [mean_values['FINCH_ACC']],
    'FINCH_NMI': [mean_values['FINCH_NMI']],
    'FINCH_Num_Clusters': [mean_values['FINCH_Num_Clusters']],
    'KMeans_ACC': [mean_values['KMeans_ACC']],
    'KMeans_NMI': [mean_values['KMeans_NMI']],
    'KMeans_Num_Clusters': [mean_values['KMeans_Num_Clusters']]
})

df_results = pd.concat([df_results, mean_row], ignore_index=True)

df_results.to_csv('clustering_results_vit_b_16_finetuned_32labeled_20unlabeled_FINCH_KMEANS.csv', index=False)
print("Results saved to clustering_results_vit_b_16_finetuned_32labeled_20unlabeled_FINCH_KMEANS.csv")

Total gambar dalam unlabel dataset: 2000  20
Total loader gambar dalam unlabel dataset: 125


  model.load_state_dict(torch.load("vit_b_16_finetuned_32labeled_20unlabeled_trial_" + str(trial) + ".pth"),strict=False)
Extracting features:   1%|          | 1/125 [00:00<00:40,  3.09it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   2%|▏         | 3/125 [00:00<00:22,  5.45it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   4%|▍         | 5/125 [00:00<00:21,  5.64it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   6%|▌         | 7/125 [00:01<00:20,  5.72it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   7%|▋         | 9/125 [00:01<00:18,  6.32it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   9%|▉         | 11/125 [00:01<00:17,  6.69it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  10%|█         | 13/125 [00:02<00:16,  6.80it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  12%|█▏        | 15/125 [00:02<00:15,  6.89it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  14%|█▎        | 17/125 [00:02<00:15,  6.99it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  15%|█▌        | 19/125 [00:03<00:15,  6.66it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  17%|█▋        | 21/125 [00:03<00:15,  6.88it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  18%|█▊        | 23/125 [00:03<00:14,  6.99it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  20%|██        | 25/125 [00:03<00:14,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  22%|██▏       | 27/125 [00:04<00:14,  6.96it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  23%|██▎       | 29/125 [00:04<00:13,  6.98it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  25%|██▍       | 31/125 [00:04<00:13,  7.00it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  26%|██▋       | 33/125 [00:05<00:13,  7.03it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  28%|██▊       | 35/125 [00:05<00:12,  7.05it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  30%|██▉       | 37/125 [00:05<00:12,  7.02it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  31%|███       | 39/125 [00:05<00:12,  6.94it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  33%|███▎      | 41/125 [00:06<00:12,  6.97it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  34%|███▍      | 43/125 [00:06<00:11,  7.03it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  36%|███▌      | 45/125 [00:06<00:11,  7.08it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  38%|███▊      | 47/125 [00:07<00:11,  7.03it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  39%|███▉      | 49/125 [00:07<00:11,  6.73it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  41%|████      | 51/125 [00:07<00:10,  6.90it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  42%|████▏     | 53/125 [00:07<00:10,  7.01it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  44%|████▍     | 55/125 [00:08<00:10,  6.96it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  46%|████▌     | 57/125 [00:08<00:09,  6.98it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  47%|████▋     | 59/125 [00:08<00:09,  7.05it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  49%|████▉     | 61/125 [00:09<00:09,  6.55it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  50%|█████     | 63/125 [00:09<00:09,  6.70it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  52%|█████▏    | 65/125 [00:09<00:08,  6.80it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  54%|█████▎    | 67/125 [00:09<00:08,  6.89it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  55%|█████▌    | 69/125 [00:10<00:08,  6.93it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  57%|█████▋    | 71/125 [00:10<00:07,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  58%|█████▊    | 73/125 [00:10<00:07,  6.96it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  60%|██████    | 75/125 [00:11<00:07,  6.99it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  62%|██████▏   | 77/125 [00:11<00:06,  7.02it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  63%|██████▎   | 79/125 [00:11<00:06,  7.01it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  65%|██████▍   | 81/125 [00:11<00:06,  7.04it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  66%|██████▋   | 83/125 [00:12<00:05,  7.06it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  68%|██████▊   | 85/125 [00:12<00:05,  7.01it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  70%|██████▉   | 87/125 [00:12<00:05,  6.97it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  71%|███████   | 89/125 [00:13<00:05,  6.97it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  73%|███████▎  | 91/125 [00:13<00:05,  6.65it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  74%|███████▍  | 93/125 [00:13<00:04,  6.81it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  76%|███████▌  | 95/125 [00:13<00:04,  6.96it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  78%|███████▊  | 97/125 [00:14<00:04,  6.79it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  79%|███████▉  | 99/125 [00:14<00:03,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  81%|████████  | 101/125 [00:14<00:03,  6.99it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  82%|████████▏ | 103/125 [00:15<00:03,  6.95it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  84%|████████▍ | 105/125 [00:15<00:02,  7.07it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  86%|████████▌ | 107/125 [00:15<00:02,  7.02it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  87%|████████▋ | 109/125 [00:15<00:02,  7.03it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  89%|████████▉ | 111/125 [00:16<00:02,  6.93it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  90%|█████████ | 113/125 [00:16<00:01,  6.79it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  92%|█████████▏| 115/125 [00:16<00:01,  6.85it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  94%|█████████▎| 117/125 [00:17<00:01,  6.71it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  95%|█████████▌| 119/125 [00:17<00:00,  6.56it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  97%|█████████▋| 121/125 [00:17<00:00,  6.62it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  98%|█████████▊| 123/125 [00:18<00:00,  6.53it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features: 100%|██████████| 125/125 [00:18<00:00,  6.82it/s]


Output shape: torch.Size([16, 768])
Using PyNNDescent to compute 1st-neighbours at this step ...
Step PyNNDescent done ...
Partition 0: 452 clusters
Partition 1: 94 clusters
Partition 2: 22 clusters
Partition 3: 6 clusters
Partition 4: 2 clusters

FINCH Clustering Performance:
Clustering Accuracy (ACC): 0.7375
Normalized Mutual Information (NMI): 0.8360
Number of clusters found: 22

K-Means Clustering Performance: 20 Clusters
Clustering Accuracy (ACC): 0.6670
Normalized Mutual Information (NMI): 0.7542
Number of clusters found: 20
Total gambar dalam unlabel dataset: 2000  20
Total loader gambar dalam unlabel dataset: 125


  model.load_state_dict(torch.load("vit_b_16_finetuned_32labeled_20unlabeled_trial_" + str(trial) + ".pth"),strict=False)
Extracting features:   0%|          | 0/125 [00:00<?, ?it/s]

Output shape: torch.Size([16, 768])


Extracting features:   2%|▏         | 2/125 [00:00<00:23,  5.32it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   3%|▎         | 4/125 [00:00<00:20,  6.00it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   5%|▍         | 6/125 [00:01<00:18,  6.30it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   6%|▋         | 8/125 [00:01<00:17,  6.55it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   8%|▊         | 10/125 [00:01<00:17,  6.59it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  10%|▉         | 12/125 [00:01<00:16,  6.71it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  11%|█         | 14/125 [00:02<00:16,  6.83it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  13%|█▎        | 16/125 [00:02<00:15,  6.83it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  14%|█▍        | 18/125 [00:02<00:15,  6.79it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  16%|█▌        | 20/125 [00:03<00:15,  6.86it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  18%|█▊        | 22/125 [00:03<00:15,  6.81it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  19%|█▉        | 24/125 [00:03<00:14,  6.74it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  21%|██        | 26/125 [00:03<00:14,  6.82it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  22%|██▏       | 28/125 [00:04<00:14,  6.70it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  24%|██▍       | 30/125 [00:04<00:13,  6.79it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  26%|██▌       | 32/125 [00:04<00:13,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  27%|██▋       | 34/125 [00:05<00:13,  6.90it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  29%|██▉       | 36/125 [00:05<00:12,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  30%|███       | 38/125 [00:05<00:12,  6.87it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  32%|███▏      | 40/125 [00:05<00:12,  6.93it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  34%|███▎      | 42/125 [00:06<00:12,  6.88it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  35%|███▌      | 44/125 [00:06<00:11,  6.90it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  37%|███▋      | 46/125 [00:06<00:11,  6.93it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  38%|███▊      | 48/125 [00:07<00:11,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  40%|████      | 50/125 [00:07<00:10,  6.96it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  42%|████▏     | 52/125 [00:07<00:10,  7.03it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  43%|████▎     | 54/125 [00:07<00:10,  7.07it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  45%|████▍     | 56/125 [00:08<00:09,  7.11it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  46%|████▋     | 58/125 [00:08<00:09,  7.12it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  48%|████▊     | 60/125 [00:08<00:09,  7.09it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  50%|████▉     | 62/125 [00:09<00:08,  7.04it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  51%|█████     | 64/125 [00:09<00:08,  7.01it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  53%|█████▎    | 66/125 [00:09<00:08,  7.01it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  54%|█████▍    | 68/125 [00:09<00:08,  6.76it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  56%|█████▌    | 70/125 [00:10<00:07,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  58%|█████▊    | 72/125 [00:10<00:07,  7.03it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  59%|█████▉    | 74/125 [00:10<00:07,  6.90it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  61%|██████    | 76/125 [00:11<00:06,  7.04it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  62%|██████▏   | 78/125 [00:11<00:07,  6.57it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  64%|██████▍   | 80/125 [00:11<00:06,  6.80it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  66%|██████▌   | 82/125 [00:12<00:06,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  67%|██████▋   | 84/125 [00:12<00:05,  6.97it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  69%|██████▉   | 86/125 [00:12<00:05,  6.93it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  70%|███████   | 88/125 [00:12<00:05,  6.96it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  72%|███████▏  | 90/125 [00:13<00:05,  6.98it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  74%|███████▎  | 92/125 [00:13<00:04,  7.06it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  75%|███████▌  | 94/125 [00:13<00:04,  7.10it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  77%|███████▋  | 96/125 [00:13<00:04,  7.13it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  78%|███████▊  | 98/125 [00:14<00:03,  7.13it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  80%|████████  | 100/125 [00:14<00:03,  7.14it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  82%|████████▏ | 102/125 [00:14<00:03,  7.14it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  83%|████████▎ | 104/125 [00:15<00:02,  7.12it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  85%|████████▍ | 106/125 [00:15<00:02,  7.14it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  86%|████████▋ | 108/125 [00:15<00:02,  7.08it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  88%|████████▊ | 110/125 [00:15<00:02,  6.99it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  90%|████████▉ | 112/125 [00:16<00:01,  7.03it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  91%|█████████ | 114/125 [00:16<00:01,  7.07it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  93%|█████████▎| 116/125 [00:16<00:01,  7.06it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  94%|█████████▍| 118/125 [00:17<00:01,  6.94it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  96%|█████████▌| 120/125 [00:17<00:00,  7.01it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  98%|█████████▊| 122/125 [00:17<00:00,  7.07it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  99%|█████████▉| 124/125 [00:17<00:00,  7.05it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features: 100%|██████████| 125/125 [00:18<00:00,  6.91it/s]


Using PyNNDescent to compute 1st-neighbours at this step ...
Step PyNNDescent done ...
Partition 0: 465 clusters
Partition 1: 106 clusters
Partition 2: 29 clusters
Partition 3: 11 clusters
Partition 4: 3 clusters

FINCH Clustering Performance:
Clustering Accuracy (ACC): 0.6765
Normalized Mutual Information (NMI): 0.8078
Number of clusters found: 29

K-Means Clustering Performance: 20 Clusters
Clustering Accuracy (ACC): 0.7210
Normalized Mutual Information (NMI): 0.7879
Number of clusters found: 20
Total gambar dalam unlabel dataset: 2000  20
Total loader gambar dalam unlabel dataset: 125


  model.load_state_dict(torch.load("vit_b_16_finetuned_32labeled_20unlabeled_trial_" + str(trial) + ".pth"),strict=False)
Extracting features:   1%|          | 1/125 [00:00<00:17,  6.91it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   2%|▏         | 3/125 [00:00<00:17,  7.04it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   4%|▍         | 5/125 [00:00<00:17,  6.95it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   6%|▌         | 7/125 [00:01<00:18,  6.51it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   7%|▋         | 9/125 [00:01<00:17,  6.76it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   9%|▉         | 11/125 [00:01<00:17,  6.69it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  10%|█         | 13/125 [00:01<00:16,  6.84it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  12%|█▏        | 15/125 [00:02<00:15,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  14%|█▎        | 17/125 [00:02<00:15,  6.91it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  15%|█▌        | 19/125 [00:02<00:15,  6.91it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  17%|█▋        | 21/125 [00:03<00:14,  6.98it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  18%|█▊        | 23/125 [00:03<00:14,  7.00it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  20%|██        | 25/125 [00:03<00:14,  6.68it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  22%|██▏       | 27/125 [00:03<00:15,  6.50it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  23%|██▎       | 29/125 [00:04<00:14,  6.69it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  25%|██▍       | 31/125 [00:04<00:13,  6.74it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  26%|██▋       | 33/125 [00:04<00:13,  6.81it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  28%|██▊       | 35/125 [00:05<00:13,  6.83it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  30%|██▉       | 37/125 [00:05<00:12,  6.87it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  31%|███       | 39/125 [00:05<00:12,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  33%|███▎      | 41/125 [00:06<00:12,  6.86it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  34%|███▍      | 43/125 [00:06<00:11,  6.84it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  36%|███▌      | 45/125 [00:06<00:11,  6.74it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  38%|███▊      | 47/125 [00:06<00:11,  6.83it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  39%|███▉      | 49/125 [00:07<00:11,  6.81it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  41%|████      | 51/125 [00:07<00:10,  6.87it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  42%|████▏     | 53/125 [00:07<00:10,  6.70it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  44%|████▍     | 55/125 [00:08<00:10,  6.82it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  46%|████▌     | 57/125 [00:08<00:09,  6.81it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  47%|████▋     | 59/125 [00:08<00:09,  6.82it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  49%|████▉     | 61/125 [00:08<00:09,  6.87it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  50%|█████     | 63/125 [00:09<00:09,  6.83it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  52%|█████▏    | 65/125 [00:09<00:08,  6.85it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  54%|█████▎    | 67/125 [00:09<00:08,  6.86it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  55%|█████▌    | 69/125 [00:10<00:08,  6.85it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  57%|█████▋    | 71/125 [00:10<00:07,  6.91it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  58%|█████▊    | 73/125 [00:10<00:07,  6.84it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  60%|██████    | 75/125 [00:10<00:07,  6.56it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  62%|██████▏   | 77/125 [00:11<00:07,  6.72it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  63%|██████▎   | 79/125 [00:11<00:06,  6.81it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  65%|██████▍   | 81/125 [00:11<00:06,  6.85it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  66%|██████▋   | 83/125 [00:12<00:06,  6.86it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  68%|██████▊   | 85/125 [00:12<00:05,  6.84it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  70%|██████▉   | 87/125 [00:12<00:05,  6.93it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  71%|███████   | 89/125 [00:13<00:05,  6.88it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  73%|███████▎  | 91/125 [00:13<00:04,  6.90it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  74%|███████▍  | 93/125 [00:13<00:04,  6.91it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  76%|███████▌  | 95/125 [00:13<00:04,  6.94it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  78%|███████▊  | 97/125 [00:14<00:04,  6.88it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  79%|███████▉  | 99/125 [00:14<00:03,  6.63it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  81%|████████  | 101/125 [00:14<00:03,  6.77it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  82%|████████▏ | 103/125 [00:15<00:03,  6.79it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  84%|████████▍ | 105/125 [00:15<00:02,  6.88it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  86%|████████▌ | 107/125 [00:15<00:02,  6.86it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  87%|████████▋ | 109/125 [00:15<00:02,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  89%|████████▉ | 111/125 [00:16<00:02,  6.91it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  90%|█████████ | 113/125 [00:16<00:01,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  92%|█████████▏| 115/125 [00:16<00:01,  6.94it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  94%|█████████▎| 117/125 [00:17<00:01,  6.94it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  95%|█████████▌| 119/125 [00:17<00:00,  6.91it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  97%|█████████▋| 121/125 [00:17<00:00,  6.89it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  98%|█████████▊| 123/125 [00:17<00:00,  6.40it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features: 100%|██████████| 125/125 [00:18<00:00,  6.84it/s]


Output shape: torch.Size([16, 768])
Using PyNNDescent to compute 1st-neighbours at this step ...
Step PyNNDescent done ...
Partition 0: 440 clusters
Partition 1: 97 clusters
Partition 2: 26 clusters
Partition 3: 8 clusters

FINCH Clustering Performance:
Clustering Accuracy (ACC): 0.7920
Normalized Mutual Information (NMI): 0.8664
Number of clusters found: 26

K-Means Clustering Performance: 20 Clusters
Clustering Accuracy (ACC): 0.7020
Normalized Mutual Information (NMI): 0.8074
Number of clusters found: 20
Total gambar dalam unlabel dataset: 2000  20
Total loader gambar dalam unlabel dataset: 125


  model.load_state_dict(torch.load("vit_b_16_finetuned_32labeled_20unlabeled_trial_" + str(trial) + ".pth"),strict=False)
Extracting features:   1%|          | 1/125 [00:00<00:17,  6.91it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   2%|▏         | 3/125 [00:00<00:18,  6.75it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   4%|▍         | 5/125 [00:00<00:17,  6.84it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   6%|▌         | 7/125 [00:01<00:17,  6.65it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   7%|▋         | 9/125 [00:01<00:17,  6.77it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   9%|▉         | 11/125 [00:01<00:16,  6.85it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  10%|█         | 13/125 [00:01<00:16,  6.81it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  12%|█▏        | 15/125 [00:02<00:16,  6.80it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  14%|█▎        | 17/125 [00:02<00:15,  6.87it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  15%|█▌        | 19/125 [00:02<00:15,  6.74it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  17%|█▋        | 21/125 [00:03<00:15,  6.76it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  18%|█▊        | 23/125 [00:03<00:15,  6.79it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  20%|██        | 25/125 [00:03<00:14,  6.82it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  22%|██▏       | 27/125 [00:03<00:14,  6.77it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  23%|██▎       | 29/125 [00:04<00:14,  6.80it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  25%|██▍       | 31/125 [00:04<00:13,  6.82it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  26%|██▋       | 33/125 [00:04<00:13,  6.85it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  28%|██▊       | 35/125 [00:05<00:13,  6.82it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  30%|██▉       | 37/125 [00:05<00:12,  6.82it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  31%|███       | 39/125 [00:05<00:12,  6.86it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  33%|███▎      | 41/125 [00:06<00:12,  6.66it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  34%|███▍      | 43/125 [00:06<00:12,  6.74it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  36%|███▌      | 45/125 [00:06<00:11,  6.76it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  38%|███▊      | 47/125 [00:06<00:11,  6.80it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  39%|███▉      | 49/125 [00:07<00:11,  6.83it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  41%|████      | 51/125 [00:07<00:10,  6.78it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  42%|████▏     | 53/125 [00:07<00:10,  6.66it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  44%|████▍     | 55/125 [00:08<00:10,  6.69it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  46%|████▌     | 57/125 [00:08<00:09,  6.82it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  47%|████▋     | 59/125 [00:08<00:09,  6.71it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  49%|████▉     | 61/125 [00:08<00:09,  6.77it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  50%|█████     | 63/125 [00:09<00:09,  6.75it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  52%|█████▏    | 65/125 [00:09<00:08,  6.67it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  54%|█████▎    | 67/125 [00:09<00:08,  6.75it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  55%|█████▌    | 69/125 [00:10<00:08,  6.79it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  57%|█████▋    | 71/125 [00:10<00:07,  6.81it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  58%|█████▊    | 73/125 [00:10<00:07,  6.82it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  60%|██████    | 75/125 [00:11<00:07,  6.57it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  62%|██████▏   | 77/125 [00:11<00:07,  6.47it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  63%|██████▎   | 79/125 [00:11<00:06,  6.62it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  65%|██████▍   | 81/125 [00:11<00:06,  6.74it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  66%|██████▋   | 83/125 [00:12<00:06,  6.83it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  68%|██████▊   | 85/125 [00:12<00:05,  6.73it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  70%|██████▉   | 87/125 [00:12<00:05,  6.84it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  71%|███████   | 89/125 [00:13<00:05,  6.84it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  73%|███████▎  | 91/125 [00:13<00:04,  6.88it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  74%|███████▍  | 93/125 [00:13<00:04,  6.86it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  76%|███████▌  | 95/125 [00:13<00:04,  6.90it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  78%|███████▊  | 97/125 [00:14<00:04,  6.88it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  79%|███████▉  | 99/125 [00:14<00:03,  6.86it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  81%|████████  | 101/125 [00:14<00:03,  6.86it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  82%|████████▏ | 103/125 [00:15<00:03,  6.80it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  84%|████████▍ | 105/125 [00:15<00:02,  6.77it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  86%|████████▌ | 107/125 [00:15<00:02,  6.81it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  87%|████████▋ | 109/125 [00:16<00:02,  6.75it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  89%|████████▉ | 111/125 [00:16<00:02,  6.81it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  90%|█████████ | 113/125 [00:16<00:01,  6.87it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  92%|█████████▏| 115/125 [00:16<00:01,  6.63it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  94%|█████████▎| 117/125 [00:17<00:01,  6.71it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  95%|█████████▌| 119/125 [00:17<00:00,  6.69it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  97%|█████████▋| 121/125 [00:17<00:00,  6.63it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  98%|█████████▊| 123/125 [00:18<00:00,  6.70it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features: 100%|██████████| 125/125 [00:18<00:00,  6.78it/s]


Output shape: torch.Size([16, 768])
Using PyNNDescent to compute 1st-neighbours at this step ...
Step PyNNDescent done ...
Partition 0: 437 clusters
Partition 1: 89 clusters
Partition 2: 23 clusters
Partition 3: 5 clusters

FINCH Clustering Performance:
Clustering Accuracy (ACC): 0.8205
Normalized Mutual Information (NMI): 0.8549
Number of clusters found: 23

K-Means Clustering Performance: 20 Clusters
Clustering Accuracy (ACC): 0.7385
Normalized Mutual Information (NMI): 0.8045
Number of clusters found: 20
Total gambar dalam unlabel dataset: 2000  20
Total loader gambar dalam unlabel dataset: 125


  model.load_state_dict(torch.load("vit_b_16_finetuned_32labeled_20unlabeled_trial_" + str(trial) + ".pth"),strict=False)
Extracting features:   1%|          | 1/125 [00:00<00:18,  6.66it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   2%|▏         | 3/125 [00:00<00:17,  6.78it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   4%|▍         | 5/125 [00:00<00:17,  6.72it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   6%|▌         | 7/125 [00:01<00:18,  6.33it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   7%|▋         | 9/125 [00:01<00:17,  6.48it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:   9%|▉         | 11/125 [00:01<00:17,  6.37it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  10%|█         | 13/125 [00:01<00:16,  6.65it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  12%|█▏        | 15/125 [00:02<00:16,  6.77it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  14%|█▎        | 17/125 [00:02<00:15,  6.80it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  15%|█▌        | 19/125 [00:02<00:15,  6.82it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  17%|█▋        | 21/125 [00:03<00:15,  6.76it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  18%|█▊        | 23/125 [00:03<00:15,  6.66it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  20%|██        | 25/125 [00:03<00:15,  6.27it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  22%|██▏       | 27/125 [00:04<00:15,  6.49it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  23%|██▎       | 29/125 [00:04<00:14,  6.70it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  25%|██▍       | 31/125 [00:04<00:13,  6.74it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  26%|██▋       | 33/125 [00:04<00:13,  6.72it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  28%|██▊       | 35/125 [00:05<00:13,  6.76it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  30%|██▉       | 37/125 [00:05<00:12,  6.91it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  31%|███       | 39/125 [00:05<00:12,  6.80it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  33%|███▎      | 41/125 [00:06<00:12,  6.68it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  34%|███▍      | 43/125 [00:06<00:12,  6.73it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  36%|███▌      | 45/125 [00:06<00:11,  6.83it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  38%|███▊      | 47/125 [00:07<00:12,  6.46it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  39%|███▉      | 49/125 [00:07<00:11,  6.56it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  41%|████      | 51/125 [00:07<00:11,  6.70it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  42%|████▏     | 53/125 [00:07<00:10,  6.77it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  44%|████▍     | 55/125 [00:08<00:10,  6.88it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  46%|████▌     | 57/125 [00:08<00:09,  6.86it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  47%|████▋     | 59/125 [00:08<00:09,  6.82it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  49%|████▉     | 61/125 [00:09<00:09,  6.84it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  50%|█████     | 63/125 [00:09<00:09,  6.86it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  52%|█████▏    | 65/125 [00:09<00:08,  6.78it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  54%|█████▎    | 67/125 [00:09<00:08,  6.85it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  55%|█████▌    | 69/125 [00:10<00:08,  6.83it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  57%|█████▋    | 71/125 [00:10<00:07,  6.86it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  58%|█████▊    | 73/125 [00:10<00:07,  6.87it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  60%|██████    | 75/125 [00:11<00:07,  6.97it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  62%|██████▏   | 77/125 [00:11<00:06,  6.90it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  63%|██████▎   | 79/125 [00:11<00:06,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  65%|██████▍   | 81/125 [00:12<00:06,  6.74it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  66%|██████▋   | 83/125 [00:12<00:06,  6.89it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  68%|██████▊   | 85/125 [00:12<00:05,  6.89it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  70%|██████▉   | 87/125 [00:12<00:05,  6.91it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  71%|███████   | 89/125 [00:13<00:05,  6.94it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  73%|███████▎  | 91/125 [00:13<00:04,  6.97it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  74%|███████▍  | 93/125 [00:13<00:04,  6.88it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  76%|███████▌  | 95/125 [00:14<00:04,  6.89it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  78%|███████▊  | 97/125 [00:14<00:04,  6.84it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  79%|███████▉  | 99/125 [00:14<00:03,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  81%|████████  | 101/125 [00:14<00:03,  6.93it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  82%|████████▏ | 103/125 [00:15<00:03,  6.87it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  84%|████████▍ | 105/125 [00:15<00:02,  6.88it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  86%|████████▌ | 107/125 [00:15<00:02,  6.91it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  87%|████████▋ | 109/125 [00:16<00:02,  6.84it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  89%|████████▉ | 111/125 [00:16<00:02,  6.92it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  90%|█████████ | 113/125 [00:16<00:01,  6.62it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  92%|█████████▏| 115/125 [00:16<00:01,  6.74it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  94%|█████████▎| 117/125 [00:17<00:01,  6.54it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  95%|█████████▌| 119/125 [00:17<00:00,  6.66it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  97%|█████████▋| 121/125 [00:17<00:00,  6.84it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features:  98%|█████████▊| 123/125 [00:18<00:00,  6.84it/s]

Output shape: torch.Size([16, 768])
Output shape: torch.Size([16, 768])


Extracting features: 100%|██████████| 125/125 [00:18<00:00,  6.77it/s]


Output shape: torch.Size([16, 768])
Using PyNNDescent to compute 1st-neighbours at this step ...
Step PyNNDescent done ...
Partition 0: 434 clusters
Partition 1: 93 clusters
Partition 2: 23 clusters
Partition 3: 6 clusters
Partition 4: 2 clusters

FINCH Clustering Performance:
Clustering Accuracy (ACC): 0.6755
Normalized Mutual Information (NMI): 0.7816
Number of clusters found: 23

K-Means Clustering Performance: 20 Clusters
Clustering Accuracy (ACC): 0.6685
Normalized Mutual Information (NMI): 0.7494
Number of clusters found: 20
Results saved to clustering_results_vit_b_16_pretrained_32labeled_20unlabeled_FINCH_KMEANS.csv
