In [1]:
!pip install fastdup



In [2]:
from google.colab import drive
drive.mount('/content/drive')

Mounted at /content/drive


In [3]:
import os
import shutil
import fastdup

# Đường dẫn đến dữ liệu gốc trên Google Drive
input_dir = '/content/drive/MyDrive/sports_data'

# Đường dẫn để lưu dữ liệu đã tiền xử lý
output_dir = '/content/drive/MyDrive/processed_sports_data'

# Đảm bảo thư mục đích đã được tạo
os.makedirs(output_dir, exist_ok=True)

In [4]:
# danh sách các nhãn
categories = ['badminton', 'cricket', 'karate', 'football', 'swimming', 'tennis', 'wrestling']

In [5]:
# kiểm tra số lượng ảnh ban đầu trước khi tiền xử lý
for category in categories:
    category_dir = os.path.join(input_dir, category)
    print(f"Nhãn {category}: {len(os.listdir(category_dir))} ảnh")

Nhãn badminton: 1394 ảnh
Nhãn cricket: 1556 ảnh
Nhãn karate: 613 ảnh
Nhãn football: 1188 ảnh
Nhãn swimming: 652 ảnh
Nhãn tennis: 1445 ảnh
Nhãn wrestling: 1471 ảnh


In [6]:
# lọc các ảnh trùng lặp
def process_duplicate_category(category_name, input_dir, output_dir):
    """
    Tiền xử lý dữ liệu cho từng nhãn:
    - Loại bỏ ảnh trùng lặp và bất thường bằng fastdup.
    - Chia dữ liệu thành train và test.
    """

    print(f"Đang xử lý nhãn: {category_name}")

    # đường dẫn đến thư mục của nhãn
    category_dir = os.path.join(input_dir, category_name)

    # phân tích trùng lặp bằng fastdup
    fd = fastdup.create(input_dir=category_dir, work_dir=f"AI_{category_name}")
    ## (high_accuracy=True): Kích hoạt chế độ phân tích với độ chính xác cao hơn.
    ## (overwrite=True): Cho phép ghi đè kết quả của các lần chạy trước.
    ## (nearest_neighbors_k=5): Đây là số nearest neighbors được sử dụng trong thuật toán phát hiện tương tự (similarity detection).
    fd.run(high_accuracy=True, overwrite=True, nearest_neighbors_k=5)

    # Lấy danh sách ảnh trùng lặp
    duplicate_imgs = set(fd.similarity().sort_values("distance")['filename_from'])

    # Lấy dánh sách tất cả các ảnh trong thư mục
    all_images = set(os.listdir(category_dir))

    # Lấy danh sách ảnh không trùng lặp
    unique_images = all_images - duplicate_imgs

    # Định dạng lại đường dẫn cho unique_images
    unique_images = [os.path.join(category_dir, img) for img in unique_images
                     if img.lower().endswith(('.jpeg', '.jpg', '.png'))]

    # Tạo thư mục đích cho nhãn
    output_category_dir = os.path.join(output_dir, category_name)
    os.makedirs(output_category_dir, exist_ok=True)

    # Di chuyển các ảnh không trùng lặp vào thư mục đích
    for img_path in unique_images:
        shutil.copy(img_path, output_category_dir)

    print(f"Hoàn thành xử lý trùng lặp nhãn: {category_name}")

In [7]:
# xử lý từng nhãn
for category in categories:
    process_duplicate_category(category, input_dir, output_dir)

print("Hoàn tất tiền xử lý dữ liệu trùng lặp!")

fastdup By Visual Layer, Inc. 2024. All rights reserved.


Đang xử lý nhãn: badminton

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/badminton"[0m
Work directory is set to [0;35m"AI_badminton"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:44<00:00, 14.88s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



fastdup By Visual Layer, Inc. 2024. All rights reserved.


Hoàn thành xử lý trùng lặp nhãn: badminton
Đang xử lý nhãn: cricket

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/cricket"[0m
Work directory is set to [0;35m"AI_cricket"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:51<00:00, 17.30s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



fastdup By Visual Layer, Inc. 2024. All rights reserved.


Hoàn thành xử lý trùng lặp nhãn: cricket
Đang xử lý nhãn: karate

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/karate"[0m
Work directory is set to [0;35m"AI_karate"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:23<00:00,  7.79s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



fastdup By Visual Layer, Inc. 2024. All rights reserved.


Hoàn thành xử lý trùng lặp nhãn: karate
Đang xử lý nhãn: football

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/football"[0m
Work directory is set to [0;35m"AI_football"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:43<00:00, 14.46s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



fastdup By Visual Layer, Inc. 2024. All rights reserved.


Hoàn thành xử lý trùng lặp nhãn: football
Đang xử lý nhãn: swimming

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/swimming"[0m
Work directory is set to [0;35m"AI_swimming"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:24<00:00,  8.04s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



fastdup By Visual Layer, Inc. 2024. All rights reserved.


Hoàn thành xử lý trùng lặp nhãn: swimming
Đang xử lý nhãn: tennis

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/tennis"[0m
Work directory is set to [0;35m"AI_tennis"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:48<00:00, 16.22s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



fastdup By Visual Layer, Inc. 2024. All rights reserved.


Hoàn thành xử lý trùng lặp nhãn: tennis
Đang xử lý nhãn: wrestling

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/wrestling"[0m
Work directory is set to [0;35m"AI_wrestling"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:47<00:00, 15.98s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.

Hoàn thành xử lý trùng lặp nhãn: wrestling
Hoàn tất tiền xử lý dữ liệu trùng lặp!


In [8]:
# kiểm tra số lượng ảnh còn lại trong mỗi nhãn sau khi lọc ảnh trùng lặp
for category in categories:
    category_dir = os.path.join(output_dir, category)
    print(f"Nhãn {category}: {len(os.listdir(category_dir))} ảnh")

Nhãn badminton: 1394 ảnh
Nhãn cricket: 1556 ảnh
Nhãn karate: 613 ảnh
Nhãn football: 1188 ảnh
Nhãn swimming: 652 ảnh
Nhãn tennis: 1445 ảnh
Nhãn wrestling: 1471 ảnh


In [10]:
# lọc các ảnh bất thường (outliers)

def process_outliers_category(category_name, input_dir, output_dir):
    """
    Xử lý từng nhãn:
    - Phát hiện và loại bỏ ảnh bất thường.
    """
    print(f"Đang xử lý nhãn: {category_name}")

    # Đường dẫn đến thư mục nhãn
    category_dir = os.path.join(input_dir, category_name)

    # Phân tích dữ liệu bằng fastdup
    fd = fastdup.create(input_dir=category_dir, work_dir=f"AI_{category_name}")
    fd.run(high_accuracy=True, overwrite=True)

    # Lấy danh sách ảnh bất thường
    outliers = fd.outliers()['filename_outlier']
    print(f"Tìm thấy {len(outliers)} ảnh bất thường trong nhãn {category_name}")

    # Xóa các ảnh bất thường
    for file in outliers:
        if os.path.exists(file):
            os.remove(file)
            print(f"Đã xóa: {file}")

    # Di chuyển ảnh còn lại vào thư mục đích
    output_category_dir = os.path.join(output_dir, category_name)
    os.makedirs(output_category_dir, exist_ok=True)
    for img in os.listdir(category_dir):
        img_path = os.path.join(category_dir, img)
        if img.lower().endswith(('.jpeg', '.jpg', '.png')):
            shutil.move(img_path, os.path.join(output_category_dir, img))

    print(f"Hoàn thành xử lý bất thường nhãn: {category_name}")
    return fd  # Trả về đối tượng fastdup

# Danh sách đối tượng fastdup của từng nhãn
fds = {}

In [11]:
# Xử lý từng nhãn
for category in categories:
    fds[category] = process_outliers_category(category, input_dir, output_dir)

print("Hoàn tất tiền xử lý dữ liệu bất thường!")

fastdup By Visual Layer, Inc. 2024. All rights reserved.


Đang xử lý nhãn: badminton

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/badminton"[0m
Work directory is set to [0;35m"AI_badminton"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:45<00:00, 15.31s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.

Tìm thấy 96 ảnh bất thường trong nhãn badminton
Đã xóa: drive/MyDrive/sports_data/badminton/ee6508bc72.jpg
Đã xóa: drive/MyDrive/sports_data/badminton/87096582c1.jpg
Đã xóa: drive/MyDrive/sports_data/badminton/ead523f2a6.jpg
Đã xóa: drive/MyDrive/sports_data/badminton/08b6ea2143.jpg
Đã xóa: drive/MyDrive/sports_data/badminton/f2ae0ccc3c.jpg
Đã xóa: drive/MyDrive/sports_data/badminton/40250a515d.jpg
Đã xóa: drive/MyDrive/sports_data/badminton/0559a5aa07.jpg
Đã xóa: drive/MyDrive/sports_data/badminton/fa09ba543c.jpg
Đã xóa: drive/MyDrive/sports_data/badminton/d6ad22dbec.jpg
Đã xóa: drive/MyDrive/sports_data/badminton/31343b0ac2.jpg
Đã xóa: drive/MyDrive/sports_data/badminton/fd

fastdup By Visual Layer, Inc. 2024. All rights reserved.


Hoàn thành xử lý bất thường nhãn: badminton
Đang xử lý nhãn: cricket

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/cricket"[0m
Work directory is set to [0;35m"AI_cricket"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:53<00:00, 17.98s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.

Tìm thấy 111 ảnh bất thường trong nhãn cricket
Đã xóa: drive/MyDrive/sports_data/cricket/1506e455dc.jpg
Đã xóa: drive/MyDrive/sports_data/cricket/c17.jpg
Đã xóa: drive/MyDrive/sports_data/cricket/b4614bbd0b.jpg
Đã xóa: drive/MyDrive/sports_data/cricket/3455c44896.jpg
Đã xóa: drive/MyDrive/sports_data/cricket/6f5a719e8d.jpg
Đã xóa: drive/MyDrive/sports_data/cricket/eed2f075c6.jpg
Đã xóa: drive/MyDrive/sports_data/cricket/7b5ce59aa5.jpg
Đã xóa: drive/MyDrive/sports_data/cricket/bb8e9d8db9.jpg
Đã xóa: drive/MyDrive/sports_data/cricket/224a5c5b5b.jpg
Đã xóa: drive/MyDrive/sports_data/cricket/1a77e4a2c5.jpg
Đã xóa: drive/MyDrive/sports_data/cricket/f8df6eaf77.jpg
Đã xóa: drive/MyD

fastdup By Visual Layer, Inc. 2024. All rights reserved.


Hoàn thành xử lý bất thường nhãn: cricket
Đang xử lý nhãn: karate

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/karate"[0m
Work directory is set to [0;35m"AI_karate"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:22<00:00,  7.66s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.

Tìm thấy 43 ảnh bất thường trong nhãn karate
Đã xóa: drive/MyDrive/sports_data/karate/c1004.jpg
Đã xóa: drive/MyDrive/sports_data/karate/3b8f71de6d.jpg
Đã xóa: drive/MyDrive/sports_data/karate/8fb3bbd60c.jpg
Đã xóa: drive/MyDrive/sports_data/karate/9311bd03f3.jpg
Đã xóa: drive/MyDrive/sports_data/karate/898ea7fd7d.jpg
Đã xóa: drive/MyDrive/sports_data/karate/c1009.jpg
Đã xóa: drive/MyDrive/sports_data/karate/735aa4138a.jpg
Đã xóa: drive/MyDrive/sports_data/karate/c1003.jpg
Đã xóa: drive/MyDrive/sports_data/karate/85baea6ca9.jpg
Đã xóa: drive/MyDrive/sports_data/karate/ddb83cbd3c.jpg
Đã xóa: drive/MyDrive/sports_data/karate/3b2b742b58.jpg
Đã xóa: drive/MyDrive/sports_data/kara

fastdup By Visual Layer, Inc. 2024. All rights reserved.


Hoàn thành xử lý bất thường nhãn: karate
Đang xử lý nhãn: football

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/football"[0m
Work directory is set to [0;35m"AI_football"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:42<00:00, 14.23s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.

Tìm thấy 85 ảnh bất thường trong nhãn football
Đã xóa: drive/MyDrive/sports_data/football/18ffcd551e.jpg
Đã xóa: drive/MyDrive/sports_data/football/9d3de05692.jpg
Đã xóa: drive/MyDrive/sports_data/football/a285eba419.jpg
Đã xóa: drive/MyDrive/sports_data/football/61b01d675c.jpg
Đã xóa: drive/MyDrive/sports_data/football/a2f357c4bf.jpg
Đã xóa: drive/MyDrive/sports_data/football/9a607a1584.jpg
Đã xóa: drive/MyDrive/sports_data/football/c9e4eb6aac.jpg
Đã xóa: drive/MyDrive/sports_data/football/4a38142f16.jpg
Đã xóa: drive/MyDrive/sports_data/football/7f6f79e353.jpg
Đã xóa: drive/MyDrive/sports_data/football/c5354d8cb4.jpg
Đã xóa: drive/MyDrive/sports_data/football/734ffd5761.jpg

fastdup By Visual Layer, Inc. 2024. All rights reserved.


Hoàn thành xử lý bất thường nhãn: football
Đang xử lý nhãn: swimming

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/swimming"[0m
Work directory is set to [0;35m"AI_swimming"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:22<00:00,  7.64s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.

Tìm thấy 53 ảnh bất thường trong nhãn swimming
Đã xóa: drive/MyDrive/sports_data/swimming/1bf6731a34.jpg
Đã xóa: drive/MyDrive/sports_data/swimming/614138a6b6.jpg
Đã xóa: drive/MyDrive/sports_data/swimming/fbc70aa01c.jpg
Đã xóa: drive/MyDrive/sports_data/swimming/fae3ae4d70.jpg
Đã xóa: drive/MyDrive/sports_data/swimming/59146d21d1.jpg
Đã xóa: drive/MyDrive/sports_data/swimming/3b90b9f115.jpg
Đã xóa: drive/MyDrive/sports_data/swimming/68f029108c.jpg
Đã xóa: drive/MyDrive/sports_data/swimming/4ad6cc10d6.jpg
Đã xóa: drive/MyDrive/sports_data/swimming/1e6a2d5614.jpg
Đã xóa: drive/MyDrive/sports_data/swimming/76bede4f33.jpg
Đã xóa: drive/MyDrive/sports_data/swimming/619e8b5ad6.jpg

fastdup By Visual Layer, Inc. 2024. All rights reserved.


Hoàn thành xử lý bất thường nhãn: swimming
Đang xử lý nhãn: tennis

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/tennis"[0m
Work directory is set to [0;35m"AI_tennis"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:51<00:00, 17.11s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.

Tìm thấy 98 ảnh bất thường trong nhãn tennis
Đã xóa: drive/MyDrive/sports_data/tennis/42e9891221.jpg
Đã xóa: drive/MyDrive/sports_data/tennis/e78eae0d9b.jpg
Đã xóa: drive/MyDrive/sports_data/tennis/6d655af337.jpg
Đã xóa: drive/MyDrive/sports_data/tennis/1045261517.jpg
Đã xóa: drive/MyDrive/sports_data/tennis/ba24def98e.jpg
Đã xóa: drive/MyDrive/sports_data/tennis/89a6ae23ef.jpg
Đã xóa: drive/MyDrive/sports_data/tennis/24e05b329b.jpg
Đã xóa: drive/MyDrive/sports_data/tennis/097cdfa562.jpg
Đã xóa: drive/MyDrive/sports_data/tennis/07eab9352a.jpg
Đã xóa: drive/MyDrive/sports_data/tennis/5f38824b6f.jpg
Đã xóa: drive/MyDrive/sports_data/tennis/2f81b3e51b.jpg
Đã xóa: drive/MyDrive/s

fastdup By Visual Layer, Inc. 2024. All rights reserved.


Hoàn thành xử lý bất thường nhãn: tennis
Đang xử lý nhãn: wrestling

fastdup By Visual Layer, Inc. 2024. All rights reserved.

A fastdup dataset object was created!

Input directory is set to [0;35m"/content/drive/MyDrive/sports_data/wrestling"[0m
Work directory is set to [0;35m"AI_wrestling"[0m

The next steps are:
   1. Analyze your dataset with the [0;35m.run()[0m function of the dataset object
   2. Interactively explore your data on your local machine with the [0;35m.explore()[0m function of the dataset object

For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.



  df_annot = self._df_annot.query(f'{FD.ANNOT_VALID}') if valid_only and self._df_annot is not None \
Done: 100%|██████████| 3/3 [00:51<00:00, 17.05s/it]



Analysis complete. Use the [0;35m.explore()[0m function to interactively explore your data on your local machine.

Alternatively, you can generate HTML-based galleries.
For more information, use [0;35mhelp(fastdup)[0m or check our documentation https://docs.visual-layer.com/docs/getting-started-with-fastdup.

Tìm thấy 116 ảnh bất thường trong nhãn wrestling
Đã xóa: drive/MyDrive/sports_data/wrestling/0c4b6db7c6.jpg
Đã xóa: drive/MyDrive/sports_data/wrestling/c9004c06f4.jpg
Đã xóa: drive/MyDrive/sports_data/wrestling/b8e461ed8b.jpg
Đã xóa: drive/MyDrive/sports_data/wrestling/2eb9c04b95.jpg
Đã xóa: drive/MyDrive/sports_data/wrestling/c6c7f444dd.jpg
Đã xóa: drive/MyDrive/sports_data/wrestling/c8004.jpg
Đã xóa: drive/MyDrive/sports_data/wrestling/e88320c906.jpg
Đã xóa: drive/MyDrive/sports_data/wrestling/5406eda401.jpg
Đã xóa: drive/MyDrive/sports_data/wrestling/b52d7d1952.jpg
Đã xóa: drive/MyDrive/sports_data/wrestling/47f1f5d75d.jpg
Đã xóa: drive/MyDrive/sports_data/wrestling/896028

In [12]:
# kiểm tra số lượng ảnh còn lại trong mỗi nhãn sau khi lọc ảnh bất thường
for category in categories:
    category_dir = os.path.join(output_dir, category)
    print(f"Nhãn {category}: {len(os.listdir(category_dir))} ảnh")

Nhãn badminton: 1394 ảnh
Nhãn cricket: 1556 ảnh
Nhãn karate: 613 ảnh
Nhãn football: 1188 ảnh
Nhãn swimming: 652 ảnh
Nhãn tennis: 1445 ảnh
Nhãn wrestling: 1471 ảnh


In [13]:
# Hiển thị ảnh bất thường cho từng nhãn
for category, fd in fds.items():
    print(f"Hiển thị ảnh bất thường cho nhãn: {category}")
    fd.vis.outliers_gallery(ascending=True)

Hiển thị ảnh bất thường cho nhãn: badminton


Generating gallery:   0%|          | 0/20 [00:00<?, ?it/s]

Failed to read image from img_path drive/MyDrive/sports_data/badminton/ee6508bc72.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/87096582c1.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/ead523f2a6.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/f2ae0ccc3c.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/40250a515d.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/fa09ba543c.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/31343b0ac2.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/358c149fb9.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/08b6ea2143.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/76eafa96a2.jpg


Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/badminton/ee6508bc72.jpg /content/drive/MyDrive/sports_data/badminton
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/badminton/87096582c1.jpg /content/drive/MyDrive/sports_data/badminton
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from driv

Failed to read image from img_path drive/MyDrive/sports_data/badminton/d6ad22dbec.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/b7a2097352.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/0559a5aa07.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/06540352ad.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/f4456c2d50.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/868e209c3f.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/7f8292c33b.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/3936236487.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/2f32eba567.jpg
Failed to read image from img_path drive/MyDrive/sports_data/badminton/18c5df9680.jpg


Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/badminton/d6ad22dbec.jpg /content/drive/MyDrive/sports_data/badminton
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/badminton/b7a2097352.jpg /content/drive/MyDrive/sports_data/badminton
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from driv

Stored outliers visual view in  AI_badminton/galleries/outliers.html
########################################################################################
Would you like to see awesome visualizations for some of the most popular academic datasets?
Click here to see and learn more: https://app.visual-layer.com/vl-datasets?utm_source=fastdup
########################################################################################


Info,Unnamed: 1
Distance,0.443076
Path,drive/MyDrive/sports_data/badminton/ee6508bc72.jpg

Info,Unnamed: 1
Distance,0.453978
Path,drive/MyDrive/sports_data/badminton/87096582c1.jpg

Info,Unnamed: 1
Distance,0.481823
Path,drive/MyDrive/sports_data/badminton/ead523f2a6.jpg

Info,Unnamed: 1
Distance,0.503097
Path,drive/MyDrive/sports_data/badminton/f2ae0ccc3c.jpg

Info,Unnamed: 1
Distance,0.515688
Path,drive/MyDrive/sports_data/badminton/40250a515d.jpg

Info,Unnamed: 1
Distance,0.564799
Path,drive/MyDrive/sports_data/badminton/fa09ba543c.jpg

Info,Unnamed: 1
Distance,0.574912
Path,drive/MyDrive/sports_data/badminton/31343b0ac2.jpg

Info,Unnamed: 1
Distance,0.583654
Path,drive/MyDrive/sports_data/badminton/358c149fb9.jpg

Info,Unnamed: 1
Distance,0.584158
Path,drive/MyDrive/sports_data/badminton/08b6ea2143.jpg

Info,Unnamed: 1
Distance,0.593818
Path,drive/MyDrive/sports_data/badminton/76eafa96a2.jpg

Info,Unnamed: 1
Distance,0.594024
Path,drive/MyDrive/sports_data/badminton/d6ad22dbec.jpg

Info,Unnamed: 1
Distance,0.594224
Path,drive/MyDrive/sports_data/badminton/b7a2097352.jpg

Info,Unnamed: 1
Distance,0.607925
Path,drive/MyDrive/sports_data/badminton/0559a5aa07.jpg

Info,Unnamed: 1
Distance,0.609393
Path,drive/MyDrive/sports_data/badminton/06540352ad.jpg

Info,Unnamed: 1
Distance,0.611918
Path,drive/MyDrive/sports_data/badminton/f4456c2d50.jpg

Info,Unnamed: 1
Distance,0.612528
Path,drive/MyDrive/sports_data/badminton/868e209c3f.jpg

Info,Unnamed: 1
Distance,0.613099
Path,drive/MyDrive/sports_data/badminton/7f8292c33b.jpg

Info,Unnamed: 1
Distance,0.613678
Path,drive/MyDrive/sports_data/badminton/3936236487.jpg

Info,Unnamed: 1
Distance,0.616893
Path,drive/MyDrive/sports_data/badminton/2f32eba567.jpg

Info,Unnamed: 1
Distance,0.619623
Path,drive/MyDrive/sports_data/badminton/18c5df9680.jpg


Hiển thị ảnh bất thường cho nhãn: cricket


Generating gallery:   0%|          | 0/20 [00:00<?, ?it/s]

Failed to read image from img_path drive/MyDrive/sports_data/cricket/1506e455dc.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/c17.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/b4614bbd0b.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/eed2f075c6.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/7b5ce59aa5.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/6f5a719e8d.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/3455c44896.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/1a77e4a2c5.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/f8df6eaf77.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/224a5c5b5b.jpg


Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/cricket/1506e455dc.jpg /content/drive/MyDrive/sports_data/cricket
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/cricket/c17.jpg /content/drive/MyDrive/sports_data/cricket
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sport

Failed to read image from img_path drive/MyDrive/sports_data/cricket/a33a64fee4.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/bb8e9d8db9.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/4b0bc07882.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/a3f6e899da.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/1fce84d492.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/484666d6bf.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/7c6629f599.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/cf20a5aba5.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/ba4ee26825.jpg
Failed to read image from img_path drive/MyDrive/sports_data/cricket/26f53c8ca7.jpg
Stored outliers visual view in  AI_cricket/galleries/outliers.html
########################################################################################
Woul

  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/cricket/224a5c5b5b.jpg /content/drive/MyDrive/sports_data/cricket
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/cricket/a33a64fee4.jpg /content/drive/MyDrive/sports_data/cricket
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/cricket/bb8e9d8db9.jp

Info,Unnamed: 1
Distance,0.450065
Path,drive/MyDrive/sports_data/cricket/1506e455dc.jpg

Info,Unnamed: 1
Distance,0.554618
Path,drive/MyDrive/sports_data/cricket/c17.jpg

Info,Unnamed: 1
Distance,0.56662
Path,drive/MyDrive/sports_data/cricket/b4614bbd0b.jpg

Info,Unnamed: 1
Distance,0.587307
Path,drive/MyDrive/sports_data/cricket/eed2f075c6.jpg

Info,Unnamed: 1
Distance,0.58845
Path,drive/MyDrive/sports_data/cricket/7b5ce59aa5.jpg

Info,Unnamed: 1
Distance,0.596364
Path,drive/MyDrive/sports_data/cricket/6f5a719e8d.jpg

Info,Unnamed: 1
Distance,0.611126
Path,drive/MyDrive/sports_data/cricket/3455c44896.jpg

Info,Unnamed: 1
Distance,0.612012
Path,drive/MyDrive/sports_data/cricket/1a77e4a2c5.jpg

Info,Unnamed: 1
Distance,0.613114
Path,drive/MyDrive/sports_data/cricket/f8df6eaf77.jpg

Info,Unnamed: 1
Distance,0.615677
Path,drive/MyDrive/sports_data/cricket/224a5c5b5b.jpg

Info,Unnamed: 1
Distance,0.621663
Path,drive/MyDrive/sports_data/cricket/a33a64fee4.jpg

Info,Unnamed: 1
Distance,0.625626
Path,drive/MyDrive/sports_data/cricket/bb8e9d8db9.jpg

Info,Unnamed: 1
Distance,0.634324
Path,drive/MyDrive/sports_data/cricket/4b0bc07882.jpg

Info,Unnamed: 1
Distance,0.636979
Path,drive/MyDrive/sports_data/cricket/a3f6e899da.jpg

Info,Unnamed: 1
Distance,0.637159
Path,drive/MyDrive/sports_data/cricket/1fce84d492.jpg

Info,Unnamed: 1
Distance,0.637966
Path,drive/MyDrive/sports_data/cricket/484666d6bf.jpg

Info,Unnamed: 1
Distance,0.639938
Path,drive/MyDrive/sports_data/cricket/7c6629f599.jpg

Info,Unnamed: 1
Distance,0.641542
Path,drive/MyDrive/sports_data/cricket/cf20a5aba5.jpg

Info,Unnamed: 1
Distance,0.64697
Path,drive/MyDrive/sports_data/cricket/ba4ee26825.jpg

Info,Unnamed: 1
Distance,0.64697
Path,drive/MyDrive/sports_data/cricket/26f53c8ca7.jpg


Hiển thị ảnh bất thường cho nhãn: karate


Generating gallery:   0%|          | 0/20 [00:00<?, ?it/s]

Failed to read image from img_path drive/MyDrive/sports_data/karate/c1004.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/3b8f71de6d.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/8fb3bbd60c.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/9311bd03f3.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/898ea7fd7d.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/c1009.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/735aa4138a.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/85baea6ca9.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/ddb83cbd3c.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/3b2b742b58.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/8aa75c1544.jpg


Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/karate/c1004.jpg /content/drive/MyDrive/sports_data/karate
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/karate/3b8f71de6d.jpg /content/drive/MyDrive/sports_data/karate
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_

Failed to read image from img_path drive/MyDrive/sports_data/karate/21a811c5ce.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/c1003.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/5f023bc97b.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/d77d5629ed.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/4653964268.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/2cc02d5f10.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/9581e1136d.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/751b6904bb.jpg
Failed to read image from img_path drive/MyDrive/sports_data/karate/f66520c8bd.jpg
Stored outliers visual view in  AI_karate/galleries/outliers.html
########################################################################################
Would you like to see awesome visualizations for some of the most popular academic datasets?
Click here

Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/karate/21a811c5ce.jpg /content/drive/MyDrive/sports_data/karate
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/karate/c1003.jpg /content/drive/MyDrive/sports_data/karate
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_

Info,Unnamed: 1
Distance,0.473978
Path,drive/MyDrive/sports_data/karate/c1004.jpg

Info,Unnamed: 1
Distance,0.568774
Path,drive/MyDrive/sports_data/karate/3b8f71de6d.jpg

Info,Unnamed: 1
Distance,0.571812
Path,drive/MyDrive/sports_data/karate/8fb3bbd60c.jpg

Info,Unnamed: 1
Distance,0.591625
Path,drive/MyDrive/sports_data/karate/9311bd03f3.jpg

Info,Unnamed: 1
Distance,0.597016
Path,drive/MyDrive/sports_data/karate/898ea7fd7d.jpg

Info,Unnamed: 1
Distance,0.598354
Path,drive/MyDrive/sports_data/karate/c1009.jpg

Info,Unnamed: 1
Distance,0.602406
Path,drive/MyDrive/sports_data/karate/735aa4138a.jpg

Info,Unnamed: 1
Distance,0.607816
Path,drive/MyDrive/sports_data/karate/85baea6ca9.jpg

Info,Unnamed: 1
Distance,0.60854
Path,drive/MyDrive/sports_data/karate/ddb83cbd3c.jpg

Info,Unnamed: 1
Distance,0.612715
Path,drive/MyDrive/sports_data/karate/3b2b742b58.jpg

Info,Unnamed: 1
Distance,0.613916
Path,drive/MyDrive/sports_data/karate/8aa75c1544.jpg

Info,Unnamed: 1
Distance,0.614108
Path,drive/MyDrive/sports_data/karate/21a811c5ce.jpg

Info,Unnamed: 1
Distance,0.618221
Path,drive/MyDrive/sports_data/karate/c1003.jpg

Info,Unnamed: 1
Distance,0.627911
Path,drive/MyDrive/sports_data/karate/5f023bc97b.jpg

Info,Unnamed: 1
Distance,0.629417
Path,drive/MyDrive/sports_data/karate/d77d5629ed.jpg

Info,Unnamed: 1
Distance,0.632824
Path,drive/MyDrive/sports_data/karate/4653964268.jpg

Info,Unnamed: 1
Distance,0.632877
Path,drive/MyDrive/sports_data/karate/2cc02d5f10.jpg

Info,Unnamed: 1
Distance,0.632953
Path,drive/MyDrive/sports_data/karate/9581e1136d.jpg

Info,Unnamed: 1
Distance,0.635102
Path,drive/MyDrive/sports_data/karate/751b6904bb.jpg

Info,Unnamed: 1
Distance,0.635267
Path,drive/MyDrive/sports_data/karate/f66520c8bd.jpg


Hiển thị ảnh bất thường cho nhãn: football


Generating gallery:   0%|          | 0/20 [00:00<?, ?it/s]

Failed to read image from img_path drive/MyDrive/sports_data/football/9d3de05692.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/61b01d675c.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/c9e4eb6aac.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/4a38142f16.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/7f6f79e353.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/a285eba419.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/734ffd5761.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/c5354d8cb4.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/64c83d6d34.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/82b7d5c2da.jpg


Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/football/9d3de05692.jpg /content/drive/MyDrive/sports_data/football
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/football/61b01d675c.jpg /content/drive/MyDrive/sports_data/football
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/My

Failed to read image from img_path drive/MyDrive/sports_data/football/8e40382093.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/a2f357c4bf.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/c2035.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/19dfe2dddc.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/fe7aa3af05.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/9a607a1584.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/a4123d002a.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/fc8d63220c.jpg


Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/football/8e40382093.jpg /content/drive/MyDrive/sports_data/football
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/football/a2f357c4bf.jpg /content/drive/MyDrive/sports_data/football
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/My

Failed to read image from img_path drive/MyDrive/sports_data/football/a4db62fa26.jpg
Failed to read image from img_path drive/MyDrive/sports_data/football/5e895fcc86.jpg
Stored outliers visual view in  AI_football/galleries/outliers.html
########################################################################################
Would you like to see awesome visualizations for some of the most popular academic datasets?
Click here to see and learn more: https://app.visual-layer.com/vl-datasets?utm_source=fastdup
########################################################################################


Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/football/a4db62fa26.jpg /content/drive/MyDrive/sports_data/football
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/football/5e895fcc86.jpg /content/drive/MyDrive/sports_data/football


Info,Unnamed: 1
Distance,0.477551
Path,drive/MyDrive/sports_data/football/9d3de05692.jpg

Info,Unnamed: 1
Distance,0.529083
Path,drive/MyDrive/sports_data/football/61b01d675c.jpg

Info,Unnamed: 1
Distance,0.541974
Path,drive/MyDrive/sports_data/football/c9e4eb6aac.jpg

Info,Unnamed: 1
Distance,0.546701
Path,drive/MyDrive/sports_data/football/4a38142f16.jpg

Info,Unnamed: 1
Distance,0.548198
Path,drive/MyDrive/sports_data/football/7f6f79e353.jpg

Info,Unnamed: 1
Distance,0.553882
Path,drive/MyDrive/sports_data/football/a285eba419.jpg

Info,Unnamed: 1
Distance,0.556374
Path,drive/MyDrive/sports_data/football/734ffd5761.jpg

Info,Unnamed: 1
Distance,0.556874
Path,drive/MyDrive/sports_data/football/c5354d8cb4.jpg

Info,Unnamed: 1
Distance,0.559207
Path,drive/MyDrive/sports_data/football/64c83d6d34.jpg

Info,Unnamed: 1
Distance,0.56031
Path,drive/MyDrive/sports_data/football/82b7d5c2da.jpg

Info,Unnamed: 1
Distance,0.560465
Path,drive/MyDrive/sports_data/football/8e40382093.jpg

Info,Unnamed: 1
Distance,0.564371
Path,drive/MyDrive/sports_data/football/a2f357c4bf.jpg

Info,Unnamed: 1
Distance,0.564518
Path,drive/MyDrive/sports_data/football/c2035.jpg

Info,Unnamed: 1
Distance,0.56591
Path,drive/MyDrive/sports_data/football/19dfe2dddc.jpg

Info,Unnamed: 1
Distance,0.567136
Path,drive/MyDrive/sports_data/football/fe7aa3af05.jpg

Info,Unnamed: 1
Distance,0.571933
Path,drive/MyDrive/sports_data/football/9a607a1584.jpg

Info,Unnamed: 1
Distance,0.572366
Path,drive/MyDrive/sports_data/football/a4123d002a.jpg

Info,Unnamed: 1
Distance,0.572544
Path,drive/MyDrive/sports_data/football/fc8d63220c.jpg

Info,Unnamed: 1
Distance,0.576399
Path,drive/MyDrive/sports_data/football/a4db62fa26.jpg

Info,Unnamed: 1
Distance,0.580469
Path,drive/MyDrive/sports_data/football/5e895fcc86.jpg


Hiển thị ảnh bất thường cho nhãn: swimming


Generating gallery:   0%|          | 0/20 [00:00<?, ?it/s]

Failed to read image from img_path drive/MyDrive/sports_data/swimming/1bf6731a34.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/614138a6b6.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/fbc70aa01c.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/fae3ae4d70.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/59146d21d1.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/3b90b9f115.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/68f029108c.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/4ad6cc10d6.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/619e8b5ad6.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/a837d63e34.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/169be9bfda.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swim

Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/swimming/1bf6731a34.jpg /content/drive/MyDrive/sports_data/swimming
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/swimming/614138a6b6.jpg /content/drive/MyDrive/sports_data/swimming
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/My

Failed to read image from img_path drive/MyDrive/sports_data/swimming/1e6a2d5614.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/76bede4f33.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/ca38ffe010.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/157c299a95.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/42edb37438.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/063330a554.jpg


AssertionError: Failed to read image from drive/MyDrive/sports_data/swimming/b65062fa7f.jpg /content/drive/MyDrive/sports_data/swimming
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/swimming/1e6a2d5614.jpg /content/drive/MyDrive/sports_data/swimming
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/swimming/76bede4f33.jpg /content/drive/MyDrive/sports_data/swimming
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_ou

Failed to read image from img_path drive/MyDrive/sports_data/swimming/36e898dd84.jpg
Failed to read image from img_path drive/MyDrive/sports_data/swimming/a2c0f03654.jpg
Stored outliers visual view in  AI_swimming/galleries/outliers.html
########################################################################################
Would you like to see awesome visualizations for some of the most popular academic datasets?
Click here to see and learn more: https://app.visual-layer.com/vl-datasets?utm_source=fastdup
########################################################################################


Info,Unnamed: 1
Distance,0.542395
Path,drive/MyDrive/sports_data/swimming/1bf6731a34.jpg

Info,Unnamed: 1
Distance,0.563127
Path,drive/MyDrive/sports_data/swimming/614138a6b6.jpg

Info,Unnamed: 1
Distance,0.567857
Path,drive/MyDrive/sports_data/swimming/fbc70aa01c.jpg

Info,Unnamed: 1
Distance,0.568217
Path,drive/MyDrive/sports_data/swimming/fae3ae4d70.jpg

Info,Unnamed: 1
Distance,0.583545
Path,drive/MyDrive/sports_data/swimming/59146d21d1.jpg

Info,Unnamed: 1
Distance,0.591998
Path,drive/MyDrive/sports_data/swimming/3b90b9f115.jpg

Info,Unnamed: 1
Distance,0.59639
Path,drive/MyDrive/sports_data/swimming/68f029108c.jpg

Info,Unnamed: 1
Distance,0.597082
Path,drive/MyDrive/sports_data/swimming/4ad6cc10d6.jpg

Info,Unnamed: 1
Distance,0.601769
Path,drive/MyDrive/sports_data/swimming/619e8b5ad6.jpg

Info,Unnamed: 1
Distance,0.605168
Path,drive/MyDrive/sports_data/swimming/a837d63e34.jpg

Info,Unnamed: 1
Distance,0.607006
Path,drive/MyDrive/sports_data/swimming/169be9bfda.jpg

Info,Unnamed: 1
Distance,0.607038
Path,drive/MyDrive/sports_data/swimming/b65062fa7f.jpg

Info,Unnamed: 1
Distance,0.612252
Path,drive/MyDrive/sports_data/swimming/1e6a2d5614.jpg

Info,Unnamed: 1
Distance,0.61424
Path,drive/MyDrive/sports_data/swimming/76bede4f33.jpg

Info,Unnamed: 1
Distance,0.61531
Path,drive/MyDrive/sports_data/swimming/ca38ffe010.jpg

Info,Unnamed: 1
Distance,0.616268
Path,drive/MyDrive/sports_data/swimming/157c299a95.jpg

Info,Unnamed: 1
Distance,0.618598
Path,drive/MyDrive/sports_data/swimming/42edb37438.jpg

Info,Unnamed: 1
Distance,0.619483
Path,drive/MyDrive/sports_data/swimming/063330a554.jpg

Info,Unnamed: 1
Distance,0.620006
Path,drive/MyDrive/sports_data/swimming/36e898dd84.jpg

Info,Unnamed: 1
Distance,0.620186
Path,drive/MyDrive/sports_data/swimming/a2c0f03654.jpg


Hiển thị ảnh bất thường cho nhãn: tennis


Generating gallery:   0%|          | 0/20 [00:00<?, ?it/s]

Failed to read image from img_path drive/MyDrive/sports_data/tennis/42e9891221.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/6d655af337.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/24e05b329b.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/1045261517.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/5f38824b6f.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/89a6ae23ef.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/2f81b3e51b.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/c84e9e109a.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/ab43dbdbf7.jpg


Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/tennis/42e9891221.jpg /content/drive/MyDrive/sports_data/tennis
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/tennis/6d655af337.jpg /content/drive/MyDrive/sports_data/tennis
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sp

Failed to read image from img_path drive/MyDrive/sports_data/tennis/097cdfa562.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/e1e2a7e4c0.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/bc93a15ac0.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/31a0d78cbf.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/c620af3913.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/779988fdb3.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/2ebecfe199.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/23b18a929a.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/422833d4d1.jpg
Failed to read image from img_path drive/MyDrive/sports_data/tennis/dca30e2998.jpg


Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/tennis/097cdfa562.jpg /content/drive/MyDrive/sports_data/tennis
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/tennis/e1e2a7e4c0.jpg /content/drive/MyDrive/sports_data/tennis
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sp

Failed to read image from img_path drive/MyDrive/sports_data/tennis/4c88415a39.jpg
Stored outliers visual view in  AI_tennis/galleries/outliers.html
########################################################################################
Would you like to see awesome visualizations for some of the most popular academic datasets?
Click here to see and learn more: https://app.visual-layer.com/vl-datasets?utm_source=fastdup
########################################################################################


Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/tennis/4c88415a39.jpg /content/drive/MyDrive/sports_data/tennis


Info,Unnamed: 1
Distance,0.437663
Path,drive/MyDrive/sports_data/tennis/42e9891221.jpg

Info,Unnamed: 1
Distance,0.495438
Path,drive/MyDrive/sports_data/tennis/6d655af337.jpg

Info,Unnamed: 1
Distance,0.517078
Path,drive/MyDrive/sports_data/tennis/24e05b329b.jpg

Info,Unnamed: 1
Distance,0.52108
Path,drive/MyDrive/sports_data/tennis/1045261517.jpg

Info,Unnamed: 1
Distance,0.524761
Path,drive/MyDrive/sports_data/tennis/5f38824b6f.jpg

Info,Unnamed: 1
Distance,0.524761
Path,drive/MyDrive/sports_data/tennis/89a6ae23ef.jpg

Info,Unnamed: 1
Distance,0.527807
Path,drive/MyDrive/sports_data/tennis/2f81b3e51b.jpg

Info,Unnamed: 1
Distance,0.536584
Path,drive/MyDrive/sports_data/tennis/c84e9e109a.jpg

Info,Unnamed: 1
Distance,0.537837
Path,drive/MyDrive/sports_data/tennis/ab43dbdbf7.jpg

Info,Unnamed: 1
Distance,0.540514
Path,drive/MyDrive/sports_data/tennis/097cdfa562.jpg

Info,Unnamed: 1
Distance,0.55529
Path,drive/MyDrive/sports_data/tennis/e1e2a7e4c0.jpg

Info,Unnamed: 1
Distance,0.566413
Path,drive/MyDrive/sports_data/tennis/bc93a15ac0.jpg

Info,Unnamed: 1
Distance,0.566631
Path,drive/MyDrive/sports_data/tennis/31a0d78cbf.jpg

Info,Unnamed: 1
Distance,0.568197
Path,drive/MyDrive/sports_data/tennis/c620af3913.jpg

Info,Unnamed: 1
Distance,0.569794
Path,drive/MyDrive/sports_data/tennis/779988fdb3.jpg

Info,Unnamed: 1
Distance,0.571292
Path,drive/MyDrive/sports_data/tennis/2ebecfe199.jpg

Info,Unnamed: 1
Distance,0.578088
Path,drive/MyDrive/sports_data/tennis/23b18a929a.jpg

Info,Unnamed: 1
Distance,0.580248
Path,drive/MyDrive/sports_data/tennis/422833d4d1.jpg

Info,Unnamed: 1
Distance,0.582061
Path,drive/MyDrive/sports_data/tennis/dca30e2998.jpg

Info,Unnamed: 1
Distance,0.583868
Path,drive/MyDrive/sports_data/tennis/4c88415a39.jpg


Hiển thị ảnh bất thường cho nhãn: wrestling


Generating gallery:   0%|          | 0/20 [00:00<?, ?it/s]

Failed to read image from img_path drive/MyDrive/sports_data/wrestling/0c4b6db7c6.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/b8e461ed8b.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/c6c7f444dd.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/2eb9c04b95.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/c8004.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/c9004c06f4.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/5406eda401.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/b52d7d1952.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/8960280850.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/3c8fee00b0.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/3760663aaf.jpg
Failed to read image from img_path drive/MyDrive/sports_dat

Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/wrestling/0c4b6db7c6.jpg /content/drive/MyDrive/sports_data/wrestling
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/wrestling/b8e461ed8b.jpg /content/drive/MyDrive/sports_data/wrestling
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from driv

Failed to read image from img_path drive/MyDrive/sports_data/wrestling/e88320c906.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/6bd5d600c4.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/d03ed14be3.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/e25ab4d01a.jpg
Failed to read image from img_path drive/MyDrive/sports_data/wrestling/a682b9aef7.jpg
Stored outliers visual view in  AI_wrestling/galleries/outliers.html
########################################################################################
Would you like to see awesome visualizations for some of the most popular academic datasets?
Click here to see and learn more: https://app.visual-layer.com/vl-datasets?utm_source=fastdup
########################################################################################


Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/wrestling/e88320c906.jpg /content/drive/MyDrive/sports_data/wrestling
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from drive/MyDrive/sports_data/wrestling/6bd5d600c4.jpg /content/drive/MyDrive/sports_data/wrestling
Traceback (most recent call last):
  File "/usr/local/lib/python3.10/dist-packages/fastdup/galleries.py", line 496, in load_one_image_for_outliers
    assert img is not None, f"Failed to read image from {impath1} {input_dir}"
AssertionError: Failed to read image from driv

Info,Unnamed: 1
Distance,0.418792
Path,drive/MyDrive/sports_data/wrestling/0c4b6db7c6.jpg

Info,Unnamed: 1
Distance,0.524557
Path,drive/MyDrive/sports_data/wrestling/b8e461ed8b.jpg

Info,Unnamed: 1
Distance,0.539804
Path,drive/MyDrive/sports_data/wrestling/c6c7f444dd.jpg

Info,Unnamed: 1
Distance,0.541789
Path,drive/MyDrive/sports_data/wrestling/2eb9c04b95.jpg

Info,Unnamed: 1
Distance,0.549564
Path,drive/MyDrive/sports_data/wrestling/c8004.jpg

Info,Unnamed: 1
Distance,0.554531
Path,drive/MyDrive/sports_data/wrestling/c9004c06f4.jpg

Info,Unnamed: 1
Distance,0.565561
Path,drive/MyDrive/sports_data/wrestling/5406eda401.jpg

Info,Unnamed: 1
Distance,0.566359
Path,drive/MyDrive/sports_data/wrestling/b52d7d1952.jpg

Info,Unnamed: 1
Distance,0.570826
Path,drive/MyDrive/sports_data/wrestling/8960280850.jpg

Info,Unnamed: 1
Distance,0.578302
Path,drive/MyDrive/sports_data/wrestling/3c8fee00b0.jpg

Info,Unnamed: 1
Distance,0.578455
Path,drive/MyDrive/sports_data/wrestling/3760663aaf.jpg

Info,Unnamed: 1
Distance,0.581011
Path,drive/MyDrive/sports_data/wrestling/5b6aef6ae3.jpg

Info,Unnamed: 1
Distance,0.585661
Path,drive/MyDrive/sports_data/wrestling/5d594319ef.jpg

Info,Unnamed: 1
Distance,0.589503
Path,drive/MyDrive/sports_data/wrestling/899a79c868.jpg

Info,Unnamed: 1
Distance,0.591118
Path,drive/MyDrive/sports_data/wrestling/47f1f5d75d.jpg

Info,Unnamed: 1
Distance,0.591261
Path,drive/MyDrive/sports_data/wrestling/e88320c906.jpg

Info,Unnamed: 1
Distance,0.595459
Path,drive/MyDrive/sports_data/wrestling/6bd5d600c4.jpg

Info,Unnamed: 1
Distance,0.595656
Path,drive/MyDrive/sports_data/wrestling/d03ed14be3.jpg

Info,Unnamed: 1
Distance,0.596012
Path,drive/MyDrive/sports_data/wrestling/e25ab4d01a.jpg

Info,Unnamed: 1
Distance,0.596549
Path,drive/MyDrive/sports_data/wrestling/a682b9aef7.jpg
