In [1]:
import numpy as np
from PIL import Image
from typing import Union, List
from pathlib import Path

from transights.utils import FolderScanner as fs


# NOTE(review): presumably a random seed; no cell visible in this section
# reads it — confirm it is still needed before keeping it in the setup cell.
random_state = 23

In [2]:
# Example 1: Get files from a single folder (Path object)
# The folder is given as a separator-free relative name so the cell runs on any
# OS: a backslash is a path separator only on Windows, and on POSIX a literal
# like ".\transights" would be treated as one (non-existent) entry name.
folder_path = Path("transights")
files = fs.get_files(folder_path)
print(files)

[WindowsPath('transights/__init__.py')]


In [3]:
# Example 2: Get files from multiple folders (Path objects)
# Sub-folders are joined with the "/" operator rather than embedded backslashes,
# so pathlib inserts the correct separator for the current platform.
package_dir = Path("transights")
folder_paths = [package_dir / "aggregator", package_dir / "transforms"]
files = fs.get_files(folder_paths)
print(files)

[WindowsPath('transights/aggregator/Aggregator.py'), WindowsPath('transights/aggregator/__init__.py'), WindowsPath('transights/transforms/transforms.py'), WindowsPath('transights/transforms/__init__.py')]


In [4]:
# Example 3: Get files from a single folder (string)
# A plain relative name is used instead of a ".\..." literal: backslashes are
# only path separators on Windows, so the string form must avoid them to stay
# portable.
folder_path = "transights"
files = fs.get_files(folder_path)
print(files)

[WindowsPath('transights/__init__.py')]


In [5]:
# Example 4: Get files from multiple folders (strings)
# Forward slashes are accepted as separators on both Windows and POSIX, whereas
# backslashes are separators on Windows only.
folder_paths = ["transights/aggregator", "transights/transforms"]
files = fs.get_files(folder_paths)
print(files)

[WindowsPath('transights/aggregator/Aggregator.py'), WindowsPath('transights/aggregator/__init__.py'), WindowsPath('transights/transforms/transforms.py'), WindowsPath('transights/transforms/__init__.py')]


In [7]:
# Example 5: Get files with a specific extension
# The folder is assembled with the "/" operator so no OS-specific separator is
# hard-coded in the path.
folder_path = Path("transights") / "aggregator"
# The extension is written with its leading dot.
extension = ".py"
files = fs.get_files(folder_path, extension)
print(files)

[WindowsPath('transights/aggregator/Aggregator.py'), WindowsPath('transights/aggregator/__init__.py')]


In [11]:
# Example 6: Get files with multiple specific extensions
# The scan starts from the sibling "transights" folder one level up; the path is
# built with the "/" operator so it resolves on Windows and POSIX alike.
folder_path = Path("..") / "transights"
# Several extensions are passed as a list, each with its leading dot.
extensions = [".py", ".txt"]
files = fs.get_files(folder_path, extensions)
print(files)

[WindowsPath('../transights/requirements.txt'), WindowsPath('../transights/setup.py')]


In [8]:
# Example 7: Get image files from a single folder (Path object)
# Path components are joined with "/" instead of a backslash literal, which
# would only be split into components on Windows.
folder_path = Path("data") / "train"
image_files = fs.get_image_files(folder_path)
print(image_files)

[WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/907363-_AL_23-51-09.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/911838-_AL_22-47-38.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/916564-_AL_21-33-12.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/917955-_AL_22-56-58.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/921001-_AL_18-19-32.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/930299-1_AL_23-23-15.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/930299-2_AL_23-36-25.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/931807-1_AL_16-32-59.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/931807-2_AL_16-35-29.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/931932-_AL_21-22-57.jpg')]


In [9]:
# Example 8: Get image files from multiple folders (Path objects)
# Both folders hang off the same relative "data" directory; joining with "/"
# keeps the paths free of OS-specific separators.
data_dir = Path("data")
folder_paths = [data_dir / "train", data_dir / "test"]
image_files = fs.get_image_files(folder_paths)
print(image_files)

[WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/907363-_AL_23-51-09.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/911838-_AL_22-47-38.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/916564-_AL_21-33-12.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/917955-_AL_22-56-58.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/921001-_AL_18-19-32.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/930299-1_AL_23-23-15.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/930299-2_AL_23-36-25.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/931807-1_AL_16-32-59.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/931807-2_AL_16-35-29.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/train/931932-_AL_21-22-57.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/test/894422-_AL_01-16-47.jpg'), WindowsPath('E:/Dropbox/git/tutorials/data/indigits/test/8944

In [10]:
# Example 9: Get CSV files from a single folder (Path object)
# The folder is passed as a Path here, so the heading says so. It is built with
# the "/" operator because a backslash literal is a separator only on Windows.
folder_path = Path("data") / "train"
csv_files = fs.get_csv_files(folder_path)
print(csv_files)

[WindowsPath('E:/Dropbox/git/tutorials/data/3class_anomalies.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/anagrams.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/anscombe.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/assignment1.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/assignment_2.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/assignment_3.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/assignment_3_categoricals.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/assignment_4.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/attention.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/brain_networks.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/car_crashes.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/DATA_dp_wc_bc.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/diamonds.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/dots.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/exercise.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/flights.csv'), Windo

In [11]:
# Example 10: Get CSV files from multiple folders (Path objects)
# The folders are passed as Path objects here, so the heading says so. They are
# joined with "/" to avoid hard-coding a Windows-only backslash separator.
data_dir = Path("data")
folder_paths = [data_dir / "train", data_dir / "test"]
csv_files = fs.get_csv_files(folder_paths)
print(csv_files)

[WindowsPath('E:/Dropbox/git/tutorials/data/3class_anomalies.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/anagrams.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/anscombe.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/assignment1.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/assignment_2.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/assignment_3.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/assignment_3_categoricals.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/assignment_4.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/attention.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/brain_networks.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/car_crashes.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/DATA_dp_wc_bc.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/diamonds.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/dots.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/exercise.csv'), WindowsPath('E:/Dropbox/git/tutorials/data/flights.csv'), Windo

In [12]:
# Example 11: Get all files recursively
# The scan starts from the sibling "transights" folder one level up; the path is
# built with the "/" operator so it is valid on Windows and POSIX alike.
folder_path = Path("..") / "transights"
# recursive=True is the only difference from the non-recursive calls above it
# in this notebook's examples.
files = fs.get_files(folder_path, recursive=True)
print(files)

[WindowsPath('../transights/.gitattributes'), WindowsPath('../transights/.gitignore'), WindowsPath('../transights/FolderScanner_demo.ipynb'), WindowsPath('../transights/LICENSE'), WindowsPath('../transights/package_testing.ipynb'), WindowsPath('../transights/README.md'), WindowsPath('../transights/requirements.txt'), WindowsPath('../transights/setup.py'), WindowsPath('../transights/.git/COMMIT_EDITMSG'), WindowsPath('../transights/.git/config'), WindowsPath('../transights/.git/description'), WindowsPath('../transights/.git/FETCH_HEAD'), WindowsPath('../transights/.git/HEAD'), WindowsPath('../transights/.git/index'), WindowsPath('../transights/.git/ORIG_HEAD'), WindowsPath('../transights/.git/packed-refs'), WindowsPath('../transights/.git/hooks/applypatch-msg.sample'), WindowsPath('../transights/.git/hooks/commit-msg.sample'), WindowsPath('../transights/.git/hooks/fsmonitor-watchman.sample'), WindowsPath('../transights/.git/hooks/post-update.sample'), WindowsPath('../transights/.git/hoo