In [1]:
import glob
import pathlib
from pydantic import BaseModel, Field,  TypeAdapter
from typing import List, Literal, Dict, Optional
from uuid import uuid4
from enum import Enum
from IPython.display import Image 
import json
import pandas as pd


from constant import TARGET

In [2]:
class WasteLabel(str, Enum):
    PET = "PET"
    RIGID_PLASTIC = "Rigid Plastic"
    PLASTIC_CUPS = "Plastic Cups"
    FLEXIBLE_PLASTIC = "Flexible Plastic"
    HARD_PLASTIC = "Hard Plastic"
    PAPER = "Paper"
    METAL = "Metal"
    GLASS = "Glass"
    OTHER = "Other"

In [3]:
class Dataset(BaseModel):
    path:str = Field(description="Image path dataset")
    target:WasteLabel = Field(description= "Label of the image")

In [4]:
TARGET

{0: 'PET',
 1: 'Rigid Plastic',
 2: 'Plastic Cups',
 3: 'Flexible Plastic',
 4: 'Hard Plastic',
 5: 'Paper',
 6: 'Metal',
 7: 'Glass',
 8: 'Other'}

In [5]:
OUTPUT_FOLDER = "datasetv2.csv"

## Kaggle


### mostafaabla/garbage-classification

In [6]:
garbage_classification = glob.glob("datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/*")
garbage_classification

['datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/clothes',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/brown-glass',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/metal',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/white-glass',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/cardboard',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/shoes',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/battery',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/paper',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/biological',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/trash',
 'dat

#### Glass

In [7]:
garbage_classification_glass = glob.glob("datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/*glass/*.jpg")
garbage_classification_glass

['datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/brown-glass/brown-glass218.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/brown-glass/brown-glass404.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/brown-glass/brown-glass151.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/brown-glass/brown-glass219.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/brown-glass/brown-glass26.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/brown-glass/brown-glass135.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/brown-glass/brown-glass48.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/brown-glass/brown-glass279.jpg',
 'datasets/datasets/mostaf

In [8]:
glass_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.GLASS
    )
    for img_path in garbage_classification_glass
] 

In [9]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(glass_data)).to_csv(OUTPUT_FOLDER, index=False)

#### Paper


In [10]:
garbage_classification_paper= glob.glob("datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/*paper/*.jpg")
garbage_classification_paper


['datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/paper/paper829.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/paper/paper28.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/paper/paper377.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/paper/paper627.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/paper/paper822.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/paper/paper476.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/paper/paper480.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/paper/paper611.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/paper/paper550.jpg',
 'datasets/

In [11]:
paper_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PAPER
    )
    for img_path in garbage_classification_paper
] 

In [12]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(paper_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

In [13]:
garbage_classification_cardboard= glob.glob("datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/*cardboard/*.jpg")
garbage_classification_cardboard

['datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/cardboard/cardboard564.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/cardboard/cardboard328.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/cardboard/cardboard129.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/cardboard/cardboard883.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/cardboard/cardboard551.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/cardboard/cardboard442.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/cardboard/cardboard226.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/cardboard/cardboard788.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/v

In [14]:
cardboard_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PAPER
    )
    for img_path in garbage_classification_cardboard
] 

In [15]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(cardboard_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

#### Metal

In [16]:
garbage_classification_metal= glob.glob("datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/*metal/*.jpg")
garbage_classification_metal

['datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/metal/metal678.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/metal/metal713.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/metal/metal489.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/metal/metal274.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/metal/metal536.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/metal/metal116.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/metal/metal442.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/metal/metal260.jpg',
 'datasets/datasets/mostafaabla/garbage-classification/versions/1/garbage_classification/metal/metal289.jpg',
 'datasets

In [17]:
metal_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.METAL
    )
    for img_path in garbage_classification_metal
] 

In [18]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(metal_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### vencerlanz09/plastic-paper-garbage-bag-synthetic-images

In [19]:
class_bag = glob.glob("datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/*/Bag Classes/*")
class_bag

['datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Garbage Bag Images',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Paper Bag Images',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Plastic Bag Images']

### Plastic Bag

In [20]:
palstic_bag = glob.glob("datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/*/Bag Classes/Plastic Bag Images/*.jpg")
palstic_bag

['datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Plastic Bag Images/00000630.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Plastic Bag Images/00004748.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Plastic Bag Images/00003781.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Plastic Bag Images/00001559.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Plastic Bag Images/00004438.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Plastic Bag Images/00001025.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Plastic Bag Images/

In [21]:
plastic_bag_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.FLEXIBLE_PLASTIC
    )
    for img_path in palstic_bag
] 

In [22]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(plastic_bag_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

#### Paper Bag

In [23]:
paper_bag = glob.glob("datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/*/Bag Classes/Paper Bag Images/*.jpg")
paper_bag

['datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Paper Bag Images/00000630.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Paper Bag Images/00004748.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Paper Bag Images/00003781.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Paper Bag Images/00001559.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Paper Bag Images/00004438.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Paper Bag Images/00001025.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Paper Bag Images/00002927.jpg',

In [24]:
paper_bag_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PAPER
    )
    for img_path in paper_bag
] 

In [25]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(paper_bag_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

#### Garbage Bag

In [26]:
garbage_bag = glob.glob("datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/*/Bag Classes/Garbage Bag Images/*.jpg")
garbage_bag

['datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Garbage Bag Images/00000630.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Garbage Bag Images/00004748.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Garbage Bag Images/00003781.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Garbage Bag Images/00001559.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Garbage Bag Images/00004438.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Garbage Bag Images/00001025.jpg',
 'datasets/datasets/vencerlanz09/plastic-paper-garbage-bag-synthetic-images/versions/1/Bag Classes/Bag Classes/Garbage Bag Images/

In [27]:
garbage_bag_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.FLEXIBLE_PLASTIC
    )
    for img_path in garbage_bag
] 

In [28]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(garbage_bag_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### vencerlanz09/plastic-and-paper-cups-synthetic-image-dataset

In [29]:
cups_syn_ven = glob.glob("datasets/datasets/vencerlanz09/plastic-and-paper-cups-synthetic-image-dataset/versions/2/Cup Images/*/*")
len(cups_syn_ven)

15000

In [30]:
cups_syn_ven_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PLASTIC_CUPS
    )
    for img_path in cups_syn_ven
] 

In [31]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(cups_syn_ven_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### joebeachcapital/realwaste

In [32]:
class_realwaste = glob.glob("datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/*")
class_realwaste

['datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Vegetation',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Food Organics',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Miscellaneous Trash',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Cardboard',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Paper',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Glass',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Metal',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Textile Trash',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Plastic']

#### Cardboard

In [33]:
cardboard_class_realwaste = glob.glob("datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Cardboard/*.jpg")
cardboard_class_realwaste

['datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Cardboard/Cardboard_143.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Cardboard/Cardboard_398.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Cardboard/Cardboard_419.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Cardboard/Cardboard_237.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Cardboard/Cardboard_286.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Cardboard/Cardboard_311.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Cardboard/Cardboard_361.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Cardboard/Cardboard_62.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Cardboard/Cardboard_384

In [34]:
cardboard_class_realwaste_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PAPER)
    for img_path in cardboard_class_realwaste
] 

In [35]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(cardboard_class_realwaste_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

#### Paper


In [36]:
paper_class_realwaste = glob.glob("datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Paper/*.jpg")
paper_class_realwaste

['datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Paper/Paper_19.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Paper/Paper_284.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Paper/Paper_469.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Paper/Paper_269.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Paper/Paper_270.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Paper/Paper_109.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Paper/Paper_349.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Paper/Paper_57.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Paper/Paper_274.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste

In [37]:
paper_class_realwaste_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PAPER)
    for img_path in paper_class_realwaste
] 

In [38]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(paper_class_realwaste_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

#### Glass

In [39]:
glass_class_realwaste = glob.glob("datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Glass/*.jpg")
glass_class_realwaste

['datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Glass/Glass_180.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Glass/Glass_55.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Glass/Glass_187.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Glass/Glass_329.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Glass/Glass_58.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Glass/Glass_8.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Glass/Glass_411.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Glass/Glass_261.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Glass/Glass_100.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-m

In [40]:
glass_class_realwaste_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.GLASS)
    for img_path in glass_class_realwaste
] 

In [41]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(glass_class_realwaste_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

#### Metal

In [42]:
metal_class_realwaste = glob.glob("datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Metal/*.jpg")
metal_class_realwaste

['datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Metal/Metal_643.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Metal/Metal_219.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Metal/Metal_434.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Metal/Metal_202.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Metal/Metal_428.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Metal/Metal_129.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Metal/Metal_131.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Metal/Metal_150.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwaste-main/RealWaste/Metal/Metal_624.jpg',
 'datasets/datasets/joebeachcapital/realwaste/versions/1/realwas

In [43]:
metal_class_realwaste_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.METAL)
    for img_path in metal_class_realwaste
] 

In [44]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(metal_class_realwaste_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

## Roboflow

### a-3zezt/styrofoam-wfuot/v1

In [45]:
styrofoam = glob.glob("datasets/roboflow/styrofoam-wfuot/*/*.jpg")
styrofoam

['datasets/roboflow/styrofoam-wfuot/train/styrofoam-110-_jpg.rf.9312d248c97cc89e473e55369b238293.jpg',
 'datasets/roboflow/styrofoam-wfuot/train/styrofoam-307-_jpg.rf.66ac8669042dc660b79e7702d39c4c1a.jpg',
 'datasets/roboflow/styrofoam-wfuot/train/styrofoam-215-_jpg.rf.fa4bc57be8d9769c8bc2c389306bb12c.jpg',
 'datasets/roboflow/styrofoam-wfuot/train/styrofoam-95-_jpg.rf.620759b3f231df2ee481d4c7311569dc.jpg',
 'datasets/roboflow/styrofoam-wfuot/train/styrofoam-257-_jpg.rf.5327f434332c29fda95915e9a1e6109f.jpg',
 'datasets/roboflow/styrofoam-wfuot/train/styrofoam-86-_jpg.rf.e23b5d33cb1a80d653061b9b15a444f8.jpg',
 'datasets/roboflow/styrofoam-wfuot/train/styrofoam-10-_jpg.rf.2279e8031daccc26ca149839eaba33c9.jpg',
 'datasets/roboflow/styrofoam-wfuot/train/img_-_68_jpeg.rf.d917ba880e8f71377ec6bcbf6ba6a1b5.jpg',
 'datasets/roboflow/styrofoam-wfuot/train/styrofoam-51-_jpg.rf.1d4168ceb81884e16077c4f983c5b2bb.jpg',
 'datasets/roboflow/styrofoam-wfuot/train/img_-_93_jpeg.rf.b3a2f7144af18fb79c2192b

In [46]:
styrofoam_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.OTHER
    )
    for img_path in styrofoam
] 

In [47]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(styrofoam_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)


### ijuden/kelapa-megatron-kupas/v1

In [48]:
kelapa = glob.glob("datasets/roboflow/kelapa-megatron-kupas/*/*.jpg")
kelapa

['datasets/roboflow/kelapa-megatron-kupas/train/Test_95_jpg.rf.5130e97cf6c7ea4944c0a2e8ed71bc0c.jpg',
 'datasets/roboflow/kelapa-megatron-kupas/train/frame_24_jpg.rf.a9c2faf2e06ae78d06382dbf8838cfd3.jpg',
 'datasets/roboflow/kelapa-megatron-kupas/train/Test_120_jpg.rf.5b4e7525fef2afbfc2e0097f0d35e5fa.jpg',
 'datasets/roboflow/kelapa-megatron-kupas/train/39_jpeg.rf.f908ccb9c84175a51431d6a8a54537d9.jpg',
 'datasets/roboflow/kelapa-megatron-kupas/train/6_jpeg.rf.0fc27ad3cddff52ba88b4cfde02f7033.jpg',
 'datasets/roboflow/kelapa-megatron-kupas/train/LINE_ALBUM_-2_-_105_jpg.rf.925adfe85636e54ae04b42cffb58e12b.jpg',
 'datasets/roboflow/kelapa-megatron-kupas/train/35_jpeg.rf.ce0b1e39150e17a280d5bcb435f7560f.jpg',
 'datasets/roboflow/kelapa-megatron-kupas/train/30_jpeg.rf.4ea65f5acbc3f2be0b0aeb645aa9a666.jpg',
 'datasets/roboflow/kelapa-megatron-kupas/train/frame_0_jpg.rf.d5ab5753a38e72b3841505ff107f3cce.jpg',
 'datasets/roboflow/kelapa-megatron-kupas/train/Test_26_jpeg.rf.20ab89d2ab6c5e74cdd94

In [49]:
kelapa_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.OTHER
    )
    for img_path in kelapa
] 

In [50]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(kelapa_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### dataixalab/metal-f7t6c/v1


In [51]:
metal = glob.glob("datasets/roboflow/metal-f7t6c/*/*.jpg")
metal

['datasets/roboflow/metal-f7t6c/train/metal405_jpg.rf.8cb2800d517962ac0386af5319b9d5d0.jpg',
 'datasets/roboflow/metal-f7t6c/train/metal351_jpg.rf.ac2cd9bcb02b1ee40c5eadb34b07feb9.jpg',
 'datasets/roboflow/metal-f7t6c/train/metal1490_jpg.rf.d249024bddfec102d5fe21d7f63015b8.jpg',
 'datasets/roboflow/metal-f7t6c/train/metal195_jpg.rf.c41b58d397e9dee423b8412e33fd5b25.jpg',
 'datasets/roboflow/metal-f7t6c/train/metal284_jpg.rf.e6eac11f4b32223ce71b5bf8563bb8f3.jpg',
 'datasets/roboflow/metal-f7t6c/train/metal1675_jpg.rf.8fe7b93723673134ab9cd41db3311376.jpg',
 'datasets/roboflow/metal-f7t6c/train/metal1407_jpg.rf.8542a579ccdc684b94366337c019ed07.jpg',
 'datasets/roboflow/metal-f7t6c/train/metal36_jpg.rf.8f79c5be5080e3d30f0b688cbf098450.jpg',
 'datasets/roboflow/metal-f7t6c/train/metal577_jpg.rf.a54930c427b91bd837df0a4e852ba33d.jpg',
 'datasets/roboflow/metal-f7t6c/train/metal1783_jpg.rf.6b7efffccacab74a0c7c459189a80db3.jpg',
 'datasets/roboflow/metal-f7t6c/train/metal256_jpg.rf.443daa46e21ef

In [52]:
metal_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.METAL
    )
    for img_path in metal
] 

In [53]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(metal_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### trash-classification-mjez0/plastic-hdpe/v1

In [54]:
hdpe = glob.glob("datasets/roboflow/plastic-hdpe/*/*/*.jpg")
len(hdpe)

549

In [55]:
hdpe_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.RIGID_PLASTIC
    )
    for img_path in hdpe
]

In [56]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(hdpe_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)


### project-swd48/plastic-cups-v7jar/v1


In [57]:
cupsv7jar = glob.glob("datasets/roboflow/plastic-cups-v7jar/*/*.jpg")
cupsv7jar

['datasets/roboflow/plastic-cups-v7jar/train/-_10_jpg.rf.d58ac64500fc95bb3d941d9eb61cff96.jpg',
 'datasets/roboflow/plastic-cups-v7jar/train/-_62_jpg.rf.e6f9c7ade2abe84dad07ca45e2249b02.jpg',
 'datasets/roboflow/plastic-cups-v7jar/train/-_7_jpg.rf.482d171bcce3a1b397824ddaf6a22258.jpg',
 'datasets/roboflow/plastic-cups-v7jar/train/-_88_jpg.rf.c6e4b9a8e199144e1b93f3c3553793f1.jpg',
 'datasets/roboflow/plastic-cups-v7jar/train/-_81_jpg.rf.6e28ada2e02528d54b36ae5b7b183de8.jpg',
 'datasets/roboflow/plastic-cups-v7jar/train/-_82_jpg.rf.8fa8e9049269c2e2e1e6fc8dfff78471.jpg',
 'datasets/roboflow/plastic-cups-v7jar/train/-_24_jpg.rf.3c30c48cea7e229d1d2d0409df11f5a7.jpg',
 'datasets/roboflow/plastic-cups-v7jar/train/-_5_jpg.rf.c81595463b30b0f0ab0d400263feadf0.jpg',
 'datasets/roboflow/plastic-cups-v7jar/train/-_38_jpg.rf.a117834c18686d25c8f798a66db08f03.jpg',
 'datasets/roboflow/plastic-cups-v7jar/train/-_55_jpg.rf.102a40dd7053e25cb2b76108e037b410.jpg',
 'datasets/roboflow/plastic-cups-v7jar/tra

In [58]:
cupsv7jar_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PLASTIC_CUPS
    )
    for img_path in cupsv7jar
]

In [59]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(cupsv7jar_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### cups-iupj5/cups-ctpw3/v1


In [60]:
cups = glob.glob("datasets/roboflow/cups-ctpw3/*/*.jpg")
cups

['datasets/roboflow/cups-ctpw3/train/00001481_jpg.rf.6a04bd5ddfa48cf1e1d74745e0610f43.jpg',
 'datasets/roboflow/cups-ctpw3/train/00001641_jpg.rf.ee03d1606fb66a6b6bb313bb574d7a74.jpg',
 'datasets/roboflow/cups-ctpw3/train/00001117_jpg.rf.5ab294855225913886e864d601979a5f.jpg',
 'datasets/roboflow/cups-ctpw3/train/00001888_jpg.rf.2413646445c951a57851fda1fded0dba.jpg',
 'datasets/roboflow/cups-ctpw3/train/00001754_jpg.rf.b89334aca1326da35b73a973ecab3eb5.jpg',
 'datasets/roboflow/cups-ctpw3/train/00001593_jpg.rf.2bd25d02bcfc00c0eada22d5a01d607d.jpg',
 'datasets/roboflow/cups-ctpw3/train/00001662_jpg.rf.f4f0a2b75752cee0f16c616b925a917b.jpg',
 'datasets/roboflow/cups-ctpw3/train/00001834_jpg.rf.ea8d050c371460eeff5d0b04f42a097c.jpg',
 'datasets/roboflow/cups-ctpw3/train/00001418_jpg.rf.f8a8c0ea6aff458ce42e73ede4fdbbf7.jpg',
 'datasets/roboflow/cups-ctpw3/train/00001934_jpg.rf.1b76079749910f538c6d7fd34e92844b.jpg',
 'datasets/roboflow/cups-ctpw3/train/00001660_jpg.rf.cd5bdc5312a96bce1be5285fca5

In [61]:
cups_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PLASTIC_CUPS
    )
    for img_path in cups
] 

In [62]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(cups_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a",header = False)

### recyclable-sorting-algorithm/plastic-sorting-algorithm/v1


In [63]:
plastic_sorting = glob.glob("datasets/roboflow/plastic-sorting-algorithm/*/*")
plastic_sorting

['datasets/roboflow/plastic-sorting-algorithm/train/HDPE',
 'datasets/roboflow/plastic-sorting-algorithm/train/PET PP PS',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE PET',
 'datasets/roboflow/plastic-sorting-algorithm/train/LDPE PS',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE PP PS',
 'datasets/roboflow/plastic-sorting-algorithm/train/PET PP',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE LDPE PET PP',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE LDPE PET PS',
 'datasets/roboflow/plastic-sorting-algorithm/train/PP PS',
 'datasets/roboflow/plastic-sorting-algorithm/train/PP',
 'datasets/roboflow/plastic-sorting-algorithm/train/LDPE PET',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE LDPE PET',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE PS',
 'datasets/roboflow/plastic-sorting-algorithm/train/LDPE PP',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE PET PP PS',
 'datasets/roboflow/plastic-sorting-algorit

#### HDPE

In [64]:
hdpe_plastic_sorting = glob.glob("datasets/roboflow/plastic-sorting-algorithm/*/HDPE/*")
hdpe_plastic_sorting

['datasets/roboflow/plastic-sorting-algorithm/train/HDPE/IMG_0092_JPG_jpg.rf.d60c668912dfd277a69c062d9a3f6edb.jpg',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE/IMG_1839_JPG_jpg.rf.a8da884d8ce83f78f5479978b015fd13.jpg',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE/43_jpg.rf.342b4a7e7181f1bb2daaa6e02d727057.jpg',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE/IMG_1876_JPG_jpg.rf.9ca393f39cbafec42c66938b32afae65.jpg',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE/IMG_9326_jpg.rf.7acfae5ec10f43fbdd2c488f1a018057.jpg',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE/IMG_0755_Original_jpeg_jpg.rf.e7c45a8cd8ce0d7b1ed5e799b625d35b.jpg',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE/IMG_0066_JPG_jpg.rf.add4bd9e51607f9317d0d22457d1ff92.jpg',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE/IMG_0057_JPG_jpg.rf.8e1ac2fdd949ff61808ca5650b8954d9.jpg',
 'datasets/roboflow/plastic-sorting-algorithm/train/HDPE/IMG_0179_JPG_jpg.rf

In [65]:
hdpe_plastic_sorting_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.RIGID_PLASTIC
    )
    for img_path in hdpe_plastic_sorting
]

In [66]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(hdpe_plastic_sorting_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a",header = False)

### piyush-yadav-gh70a/pvc-pipe-detection/v1


In [67]:
pvc_pipe = glob.glob("datasets/roboflow/pvc-pipe-detection/*/*/*.jpg")
pvc_pipe

['datasets/roboflow/pvc-pipe-detection/train/L/IMG_2962-Custom-_jpeg_jpg.rf.d499e224f0534d835f7746cb0495a258.jpg',
 'datasets/roboflow/pvc-pipe-detection/train/L/IMG_2965-Custom-_jpeg_jpg.rf.0ff78732790f65711b3b038d5ac0b809.jpg',
 'datasets/roboflow/pvc-pipe-detection/train/L/IMG_2900-Custom-_jpeg_jpg.rf.188d69ce055bd3eb6289012af1d98d3a.jpg',
 'datasets/roboflow/pvc-pipe-detection/train/L/IMG_2885-Custom-_jpeg_jpg.rf.c83e23433d2695d8bf885050d26100c6.jpg',
 'datasets/roboflow/pvc-pipe-detection/train/L/IMG_2876-Custom-_jpeg_jpg.rf.f2dd667a3504727349f1b6d48f503db2.jpg',
 'datasets/roboflow/pvc-pipe-detection/train/L/IMG_2892-Custom-_jpeg_jpg.rf.51b8eef8d8ad714871b93d361c040f8e.jpg',
 'datasets/roboflow/pvc-pipe-detection/train/L/IMG_2934-Custom-_jpeg_jpg.rf.82822caea7caf09d29108586bff7bbde.jpg',
 'datasets/roboflow/pvc-pipe-detection/train/L/IMG_2953-Custom-_jpeg_jpg.rf.3c7952fbeb33702a44da73fc6b8f67fd.jpg',
 'datasets/roboflow/pvc-pipe-detection/train/L/IMG_2952-Custom-_jpeg_jpg.rf.0678

In [68]:
pvc_pipe_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.HARD_PLASTIC
    )
    for img_path in pvc_pipe
]

In [69]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(pvc_pipe_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### tiago-rosa/un-pvc/v1


In [70]:
un_pvc_pipe = glob.glob("datasets/roboflow/un-pvc/*/*/*.jpg")
un_pvc_pipe

['datasets/roboflow/un-pvc/train/Uniao 20 pvc/opencv_frame_48_png.rf.c30ca7145615617e27622b0ce34ba598.jpg',
 'datasets/roboflow/un-pvc/train/Uniao 20 pvc/opencv_frame_50_png.rf.47d07954be76a40121c472beddf9765a.jpg',
 'datasets/roboflow/un-pvc/train/Uniao 20 pvc/opencv_frame_49_png.rf.0e37f0d018a667fefd4ec1c14c503280.jpg',
 'datasets/roboflow/un-pvc/train/Uniao 20 pvc/opencv_frame_604_png.rf.cb18cef638168283aafba60a5bc35bdc.jpg',
 'datasets/roboflow/un-pvc/train/Uniao 20 pvc/opencv_frame_37_png.rf.ad72be79e225ef63cd285e140902e4cc.jpg',
 'datasets/roboflow/un-pvc/train/Uniao 20 pvc/opencv_frame_47_png.rf.9b69d6dc29472f653ac4c655b36924ec.jpg',
 'datasets/roboflow/un-pvc/train/Uniao 20 pvc/opencv_frame_603_png.rf.b09868016b249b2ef13438a9bcd36690.jpg',
 'datasets/roboflow/un-pvc/train/Uniao 20 pvc/opencv_frame_47_png.rf.5ecdf2496c6bfee69caec5d5541f16f3.jpg',
 'datasets/roboflow/un-pvc/train/Uniao 20 pvc/opencv_frame_45_png.rf.3171225123de2c837b9eb519a80c7383.jpg',
 'datasets/roboflow/un-pvc

In [71]:
un_pvc_pipe_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.HARD_PLASTIC
    )
    for img_path in pvc_pipe
]

In [72]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(un_pvc_pipe_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### demo-wdd86/od-3vc4m/v1


In [73]:
pvc_od = glob.glob("datasets/roboflow/od-3vc4m/*/*.jpg")
pvc_od

['datasets/roboflow/od-3vc4m/train/90mm-pvc-elbow_jpg.rf.45e3085b3c2b9f52b507090c58ab4d4d.jpg',
 'datasets/roboflow/od-3vc4m/train/R212277-01-1-_webp.rf.aa3f88409076f8da19088ae683983df1.jpg',
 'datasets/roboflow/od-3vc4m/train/pvc-metric-pressure-pipe-tee_1nd_3621_large_jpg.rf.70d444fc307c30a933d6f8e3f1b3e4bb.jpg',
 'datasets/roboflow/od-3vc4m/train/images-27-_jpg.rf.3b0ee10e33e6ba59be24acbc2a09f50e.jpg',
 'datasets/roboflow/od-3vc4m/train/IMG_5827_jpg.rf.1fc48b17ad8897b45d52b806cbba8467.jpg',
 'datasets/roboflow/od-3vc4m/train/IMG_5860_jpg.rf.9c2f513f50babf2163500d19548c5d21.jpg',
 'datasets/roboflow/od-3vc4m/train/IMG_5823_jpg.rf.94d7f22d1693e2219b0046ff24260019.jpg',
 'datasets/roboflow/od-3vc4m/train/s-l1200_jpg.rf.de60696547fe7293937e8ddb6829e916.jpg',
 'datasets/roboflow/od-3vc4m/train/images-52-_jpg.rf.aa61d296bf7617fb1a63899c3ae4ce57.jpg',
 'datasets/roboflow/od-3vc4m/train/IMG_5811_jpg.rf.980208564d3b6ff6f15fb45c51181b83.jpg',
 'datasets/roboflow/od-3vc4m/train/images-32-_jpg.

In [74]:
pvc_od_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.HARD_PLASTIC
    )
    for img_path in pvc_od
]

In [75]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(pvc_od_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### construction-8c2ry/pipe-fittings/v1


In [76]:
pipe_pvc = glob.glob("datasets/roboflow/pipe-fittings/*/*.jpg")
pipe_pvc

['datasets/roboflow/pipe-fittings/train/images_jpg.rf.4ab7dc978cfd49fe4fde5c79d2b27ece.jpg',
 'datasets/roboflow/pipe-fittings/train/formufit-45-elbow-1-2-in-45-degree-furniture-grade-pvc-elbow-fitting-orange-33983650529429_535x_webp.rf.9452c7ace928c716191d4b6a04138bf6.jpg',
 'datasets/roboflow/pipe-fittings/train/images-20-_jpg.rf.5874bc66d38bc831bd485a5f0a1ee03b.jpg',
 'datasets/roboflow/pipe-fittings/train/11d2ebb9d00242ac110003_webp.rf.7bb5d89db2b5000a18fbaac0537c4669.jpg',
 'datasets/roboflow/pipe-fittings/train/images-1-_jpg.rf.bf30421f424618d3b7d994f5d2366a6e.jpg',
 'datasets/roboflow/pipe-fittings/train/51vCE-5PjPL_jpg.rf.4ed72f41c27c5f6ace24278e27f90f0d.jpg',
 'datasets/roboflow/pipe-fittings/train/images-5-_jpg.rf.fcf1341af20502f9429075d4dd2ab6ff.jpg',
 'datasets/roboflow/pipe-fittings/train/6f8af5315f0542a5d3bad2ad2dea7764_jpg.rf.ce577933e5905ca64e62ff548eec3cb3.jpg',
 'datasets/roboflow/pipe-fittings/train/images11_jpg.rf.7746935904b711434eccc4aaa60df743.jpg',
 'datasets/ro

In [77]:
pipe_pvc_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.HARD_PLASTIC
    )
    for img_path in pipe_pvc
]

In [78]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(pipe_pvc_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### sumeyye-mo9wj/paper-7qwal/v1


In [79]:
paper_qwal = glob.glob("datasets/roboflow/paper-7qwal/*/*/*.jpg")
paper_qwal

['datasets/roboflow/paper-7qwal/train/paper/paprrr-1899-_jpg.rf.a9aad5e9908fc56a780b3149fb0b74e5.jpg',
 'datasets/roboflow/paper-7qwal/train/paper/paprrr-2142-_jpg.rf.72ebf14a0b9f9776abdffcaee4cd9123.jpg',
 'datasets/roboflow/paper-7qwal/train/paper/paprrr-1610-_jpg.rf.eaa39476c1048ad6ec073cfbf1902387.jpg',
 'datasets/roboflow/paper-7qwal/train/paper/paprrr-2531-_jpg.rf.b59b9efc24c9dfd0e69e2a6aadf064dd.jpg',
 'datasets/roboflow/paper-7qwal/train/paper/paprrr-2678-_jpg.rf.1f73c1f809930fa21643a566df195bce.jpg',
 'datasets/roboflow/paper-7qwal/train/paper/paper60_jpg.rf.5dd352092ddb2cd26adc79598dc947a0.jpg',
 'datasets/roboflow/paper-7qwal/train/paper/paprrr-975-_jpg.rf.78119523c5ef74c70deb44cb5606c977.jpg',
 'datasets/roboflow/paper-7qwal/train/paper/paper498_jpg.rf.d932d159222d7a010ffc0ae04e578178.jpg',
 'datasets/roboflow/paper-7qwal/train/paper/paper236_jpg.rf.c0c2f9765a047aeacfaf636f1e0b1292.jpg',
 'datasets/roboflow/paper-7qwal/train/paper/paprrr-1488-_jpg.rf.938a033b8dfa33ea669ae0c

In [80]:
paper_qwal_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PAPER
    )
    for img_path in paper_qwal
]

In [81]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(paper_qwal_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### rijah-yrbls/paper-d2z5n/v1


In [82]:
paper_d2z5n = glob.glob("datasets/roboflow/paper-d2z5n/*/*/*.jpg")
paper_d2z5n

['datasets/roboflow/paper-d2z5n/train/Paper/27-Old-Newspaper--252F-Newsprint--ONP--Waste-Paper_jpg.rf.a275526f00eab373edacbf0cfbd50fba.jpg',
 'datasets/roboflow/paper-d2z5n/train/Paper/48-800px_COLOURBOX9472010_jpg.rf.4307f345ed8a33e5c3656bcfed72b5f4.jpg',
 'datasets/roboflow/paper-d2z5n/train/Paper/32-brown-crumpled-paper-bag-15430581_jpg.rf.de7dc5a560053161821ba827e997bd6a.jpg',
 'datasets/roboflow/paper-d2z5n/train/Paper/20-an-old-crumpled-and-torn-newspaper-for-a-background-D7AAD2_jpg.rf.caf751d0d68e7d61d115398971ca9bcf.jpg',
 'datasets/roboflow/paper-d2z5n/train/Paper/10-crumpled-paper-bag-20286848_jpg.rf.bf9cd05a4b067d05f0b6bbc4be9be588.jpg',
 'datasets/roboflow/paper-d2z5n/train/Paper/61-crumpled_newspaper-200x186_jpg.rf.e24f8032e5844e8daf061bc1a984c83d.jpg',
 'datasets/roboflow/paper-d2z5n/train/Paper/16-paper-trash-12457899_jpg.rf.e082727d22fea186220d77f59bf8e778.jpg',
 'datasets/roboflow/paper-d2z5n/train/Paper/76-maxresdefault_jpg.rf.22ef4e61b180466f6e0ed9f63441d897.jpg',
 '

In [83]:
paper_d2z5n_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PAPER
    )
    for img_path in paper_d2z5n
]

In [84]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(paper_d2z5n_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### trash-classification-mjez0/paper-1/v2


In [85]:
paper_mjez0 = glob.glob("datasets/roboflow/paper-1/*/*/*.jpg")
paper_mjez0

['datasets/roboflow/paper-1/train/paper/paper37_jpg.rf.8649f9a8624e3f474da3b08ced27d3b8.jpg',
 'datasets/roboflow/paper-1/train/paper/paper524_jpg.rf.4e024f9925fc9c4490fc9b5f1e03b7be.jpg',
 'datasets/roboflow/paper-1/train/paper/paper130_jpg.rf.5d34a8b0df3213871f7f26f3a103233a.jpg',
 'datasets/roboflow/paper-1/train/paper/paper506_jpg.rf.879f4218076a62200d4e4ee7834c35d1.jpg',
 'datasets/roboflow/paper-1/train/paper/paper307_jpg.rf.21f4fcbaf62ce3b1db693f79f7bed7ea.jpg',
 'datasets/roboflow/paper-1/train/paper/paper214_jpg.rf.20cdb9fc2ebc46b94a8a5532ff6e2186.jpg',
 'datasets/roboflow/paper-1/train/paper/paper141_jpg.rf.0c49041cbe859da16bdc867fd75a83c3.jpg',
 'datasets/roboflow/paper-1/train/paper/paper207_jpg.rf.3ff784e7a1da1e614defb4087859d27d.jpg',
 'datasets/roboflow/paper-1/train/paper/paper532_jpg.rf.4416b206350e99b313384358fc241dfc.jpg',
 'datasets/roboflow/paper-1/train/paper/paper246_jpg.rf.9228c145db99578e958553d01462bf41.jpg',
 'datasets/roboflow/paper-1/train/paper/paper205_jp

In [86]:
paper_mjez0_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PAPER
    )
    for img_path in paper_mjez0
]

In [87]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(paper_mjez0_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### color-qltok/pet-bottle-9xet7/v1


In [88]:
bottle_pet_9xet7 = glob.glob("datasets/roboflow/pet-bottle-9xet7/*/PET_bottle/*.jpg")
bottle_pet_9xet7

['datasets/roboflow/pet-bottle-9xet7/train/PET_bottle/PET_009_5862_0_jpg.rf.d6665c4fe6d6fa59df3ed3adc552b5e8.jpg',
 'datasets/roboflow/pet-bottle-9xet7/train/PET_bottle/PET_002_1376_2_jpg.rf.ca460722f5a433b4987da00f68644fd7.jpg',
 'datasets/roboflow/pet-bottle-9xet7/train/PET_bottle/PET_015_4847_1_jpg.rf.8cf7b7202c85d243f31ea9a2d5ef7b1d.jpg',
 'datasets/roboflow/pet-bottle-9xet7/train/PET_bottle/PET_007_1484_1_jpg.rf.e00ae3514fc1075a84bbefd7f2057e75.jpg',
 'datasets/roboflow/pet-bottle-9xet7/train/PET_bottle/PET_015_118_2_jpg.rf.0fef5302fffe363001129edaec6aabc8.jpg',
 'datasets/roboflow/pet-bottle-9xet7/train/PET_bottle/PET_011_4290_1_jpg.rf.fc17331122c9db25ae95c309608e3e3c.jpg',
 'datasets/roboflow/pet-bottle-9xet7/train/PET_bottle/PET_001_2584_1_jpg.rf.dcdbef84f04cecf9338b75ecfc6fd012.jpg',
 'datasets/roboflow/pet-bottle-9xet7/train/PET_bottle/PET_003_4841_0_jpg.rf.7a6bed75e0ed891db6f834093aae76a2.jpg',
 'datasets/roboflow/pet-bottle-9xet7/train/PET_bottle/PET_005_3942_1_jpg.rf.3e2ce

In [89]:
bottle_pet_9xet7_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PET
    )
    for img_path in bottle_pet_9xet7
]

In [90]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(bottle_pet_9xet7_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### computer-vision-ewm5r/botol-pjepi/v4


In [91]:
bottle_pjepi_label = glob.glob("datasets/roboflow/botol-pjepi/*/*")
bottle_pjepi_label

['datasets/roboflow/botol-pjepi/train/HDPE',
 'datasets/roboflow/botol-pjepi/train/PET',
 'datasets/roboflow/botol-pjepi/test/HDPE',
 'datasets/roboflow/botol-pjepi/test/PET',
 'datasets/roboflow/botol-pjepi/valid/HDPE',
 'datasets/roboflow/botol-pjepi/valid/PET']

In [92]:
bottle_pjepi_hdpe = glob.glob("datasets/roboflow/botol-pjepi/*/HDPE/*.jpg")
bottle_pjepi_hdpe

['datasets/roboflow/botol-pjepi/train/HDPE/hdpe059_jpg.rf.85b0b78bebc5961f4f1249f6b018c1dd.jpg',
 'datasets/roboflow/botol-pjepi/train/HDPE/hdpe008_jpg.rf.fe5f2cf48b6e414da9237dc2f99bf4c9.jpg',
 'datasets/roboflow/botol-pjepi/train/HDPE/hdpe078_jpg.rf.e504e8ef2298aed286d1faf1fa8e59e1.jpg',
 'datasets/roboflow/botol-pjepi/train/HDPE/pet003_jpg.rf.d9dd40cb4bbe887c1226ffe2ee741699.jpg',
 'datasets/roboflow/botol-pjepi/train/HDPE/hdpe027_jpg.rf.8e9f112d3097065f507b7f84a838144f.jpg',
 'datasets/roboflow/botol-pjepi/train/HDPE/hdpe040_jpg.rf.2292579ca5baa3e762a0b7f19402ad89.jpg',
 'datasets/roboflow/botol-pjepi/train/HDPE/hdpe082_jpg.rf.afcfd4c446a1a7ce56e87fac3c3d1eb1.jpg',
 'datasets/roboflow/botol-pjepi/train/HDPE/hdpe049_jpg.rf.2fe2560cf95f7aceb0c8561cb5dea835.jpg',
 'datasets/roboflow/botol-pjepi/train/HDPE/hdpe043_jpg.rf.afca62295e89152a73e89e86a55bda54.jpg',
 'datasets/roboflow/botol-pjepi/train/HDPE/hdpe054_jpg.rf.174fa347e9688eef6bb10278cacf9f33.jpg',
 'datasets/roboflow/botol-pjepi

In [93]:
bottle_pjepi_hdpe_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.RIGID_PLASTIC
    )
    for img_path in bottle_pjepi_hdpe
]

In [94]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(bottle_pjepi_hdpe_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

In [95]:
bottle_pjepi_PET = glob.glob("datasets/roboflow/botol-pjepi/*/PET/*jpg")
bottle_pjepi_PET

['datasets/roboflow/botol-pjepi/train/PET/pet014_jpg.rf.b06c269cbf0adbb46e8cc87029c60d34.jpg',
 'datasets/roboflow/botol-pjepi/train/PET/pet054_jpg.rf.07c0fccc610c65a6daee705a6d85886a.jpg',
 'datasets/roboflow/botol-pjepi/train/PET/pet045_jpg.rf.d77fc23733f3a380d055aa3dba68a010.jpg',
 'datasets/roboflow/botol-pjepi/train/PET/pet040_jpg.rf.e62e1659fabfb639a979afaff88ee0c9.jpg',
 'datasets/roboflow/botol-pjepi/train/PET/pet017_jpg.rf.1213a238b07a516dfb26dc32b7b88566.jpg',
 'datasets/roboflow/botol-pjepi/train/PET/pet040_jpg.rf.47f2dad390e16b2695b95e824b55ff22.jpg',
 'datasets/roboflow/botol-pjepi/train/PET/pet064_jpg.rf.16ab38d6cb228336b13a289541220bf2.jpg',
 'datasets/roboflow/botol-pjepi/train/PET/pet012_jpg.rf.b0ef4d270f0d4789d6e167766ba2718c.jpg',
 'datasets/roboflow/botol-pjepi/train/PET/pet074_jpg.rf.4f96f222b85da1f4de9572ebc4fbe668.jpg',
 'datasets/roboflow/botol-pjepi/train/PET/pet069_jpg.rf.8165a686682b2d8ebec091f094840695.jpg',
 'datasets/roboflow/botol-pjepi/train/PET/pet043_j

In [96]:
bottle_pjepi_PET_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PET
    )
    for img_path in bottle_pjepi_PET
]

In [97]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(bottle_pjepi_PET_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### university-d2l2p/tetrapak-xczol/v2


In [98]:
tetrapak_xczol = glob.glob("datasets/roboflow/tetrapak-xczol/*/*.jpg")
tetrapak_xczol

['datasets/roboflow/tetrapak-xczol/train/cm21_jpg.rf.b98ed314bbca9e21dbdc9a0c11a22a9f.jpg',
 'datasets/roboflow/tetrapak-xczol/train/57-_jpg.rf.660687daf28857384d1bb97a50aa8340.jpg',
 'datasets/roboflow/tetrapak-xczol/train/71-_jpg.rf.0c4d25272049ceecbd59acfdd51d4c8a.jpg',
 'datasets/roboflow/tetrapak-xczol/train/th_true-69-_jpg.rf.c5fdef439ef4bd437684fca89f87cf5b.jpg',
 'datasets/roboflow/tetrapak-xczol/train/cart-30-_jpg.rf.6bbd934668694a8f1611398e5dbb921f.jpg',
 'datasets/roboflow/tetrapak-xczol/train/vfresh-16-_jpeg_jpg.rf.cbf7f53c730ad26b5357879b432bd779.jpg',
 'datasets/roboflow/tetrapak-xczol/train/Ufb0553d285814e78b71306c9ccc56642g_png_jpg.rf.7b80c7bd07660cbf215c06e4a3c79ea2.jpg',
 'datasets/roboflow/tetrapak-xczol/train/vina-14-_jpeg_jpg.rf.60cfa17f0769dd178403f88eb3492efb.jpg',
 'datasets/roboflow/tetrapak-xczol/train/cart-117-_jpg.rf.fc2026ac7295b4b0a70b9caa03c0cdda.jpg',
 'datasets/roboflow/tetrapak-xczol/train/vina-64-_jpg.rf.9bc15185a6c1fe67cbeeca6eb33aef7c.jpg',
 'datase

In [99]:
tetrapak_xczol_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.OTHER
    )
    for img_path in tetrapak_xczol
]

In [100]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(tetrapak_xczol_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### project-space-12/egg-tray-count/v1


In [101]:
egg_tray_count = glob.glob("datasets/roboflow/egg-tray-count/*/*.jpg")
egg_tray_count

['datasets/roboflow/egg-tray-count/train/images97_jpg.rf.06ba8bdadb172a738e53e164635fc445.jpg',
 'datasets/roboflow/egg-tray-count/train/images55_jpg.rf.9d8726909525f99fe8ac3cf61b21387c.jpg',
 'datasets/roboflow/egg-tray-count/train/images61_jpg.rf.26ad2d37004f1e495d1c036227e3d01d.jpg',
 'datasets/roboflow/egg-tray-count/train/images84_jpg.rf.9e963d8ef944c488b5219251e932766d.jpg',
 'datasets/roboflow/egg-tray-count/train/images24_jpg.rf.163e0a50dca7191856614c010cbb312e.jpg',
 'datasets/roboflow/egg-tray-count/train/images109_jpg.rf.b0b5d104cdae6946037b00d744cb687c.jpg',
 'datasets/roboflow/egg-tray-count/train/images19_jpg.rf.c6a2568ee70808018a41a22b23b4b099.jpg',
 'datasets/roboflow/egg-tray-count/train/download-29_jpg.rf.3a6af802b1543f5596ce8d1c3ccc2114.jpg',
 'datasets/roboflow/egg-tray-count/train/images43_jpg.rf.89a5f909463fc6d6e96d733f22e5271e.jpg',
 'datasets/roboflow/egg-tray-count/train/download33_jpg.rf.051ae90f6064544ee6a6ff3053aeb372.jpg',
 'datasets/roboflow/egg-tray-count

In [102]:
egg_tray_count_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.OTHER
    )
    for img_path in egg_tray_count
]

In [103]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(egg_tray_count_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### work3-dqzz5/bottle-cap-y6pzg/v1


In [104]:
bottle_cap = glob.glob("datasets/roboflow/bottle-cap-y6pzg/*/*")


In [105]:
bottle_cap_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.RIGID_PLASTIC
    )
    for img_path in bottle_cap[:100]
]

In [106]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(bottle_cap_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### kabies-sickkk/svm-plastic-and-metal/v2


In [107]:
plastic_and_metal =  glob.glob("datasets/roboflow/svm-plastic-and-metal/*/*")
plastic_and_metal

['datasets/roboflow/svm-plastic-and-metal/train/metal',
 'datasets/roboflow/svm-plastic-and-metal/train/plastic',
 'datasets/roboflow/svm-plastic-and-metal/test/metal',
 'datasets/roboflow/svm-plastic-and-metal/test/plastic']

#### Plastic PET

In [108]:
plastic_and_metal_plastic = glob.glob("datasets/roboflow/svm-plastic-and-metal/*/plastic/*.jpg")
plastic_and_metal_plastic

['datasets/roboflow/svm-plastic-and-metal/train/plastic/plastic1591_jpg.rf.dc045384f5d6ccf545bf362ef515b729.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/plastic/plastic1383_jpg.rf.b61eb7c06072eeecb9e5e9cc028a446b.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/plastic/plastic1344_jpg.rf.b540c6d4a1121e077258a81b595feff0.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/plastic/plastic942_jpg.rf.1d3fd7ba98b66acfa1e678a4d115a7d6.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/plastic/plastic272_jpg.rf.1e9b6459e59acfd2bd74cccccfd9b2c4.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/plastic/plastic488_jpg.rf.64cd40b64ef2cb1e7b1d8bee579ec874.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/plastic/plastic871_jpg.rf.3b68e92d0d4efde1d083c054e471f2c9.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/plastic/plastic1684_jpg.rf.69d3affc9fbc3cc333f8b88557e29874.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/plastic/plastic459_jpg.rf.506cead3e3276def08

In [109]:
plastic_and_metal_plastic_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PET
    )
    for img_path in plastic_and_metal_plastic
]

In [110]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(plastic_and_metal_plastic_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

#### Metal

In [111]:
plastic_and_metal_metal = glob.glob("datasets/roboflow/svm-plastic-and-metal/*/metal/*.jpg")
plastic_and_metal_metal

['datasets/roboflow/svm-plastic-and-metal/train/metal/metal1549_jpg.rf.e4f0af25d50efc605ea4936af26ed4e5.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/metal/metal1319_jpg.rf.5d656b9617a711065804b4d6cc6bcccb.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/metal/metal710_jpg.rf.e7875fa9b3279aac661e91e1eb23298a.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/metal/metal870_jpg.rf.3009def8bcbf935807c2f9e4922f38ea.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/metal/metal442_jpg.rf.a2e61465b947c12743de0400032bdfc3.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/metal/metal1913_jpg.rf.8c0b7b5174b7a466cf1889d7dbe94b5a.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/metal/metal41_jpg.rf.30f37d299d9750843d4931e8b887f0de.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/metal/metal1270_jpg.rf.f7a669911cc4dfb090c6038c8a74ebef.jpg',
 'datasets/roboflow/svm-plastic-and-metal/train/metal/metal1273_jpg.rf.dba05593f339917fff91dded54326aad.jpg',
 'datasets/robo

In [112]:
plastic_and_metal_metal_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.METAL
    )
    for img_path in plastic_and_metal_metal
]

In [113]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(plastic_and_metal_metal_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### tgmt-wgnd8/metal-ipkdz/v1


In [114]:
metal_ipkdz = glob.glob("datasets/roboflow/metal-ipkdz/*/*.jpg")
metal_ipkdz

['datasets/roboflow/metal-ipkdz/train/metal253_jpg.rf.3474ad91be4f0ef5fb86b836d15eb4b0.jpg',
 'datasets/roboflow/metal-ipkdz/train/metal346_jpg.rf.ae4c5a2975e5c648c55e4613413052ad.jpg',
 'datasets/roboflow/metal-ipkdz/train/163_metal_jpg.rf.a2c199457573ca562a6e6c0b8606a64e.jpg',
 'datasets/roboflow/metal-ipkdz/train/259_metal_jpg.rf.e355400383b01e8fc8193d30c81920bb.jpg',
 'datasets/roboflow/metal-ipkdz/train/metal226_jpg.rf.e8b0c5e56ee13dd571de7ec6d9399b57.jpg',
 'datasets/roboflow/metal-ipkdz/train/metal260_jpg.rf.f1844390e187afcba171f312881e1078.jpg',
 'datasets/roboflow/metal-ipkdz/train/metal206_jpg.rf.8f1f157b8c2c25fe9e1c1d3243a9de07.jpg',
 'datasets/roboflow/metal-ipkdz/train/255_metal_jpg.rf.3ea2e8ccf9e3bae134192544e912dc15.jpg',
 'datasets/roboflow/metal-ipkdz/train/metal236_jpg.rf.c0b0e15b5ce6cbf8e380ac0078ea88e1.jpg',
 'datasets/roboflow/metal-ipkdz/train/165_metal_jpg.rf.d013a597acc3f216b3cbf709bb3449aa.jpg',
 'datasets/roboflow/metal-ipkdz/train/190_metal_jpg.rf.77be21f496c

In [115]:
metal_ipkdz_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.METAL
    )
    for img_path in metal_ipkdz
]

In [116]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(metal_ipkdz_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### talovtask/plastic-bag-tlche/v1


In [117]:
plastic_bag_tlche = glob.glob("datasets/roboflow/plastic-bag-tlche/*/*.jpg")
plastic_bag_tlche

['datasets/roboflow/plastic-bag-tlche/train/plastic_bag_6_jpg.rf.e8191fa80207a96196b2e42c31b8e352.jpg',
 'datasets/roboflow/plastic-bag-tlche/train/plastic_bag_135_jpg.rf.7710021e9eed2d4e214ee59b1bea8144.jpg',
 'datasets/roboflow/plastic-bag-tlche/train/plastic_bag_66_jpg.rf.6509ede3d1036c146594e55c808ec3bf.jpg',
 'datasets/roboflow/plastic-bag-tlche/train/plastic_bag_199_jpg.rf.95a9a9e2400308d3c6210ec4c0fa9589.jpg',
 'datasets/roboflow/plastic-bag-tlche/train/plastic_bag_150_jpg.rf.44e3cfcb0107ef1c5aa1553cf524cb55.jpg',
 'datasets/roboflow/plastic-bag-tlche/train/plastic_bag_42_jpg.rf.01dd829ae7af5a53a56fbcb0daff0476.jpg',
 'datasets/roboflow/plastic-bag-tlche/train/plastic_bag_49_jpg.rf.7434b9809084654dd23483b17ae6d518.jpg',
 'datasets/roboflow/plastic-bag-tlche/train/plastic_bag_176_jpg.rf.13949f611604ebf43f35f5793a8dde0b.jpg',
 'datasets/roboflow/plastic-bag-tlche/train/plastic_bag_9_jpg.rf.8943ad44cad030d618b0cf70c5876342.jpg',
 'datasets/roboflow/plastic-bag-tlche/train/plastic_b

In [118]:
plastic_bag_tlche_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.FLEXIBLE_PLASTIC
    )
    for img_path in plastic_bag_tlche
]

In [119]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(plastic_bag_tlche_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### new-workspace-slpmv/bag-qe348/v4

In [120]:
bag_qe348 = glob.glob("datasets/roboflow/bag-qe348/*/*.jpg")
bag_qe348

['datasets/roboflow/bag-qe348/train/60_jpg.rf.dbd8a23ca597024542388e1e70e73f66.jpg',
 'datasets/roboflow/bag-qe348/train/129_jpg.rf.8de91f80b58d02e490b6b8a278d681a3.jpg',
 'datasets/roboflow/bag-qe348/train/26_png.rf.19d06fa9a3bc770cf1a7325ec40aed12.jpg',
 'datasets/roboflow/bag-qe348/train/32_jpg.rf.2513aa713eaf9fc14036c348e1dae3ab.jpg',
 'datasets/roboflow/bag-qe348/train/25_jpeg.rf.6f03aae2b0933b82eb5a537beb8908b6.jpg',
 'datasets/roboflow/bag-qe348/train/16_jpg.rf.433ec2f378f1b6189ee762f1475e8d09.jpg',
 'datasets/roboflow/bag-qe348/train/144_jpg.rf.4e8555c94bb06fb2808f1bf9eba25416.jpg',
 'datasets/roboflow/bag-qe348/train/49_jpg.rf.62c42b5c29a9315a38ec87b0f91a3655.jpg',
 'datasets/roboflow/bag-qe348/train/42_jpeg.rf.ad8e4fae1302427bd863b1e37260508b.jpg',
 'datasets/roboflow/bag-qe348/train/62_jpg.rf.cb37de8919eeb2b9d00054089dbea1cc.jpg',
 'datasets/roboflow/bag-qe348/train/30_jpg.rf.54494f92075c17040089a9d969622664.jpg',
 'datasets/roboflow/bag-qe348/train/50_jpg.rf.cc20f9380f29849

In [121]:
bag_qe348_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.FLEXIBLE_PLASTIC
    )
    for img_path in bag_qe348
]

In [122]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(bag_qe348_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### testee-rv5vr/metal-zn5s0/v1


In [123]:
metal_zn5s0 = glob.glob("datasets/roboflow/metal-zn5s0/*/*.jpg")
metal_zn5s0

['datasets/roboflow/metal-zn5s0/train/metal-2079-_jpg.rf.245f1ca0121f779cfd8cf8cc3fd85050.jpg',
 'datasets/roboflow/metal-zn5s0/train/metal-1778-_jpg.rf.3b73396a45831b541294ef441127deab.jpg',
 'datasets/roboflow/metal-zn5s0/train/metal-1255-_jpg.rf.21633955754b0918a4f09b87afda29ac.jpg',
 'datasets/roboflow/metal-zn5s0/train/metal-1723-_jpg.rf.88a54a6cc9e2904b1a0b696ccfc6bb50.jpg',
 'datasets/roboflow/metal-zn5s0/train/metal-2008-_jpg.rf.b2ec69c658d8b897fe7c400aeff4d951.jpg',
 'datasets/roboflow/metal-zn5s0/train/metal-1414-_jpg.rf.78f100ee8f42af40e769809e25b07593.jpg',
 'datasets/roboflow/metal-zn5s0/train/metal-1991-_jpg.rf.1a0aee47167328ea5c096e398bc522d7.jpg',
 'datasets/roboflow/metal-zn5s0/train/metal-1819-_jpg.rf.6e177db8036581e59896642bbabf643f.jpg',
 'datasets/roboflow/metal-zn5s0/train/metal-2004-_jpg.rf.f68c73793a6deb58308d00618b31bbf8.jpg',
 'datasets/roboflow/metal-zn5s0/train/metal-1862-_jpg.rf.e2dac433b2598b8421705e337640573a.jpg',
 'datasets/roboflow/metal-zn5s0/train/me

In [124]:
metal_zn5s0_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.METAL
    )
    for img_path in metal_zn5s0
]

In [125]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(metal_zn5s0_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### minhthong/glass-model/v2


In [126]:
glass_minh = glob.glob("datasets/roboflow/glass-model/*/*.jpg")
glass_minh

['datasets/roboflow/glass-model/train/glass498_jpg.rf.c508f057cfd5a7144876b4b121d54c43.jpg',
 'datasets/roboflow/glass-model/train/glass-245_jpg.rf.2f974e9e520d327034aadd5aa9906ab5.jpg',
 'datasets/roboflow/glass-model/train/R_5110_jpg.rf.f1b8a76bce16ca7e19647987177cb833.jpg',
 'datasets/roboflow/glass-model/train/R_5244_jpg.rf.6a8f2c414abbbbae67508efaaa00add2.jpg',
 'datasets/roboflow/glass-model/train/glass417_jpg.rf.c244c33753d303eb94ad9c26884a81bf.jpg',
 'datasets/roboflow/glass-model/train/glass128_jpg.rf.25dcd6704873007d0c768f52c34d1359.jpg',
 'datasets/roboflow/glass-model/train/Cup_Glass141_jpg.rf.bcbb6ca802c52299d61300ba8c47ee2a.jpg',
 'datasets/roboflow/glass-model/train/glass-462_jpg.rf.8d0e462f6dc11f43d144b658d1cf49ba.jpg',
 'datasets/roboflow/glass-model/train/Cup_Glass356_jpg.rf.595774340da117027157872612ab935c.jpg',
 'datasets/roboflow/glass-model/train/Cup_Glass019_jpg.rf.a7c1faab87132346bf10719aec739f4d.jpg',
 'datasets/roboflow/glass-model/train/R_5098_jpg.rf.5fcc23c0

In [127]:
glass_minh_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.GLASS
    )
    for img_path in glass_minh
]

In [128]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(glass_minh_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### project-qynru/glass-fc9h7/v1

In [129]:
glass_qynru = glob.glob("datasets/roboflow/glass-fc9h7/*/*.jpg")
glass_qynru

['datasets/roboflow/glass-fc9h7/train/R_5088_jpg.rf.34d58d5057b57056f487c740f2121d02.jpg',
 'datasets/roboflow/glass-fc9h7/train/Cup_Glass359_jpg.rf.cc72f944deeb5e074bc586cdffc8d370.jpg',
 'datasets/roboflow/glass-fc9h7/train/glass-64_jpg.rf.56256fcef408e52c82b85ecf2d9f4b86.jpg',
 'datasets/roboflow/glass-fc9h7/train/glass102_jpg.rf.3bae2b4faf6d39e3463f053d7303cfab.jpg',
 'datasets/roboflow/glass-fc9h7/train/R_5076_jpg.rf.73ad957d8d2511ff3fbe567ea35516ef.jpg',
 'datasets/roboflow/glass-fc9h7/train/R_5244_jpg.rf.acc07dd5722d7ecf851162da8da1e0b1.jpg',
 'datasets/roboflow/glass-fc9h7/train/glass-382_jpg.rf.43ef765ba04102b9bca3d1868af73f49.jpg',
 'datasets/roboflow/glass-fc9h7/train/glass315_jpg.rf.8d87ebd19226e2a643986b6cd94b58d6.jpg',
 'datasets/roboflow/glass-fc9h7/train/Cup_Glass048_jpg.rf.8098ebabed909094990153fccb3b41c7.jpg',
 'datasets/roboflow/glass-fc9h7/train/R_5221_jpg.rf.31756a8b820a0082c0d48e1c9e33e549.jpg',
 'datasets/roboflow/glass-fc9h7/train/R_5165_jpg.rf.795ab93a2950d7d1f

In [130]:
glass_qynru_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.GLASS
    )
    for img_path in glass_qynru
]

In [131]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(glass_qynru_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### hana-ygz4l/tri-des-dechets-hdpe/v1


In [132]:
tri_hdpe = glob.glob("datasets/roboflow/tri-des-dechets-hdpe/*/*.jpg")
tri_hdpe

['datasets/roboflow/tri-des-dechets-hdpe/train/img_hdpe-1008_jpg.rf.f243b72f3c8f0eb27fc17a63bb702e51.jpg',
 'datasets/roboflow/tri-des-dechets-hdpe/train/img_hdpe-1217_jpg.rf.9d0fce7cefe7002f8fb3715e5f05b261.jpg',
 'datasets/roboflow/tri-des-dechets-hdpe/train/img_hdpe-1035_jpg.rf.582b0e1c4fd94422b2093a486545cbdb.jpg',
 'datasets/roboflow/tri-des-dechets-hdpe/train/img_hdpe-1421_jpg.rf.34c693b02cda989e01c7c44bd6a25cb3.jpg',
 'datasets/roboflow/tri-des-dechets-hdpe/train/img_hdpe-1088_jpg.rf.32004406ac3f88aeec55258cf3a02720.jpg',
 'datasets/roboflow/tri-des-dechets-hdpe/train/img_hdpe-1409_jpg.rf.590a3c80d899f82200b66d2423c0762b.jpg',
 'datasets/roboflow/tri-des-dechets-hdpe/train/img_hdpe-1037_jpg.rf.9382e2aa74ffbd82c8d4506e15a59571.jpg',
 'datasets/roboflow/tri-des-dechets-hdpe/train/img_hdpe-1213_jpg.rf.d1b440b5950631cb719dca8e3f0d40d7.jpg',
 'datasets/roboflow/tri-des-dechets-hdpe/train/img_hdpe-1031_jpg.rf.4c2312db7d5515ef8c1b4eaf9cc4265d.jpg',
 'datasets/roboflow/tri-des-dechets-h

In [133]:
tri_hdpe_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.RIGID_PLASTIC
    )
    for img_path in tri_hdpe
]

In [134]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(tri_hdpe_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### nararit/classification-pet-hdpe/v1

In [135]:
pet_hdpe = glob.glob("datasets/roboflow/classification-pet-hdpe/*/*")
pet_hdpe

['datasets/roboflow/classification-pet-hdpe/train/HDPE',
 'datasets/roboflow/classification-pet-hdpe/train/PET',
 'datasets/roboflow/classification-pet-hdpe/test/HDPE',
 'datasets/roboflow/classification-pet-hdpe/test/PET',
 'datasets/roboflow/classification-pet-hdpe/valid/HDPE',
 'datasets/roboflow/classification-pet-hdpe/valid/PET']

#### PET

In [136]:
pet_hdpe_pet = glob.glob("datasets/roboflow/classification-pet-hdpe/*/PET/*.jpg")
pet_hdpe_pet

['datasets/roboflow/classification-pet-hdpe/train/PET/2_jpg.rf.eb142b96d5261273c7d49098e06996a3.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/PET/plastic276_jpg.rf.4d6ca089d8b63dfe81a5802a6121978b.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/PET/KakaoTalk_20231012_150047523_13_jpg.rf.a26c4ec683dc32995d023541c0d3aa45.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/PET/-164_jpg.rf.d189bf3ff03d0fac095da8db133d1548.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/PET/PET373_jpg.rf.e27df34598390d1b012a18fbbcdead27.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/PET/500051_jpg.rf.129803ff870877d8339a5191d9f77b33.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/PET/02_03_2020_14_47_06_jpeg_jpg.rf.7dbd61eed6f9a4ba84e4b397efb77743.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/PET/scene00172_png_jpg.rf.837022ab4366bb21255dbbbc34bf0f5e.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/PET/KakaoTalk_20230423_132331531_11_jpg.rf.045

In [137]:
pet_hdpe_pet_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.PET
    )
    for img_path in pet_hdpe_pet
]

In [138]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(pet_hdpe_pet_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

#### HDPE

In [139]:
pet_hdpe_hdpe = glob.glob("datasets/roboflow/classification-pet-hdpe/*/HDPE/*.jpg")
pet_hdpe_hdpe

['datasets/roboflow/classification-pet-hdpe/train/HDPE/IMG_0759_Original_jpeg_jpg.rf.5878a1d5201762cf556a987acc9bfe05.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/HDPE/IMG_0106_JPG_jpg.rf.bb7342b1188b57b193dea7ba9c4ba6fa.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/HDPE/IMG_0741_Original_jpeg_jpg.rf.2483fd0f74f7339a102777e7bd800fd1.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/HDPE/Doge1_jpg.rf.6adacd7eabcd3ebd142be08bb802e522.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/HDPE/IMG_1886_JPG_jpg.rf.4b50ce69ca9f1e352a4d5b46fc8aa89e.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/HDPE/IMG_1929_JPG_jpg.rf.803e89256517b6212a4d8ac608c44156.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/HDPE/IMG_0084_JPG_jpg.rf.f39cab24539a84fec1531c66c68951dc.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/HDPE/IMG_0143_JPG_jpg.rf.1b563c582fd017282b88067c48ec8235.jpg',
 'datasets/roboflow/classification-pet-hdpe/train/HDPE/IMG_0768_Original_jp

In [140]:
pet_hdpe_hdpe_data = [
    Dataset(
        path=img_path,
        target=WasteLabel.RIGID_PLASTIC
    )
    for img_path in pet_hdpe_hdpe
]

In [141]:
pd.DataFrame(TypeAdapter(list[Dataset]).dump_python(pet_hdpe_hdpe_data)).to_csv(OUTPUT_FOLDER, index=False, mode="a", header = False)

### All Data

In [142]:
df = pd.read_csv("datasetv2.csv")

In [143]:
df['target'].value_counts()

target
Plastic Cups        16096
Flexible Plastic    10680
Paper               10235
Metal                5850
Glass                5077
Rigid Plastic        4951
Other                3977
PET                  3967
Hard Plastic         2918
Name: count, dtype: int64