In [None]:
# Attach Google Drive to the Colab VM so the archives and model weights
# stored there are reachable under /content/drive.
from google.colab import drive

drive.mount(mountpoint='/content/drive')

Mounted at /content/drive


### Data preparation

ADA — human-annotated dataset (`update-190.zip`)

In [None]:
# Extract the human-annotated ADA archive into the current working directory.
# -o overwrites existing files without prompting, so re-running the cell never
# blocks on a "replace?" question; -q suppresses the per-file extraction log.
!unzip -o -q "/content/drive/MyDrive/001_projects/FSL/data/human_annotated/update-190.zip"

HCFA — augmented dataset (`hcfa_augmented_data_100.zip`)

In [None]:
# Extract the augmented HCFA archive into the current working directory.
# NOTE: the archive's entries are prefixed with "content/", so the files land
# under ./content/hcfa_augmented_data/ relative to the working directory.
# -o overwrites existing files without prompting, so re-running the cell never
# blocks on a "replace?" question; -q suppresses the per-file extraction log.
!unzip -o -q "/content/drive/MyDrive/001_projects/FSL/data/augmented_data/hcfa_augmented_data_100.zip"

Archive:  /content/drive/MyDrive/001_projects/FSL/data/augmented_data/hcfa_augmented_data_100.zip
   creating: content/hcfa_augmented_data/
   creating: content/hcfa_augmented_data/images/
   creating: content/hcfa_augmented_data/images/train/
  inflating: content/hcfa_augmented_data/images/train/1179543BAZ001_001_1.jpg  
  inflating: content/hcfa_augmented_data/images/train/11795437AZ001_001_0.jpg  
  inflating: content/hcfa_augmented_data/images/train/11795435AZ013_001_0.jpg  
  inflating: content/hcfa_augmented_data/images/train/11795449AZ011_001_2.jpg  
  inflating: content/hcfa_augmented_data/images/train/117914B4AZ012_001_0.jpg  
  inflating: content/hcfa_augmented_data/images/train/11795447AZ029_001_2.jpg  
  inflating: content/hcfa_augmented_data/images/train/1179543MAZ008_001_2.jpg  
  inflating: content/hcfa_augmented_data/images/train/11795439AZ027_001_0.jpg  
  inflating: content/hcfa_augmented_data/images/train/117914B9AZ027_001_1.jpg  
  inflating: content/hcfa_augmented_

In [None]:
import os
import shutil
from sklearn.model_selection import train_test_split

# Source dataset: images/ and labels/ live side by side under root_folder.
root_folder = "/content/update-190"
images_folder = os.path.join(root_folder, "images")
labels_folder = os.path.join(root_folder, "labels")

# Destination layout: data/{images,labels}/{train,valid}
root_train_folder = os.path.join("data", "images", "train")
root_val_folder = os.path.join("data", "images", "valid")
root_train_labels_folder = os.path.join("data", "labels", "train")
root_val_labels_folder = os.path.join("data", "labels", "valid")

for _folder in (
    root_train_folder,
    root_val_folder,
    root_train_labels_folder,
    root_val_labels_folder,
):
    os.makedirs(_folder, exist_ok=True)


def _label_name(image_name):
    """Return the label file name for an image: same stem, ``.txt`` extension."""
    return os.path.splitext(image_name)[0] + ".txt"


def _copy_split(image_names, images_dst, labels_dst):
    """Copy every image in ``image_names`` and its label file into the given split folders."""
    for image_name in image_names:
        label_name = _label_name(image_name)
        shutil.copy(os.path.join(images_folder, image_name), os.path.join(images_dst, image_name))
        shutil.copy(os.path.join(labels_folder, label_name), os.path.join(labels_dst, label_name))


# os.listdir returns entries in arbitrary order; sorting makes the
# random_state=42 split below identical from run to run.
_candidate_files = sorted(
    f for f in os.listdir(images_folder) if os.path.isfile(os.path.join(images_folder, f))
)

# Keep only images that have a label file. Checking up front avoids a
# FileNotFoundError halfway through copying, which would leave a partial dataset.
image_files = [
    f for f in _candidate_files if os.path.isfile(os.path.join(labels_folder, _label_name(f)))
]
_kept = set(image_files)
_unlabeled_files = [f for f in _candidate_files if f not in _kept]
if _unlabeled_files:
    print(f"Skipping {len(_unlabeled_files)} file(s) with no matching label: {_unlabeled_files[:10]}")

# Split the dataset: 80% train / 20% validation
train_images, val_images = train_test_split(image_files, test_size=0.2, random_state=42)

# Copy images and labels into their split folders
_copy_split(train_images, root_train_folder, root_train_labels_folder)
_copy_split(val_images, root_val_folder, root_val_labels_folder)


In [None]:
# %pip installs into the running kernel's environment. The version is pinned
# to the release this notebook was last run with, so a fresh run resolves the
# same ultralytics API.
%pip install -q ultralytics==8.0.238

Collecting ultralytics
  Downloading ultralytics-8.0.238-py3-none-any.whl (695 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m695.2/695.2 kB[0m [31m6.5 MB/s[0m eta [36m0:00:00[0m
Collecting thop>=0.1.1 (from ultralytics)
  Downloading thop-0.1.1.post2209072238-py3-none-any.whl (15 kB)
Installing collected packages: thop, ultralytics
Successfully installed thop-0.1.1.post2209072238 ultralytics-8.0.238


### Start Inference

In [None]:
from ultralytics import YOLO
from PIL import Image

In [None]:
import os

# Inputs for inference: the image to run on and the checkpoint to load.
test_image_path = "/content/2027C44MD009_001_1.jpg"
best_model_path = "/content/drive/MyDrive/001_projects/FSL/yolo_ada_initial_model_v1/train3/weights/best.pt"

# Presumably switches off Weights & Biases logging for this session — TODO confirm
# it is still needed for an inference-only run.
os.environ.update(WANDB_DISABLED='true')

In [None]:
# Load the trained weights stored at best_model_path
model = YOLO(best_model_path)

# Run inference on the test image; the call returns a list of results
results = model(test_image_path)

# Render, display and save each result
for idx, r in enumerate(results):
    im_array = r.plot(labels=True)  # BGR numpy array with the predictions drawn on it
    im = Image.fromarray(im_array[..., ::-1])  # reverse the channel axis: BGR -> RGB PIL image
    # Render inline with the notebook's built-in display(); PIL's im.show()
    # launches an external viewer, which a hosted notebook does not have.
    display(im)
    # The first result keeps the original file name; any further result gets an
    # index suffix instead of overwriting the previous image.
    im.save('results.jpg' if idx == 0 else f'results_{idx}.jpg')


image 1/1 /content/2027C44MD009_001_1.jpg: 1440x1152 1 10_Relationship, 1 11_Company_or_plan, 1 12_Policyholder_details, 1 13_DOB, 1 14_Gender, 1 15_SSN, 1 16_Plan_Number, 1 17_Employer_Name, 1 18_Relationship, 1 19_Use, 1 1_Type_of_Transaction, 1 20_Name, 1 21_DOB, 1 22_Gender, 1 23_Patient_ID, 1 24_31_Table, 1 2_Pre_Number, 1 31_A_Other_Fee, 1 32_Total_Fee, 1 33_Missing_Teeth, 1 34_A_Diag_Codes, 1 34_Code_list_Qualifier, 1 35_Remarks, 1 36_Signature, 1 37_Signature, 1 38_Place_of_treatment, 1 39_Enclosures, 1 3_Company_address, 1 40_Orthodontics, 1 41_Date, 1 42_Months_remaining, 1 43_Prosthesis, 1 44_Date, 1 45_Treatment_resulting_form, 1 46_Date_of_accident, 1 47_Auto_Accident_state, 1 48_Dentist_Address, 1 49_NPI, 1 4_Other_Coverage, 1 50_Licence_Number, 1 51_SSN_TIN, 1 52_A_Addl_Provider_id, 1 52_Phone_Number, 1 53_Signature, 1 54_NPI, 1 55_Licence_Number, 1 56_Address, 1 57_Phone_Number, 1 58_Addl_provider_id, 1 5_Name, 1 6_DOB, 1 7_Gender, 1 8_SSN, 1 9_Plan_Number, 21.6ms
Spee