# Libraries and Modules

In [None]:
import numpy as np # linear algebra
import pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)
import matplotlib.pyplot as plt # data visualization
import seaborn as sns # statistical data visualization
from sklearn.preprocessing import OneHotEncoder, LabelEncoder
%matplotlib inline
from sklearn.model_selection import train_test_split

#source : https://www.kaggle.com/code/prashant111/random-forest-classifier-tutorial

In [None]:
pip install --upgrade scikit-learn

Collecting scikit-learn
  Downloading scikit_learn-1.3.2-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (10.8 MB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m10.8/10.8 MB[0m [31m80.9 MB/s[0m eta [36m0:00:00[0m
Installing collected packages: scikit-learn
  Attempting uninstall: scikit-learn
    Found existing installation: scikit-learn 1.2.2
    Uninstalling scikit-learn-1.2.2:
      Successfully uninstalled scikit-learn-1.2.2
Successfully installed scikit-learn-1.3.2


In [None]:
# Mount Google Drive
from google.colab import drive
drive.mount('/content/subprogram6.pkl')

# Create a symbolic link
!ln -s /content/gdrive/My\ Drive/ /mydriveCESU

# List the contents of your Google Drive
!ls /mydriveCESU

In [None]:
# Path of the "May Trabaho" program table for the 17-below age group.
# NOTE(review): a later cell in this notebook writes a file with this name to the
# working directory — confirm that cell has been run before this one on a fresh runtime.
data = '/content/cesu-17-below-Maytrabaho.csv'
df = pd.read_csv(data)
# view dimensions of dataset
# NOTE(review): the recorded output shows 8191 rows, while the generator cell writes
# 2 * 4 * 1024 = 8192 data rows — confirm which version of the file is being read.
print('Datasets:', df.shape)

Datasets: (8191, 15)


# Training datasets

In [None]:
# Load the program table; its text-valued demographic columns are replaced below
# by integer codes so the classifier receives numeric features.
data = pd.read_csv('/content/cesu-17-below-Maytrabaho.csv')

# Define custom encoding dictionaries for each categorical column
encoding_dict_kasarian = {'Lalake': 0, 'Babae': 1}
encoding_dict_edad= {'17-below': 0, '18-24': 1, '25-34': 2, '35-44': 3, '45-54': 4, '55-64': 5, '65-Above': 6 }
encoding_dict_antas = {'Hindi nakapagtapos ng Elementarya':0, 'Elementarya':1, 'Hindi nakapagtapos ng Sekundarya':2, 'Sekundarya':3, 'Kolehiyo':4, 'Hindi nakapagtapos ng Kolehiyo':5, 'Masters Degree':6, 'Doctorate Degree':7, 'Hindi nakapag-aral':8}  # Define your categories and values
encoding_dict_uri = {'May Trabaho': 1, 'Walang Trabaho': 0}  # Define your categories and values

# Which dictionary encodes which column. The target column 'Program' is not
# listed: it keeps its original text labels.
column_encodings = {
    'Kasarian': encoding_dict_kasarian,
    'Edad': encoding_dict_edad,
    'Antas na tinapos': encoding_dict_antas,
    'Uri ng trabaho': encoding_dict_uri,
}

# Apply custom encoding to the categorical columns
for column, mapping in column_encodings.items():
    encoded = data[column].map(mapping)
    # `Series.map` turns every label that is missing from the dictionary into NaN
    # without any warning; stop here and name the offending labels instead of
    # letting NaN reach the model.
    unmapped = data.loc[encoded.isna(), column].unique()
    if len(unmapped) > 0:
        raise ValueError(
            f"Column {column!r} contains values with no encoding: {unmapped.tolist()}"
        )
    data[column] = encoded

# Split the data into training and testing sets
X = data.drop(['Program'], axis=1)  # Features
y = data['Program']  # Target variable

# 67% / 33% split with a fixed seed so the partition is reproducible.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.33, random_state=42)


In [None]:
# Preview the first rows of the encoded training features.
X_train.head()

In [None]:
# Preview the first rows of the encoded test features.
X_test.head()

In [None]:
# Check the data types in X_train; after the encoding step every feature
# column is expected to be numeric.

X_train.dtypes

In [None]:
# Check the shape (rows, columns) of X_train and X_test to confirm the
# train/test split sizes.

X_train.shape, X_test.shape

((5487, 14), (2704, 14))

In [None]:
# Column order of the program table: four demographic columns, the ten
# service-interest columns, and the target column 'Program'.
col_names = [
    'Kasarian',
    'Edad',
    'Antas na tinapos',
    'Uri ng trabaho',
    'Serbisyong Pangedukasyon',
    'Pagsasanay Pangkabuhayan (Livelihood)',
    'Pagtatanim',
    'Serbisyong Pangkalusugan',
    'Serbisyong Dental',
    'Kaalamang Pangkultura',
    'Values Formation at Moral Recovery',
    'Ayudang Pagkain (Food Assistance)',
    'Pagrerecycle',
    'Pagsasanay Ukol sa Teknolohiya',
    'Program',
]

# Relabel the frame; pandas raises ValueError if the number of names does not
# match the number of columns.
df.columns = col_names

# Only the last expression of a cell is displayed, so show the relabelled frame.
df.head()

# Random Forest Algorithm

In [None]:
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, classification_report, confusion_matrix

# Build a 100-tree forest with a fixed seed and train it on the training split.
# `fit` returns the estimator itself, so construction and training are chained.
rfc = RandomForestClassifier(n_estimators=100, random_state=42).fit(X_train, y_train)

# Predict the held-out rows and compare the predictions with the true labels.
# NOTE(review): the generator cells in this notebook derive 'Program' from the
# feature columns by fixed rules, so a perfect score may say little about
# generalization — confirm how this metric is meant to be read.
y_pred = rfc.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)

# Check accuracy score
accuracy_message = 'Model accuracy score with 100 decision-trees: {0:0.4f}'
print(accuracy_message.format(accuracy))


Model accuracy score with 100 decision-trees: 1.0000


In [None]:
# Evaluate the model
accuracy = accuracy_score(y_test, y_pred)
print(f'Accuracy: {accuracy:.2f}')

# Display additional evaluation metrics
print(classification_report(y_test, y_pred))
print(confusion_matrix(y_test, y_pred))

# Export the model

In [None]:
import joblib
# Assuming 'rfc' is your trained Random Forest Classifier
# Serialize the classifier to 'trained_modelCESU6.pkl' in the working directory.
# NOTE(review): the file should be loaded with the same scikit-learn version that
# produced it — confirm the version used by whatever consumes this model.
joblib.dump(rfc, 'trained_modelCESU6.pkl')

['trained_modelCESU6.pkl']

In [None]:
from google.colab import files
# Ask Colab to send the saved program model to the local machine through the browser.
files.download('trained_modelCESU6.pkl')

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

# **Walang Trabaho**

In [None]:
import itertools
import csv

# Every possible 0/1 answer pattern for the ten service-interest columns.
combinations = list(itertools.product([0, 1], repeat=10))

csv_file = "cesu-17-below-WalangTrabaho.csv"

# Column titles, in the order the values are written on every row.
header = [
    "Kasarian",
    "Edad",
    "Antas na tinapos",
    "Uri ng trabaho",
    "Serbisyong Pangedukasyon",
    "Pagsasanay Pangkabuhayan (Livelihood)",
    "Pagtatanim",
    "Serbisyong Pangkalusugan",
    "Serbisyong Dental",
    "Kaalamang Pangkultura",
    "Values Formation at Moral Recovery",
    "Ayudang Pagkain (Food Assistance)",
    "Pagrerecycle",
    "Pagsasanay Ukol sa Teknolohiya",
    "Program",
]

# Short names for the ten answer slots of a combination, in column order.
answer_names = (
    "serbisyong_pangedukasyon",
    "pagsasanay_pangkabuhayan",
    "pagtatanim",
    "serbisyong_pangkalusugan",
    "dental",
    "kultura",
    "values",
    "ayudang_pagkain",
    "recycle",
    "teknolohiya",
)

# Labelling rules, highest priority first: the first listed answer that equals 1
# decides the program written for the row.
program_rules = [
    ("serbisyong_pangedukasyon", "Literacy"),
    ("teknolohiya", "Literacy"),
    ("values", "Values Formation"),
    ("kultura", "Cultural Enhancement"),
    ("pagtatanim", "Environmental Stewardship"),
    ("recycle", "Environmental Stewardship"),
    ("serbisyong_pangkalusugan", "Health and Wellness"),
    ("ayudang_pagkain", "Socio-economic"),
    ("pagsasanay_pangkabuhayan", "Socio-economic"),
    ("dental", "Health and Wellness"),
]
default_program = "Literacy"  # written when every answer is 0

# Age group and employment status are fixed for this file; gender and
# education level are enumerated.
constant_values = {
    "edad": "17-below",
    "trabaho": "Walang Trabaho",
}
gender_values = ["Babae", "Lalake"]
education_values = [
    "Hindi nakapagtapos ng Elementarya",
    "Elementarya",
    "Hindi nakapagtapos ng Sekundarya",
    "Sekundarya",
]

with open(csv_file, mode="w", newline="") as file:
    writer = csv.writer(file)
    writer.writerow(header)

    # Gender varies slowest, then education level, then the answer pattern.
    for kasarian_value, antas_value in itertools.product(gender_values, education_values):
        demographics = [
            kasarian_value,
            constant_values["edad"],
            antas_value,
            constant_values["trabaho"],
        ]

        for combo in combinations:
            answers = dict(zip(answer_names, combo))
            predict_value = next(
                (program for name, program in program_rules if answers[name] == 1),
                default_program,
            )

            # One row: demographic values, the ten 0/1 answers, then the label.
            writer.writerow(demographics + list(combo) + [predict_value])

print("CSV file created: " + csv_file)


CSV file created: cesu-17-below-WalangTrabaho.csv


# May Trabaho

In [None]:
import itertools
import csv

# Every possible 0/1 answer pattern for the ten service-interest columns.
combinations = list(itertools.product([0, 1], repeat=10))

csv_file = "cesu-17-below-Maytrabaho.csv"

# Column titles, in the order the values are written on every row.
header = [
    "Kasarian",
    "Edad",
    "Antas na tinapos",
    "Uri ng trabaho",
    "Serbisyong Pangedukasyon",
    "Pagsasanay Pangkabuhayan (Livelihood)",
    "Pagtatanim",
    "Serbisyong Pangkalusugan",
    "Serbisyong Dental",
    "Kaalamang Pangkultura",
    "Values Formation at Moral Recovery",
    "Ayudang Pagkain (Food Assistance)",
    "Pagrerecycle",
    "Pagsasanay Ukol sa Teknolohiya",
    "Program",
]

# Short names for the ten answer slots of a combination, in column order.
answer_names = (
    "serbisyong_pangedukasyon",
    "pagsasanay_pangkabuhayan",
    "pagtatanim",
    "serbisyong_pangkalusugan",
    "dental",
    "kultura",
    "values",
    "ayudang_pagkain",
    "recycle",
    "teknolohiya",
)

# Labelling rules, highest priority first: the first listed answer that equals 1
# decides the program written for the row.
program_rules = [
    ("teknolohiya", "Literacy"),
    ("pagsasanay_pangkabuhayan", "Socio-economic"),
    ("serbisyong_pangedukasyon", "Literacy"),
    ("values", "Values Formation"),
    ("kultura", "Cultural Enhancement"),
    ("pagtatanim", "Environmental Stewardship"),
    ("recycle", "Environmental Stewardship"),
    ("serbisyong_pangkalusugan", "Health and Wellness"),
    ("ayudang_pagkain", "Socio-economic"),
    ("dental", "Health and Wellness"),
]
default_program = "Literacy"  # written when every answer is 0

# Age group and employment status are fixed for this file; gender and
# education level are enumerated.
constant_values = {
    "edad": "17-below",
    "trabaho": "May Trabaho",
}
gender_values = ["Babae", "Lalake"]
education_values = [
    "Hindi nakapagtapos ng Elementarya",
    "Elementarya",
    "Hindi nakapagtapos ng Sekundarya",
    "Sekundarya",
]

with open(csv_file, mode="w", newline="") as file:
    writer = csv.writer(file)
    writer.writerow(header)

    # Gender varies slowest, then education level, then the answer pattern.
    for kasarian_value, antas_value in itertools.product(gender_values, education_values):
        demographics = [
            kasarian_value,
            constant_values["edad"],
            antas_value,
            constant_values["trabaho"],
        ]

        for combo in combinations:
            answers = dict(zip(answer_names, combo))
            predict_value = next(
                (program for name, program in program_rules if answers[name] == 1),
                default_program,
            )

            # One row: demographic values, the ten 0/1 answers, then the label.
            writer.writerow(demographics + list(combo) + [predict_value])

print("CSV file created: " + csv_file)


CSV file created: cesu-17-below-Maytrabaho.csv


# For Subprogram Model


In [None]:
import pandas as pd
from sklearn.model_selection import train_test_split

# Load the CSV data
data2 = pd.read_csv('/content/cesu17-below_subprogram_May_Trabaho.csv')

# Keep an independent, unencoded snapshot for inspection. `pd.DataFrame(data2)`
# does not copy a DataFrame input by default, so it would not be isolated from
# the in-place encoding applied to `data2` below.
df2 = data2.copy()

# Define custom encoding dictionaries for each categorical column
encoding_dict_kasarian = {'Lalake': 0, 'Babae': 1}
encoding_dict_edad= {'17-below': 0, '18-24': 1, '25-34': 2, '35-44': 3, '45-54': 4, '55-64': 5, '65-Above': 6 }
encoding_dict_antas = {'Hindi nakapagtapos ng Elementarya':0, 'Elementarya':1, 'Hindi nakapagtapos ng Sekundarya':2, 'Sekundarya':3, 'Kolehiyo':4, 'Hindi nakapagtapos ng Kolehiyo':5, 'Masters Degree':6, 'Doctorate Degree':7, 'Hindi nakapag-aral':8}
encoding_dict_uri = {'May Trabaho': 1, 'Walang Trabaho': 0}
encoding_dict_program = {'Literacy': 0, 'Socio-economic': 1, 'Environmental Stewardship': 2, 'Health and Wellness': 3, 'Cultural Enhancement': 4, 'Values Formation': 5, 'Disaster Management': 6, 'Gender and Development': 7}

# Which dictionary encodes which column. 'Program' is a feature of this model,
# so it is encoded too; the target 'Sub Program' keeps its text labels.
column_encodings = {
    'Kasarian': encoding_dict_kasarian,
    'Edad': encoding_dict_edad,
    'Antas na tinapos': encoding_dict_antas,
    'Uri ng trabaho': encoding_dict_uri,
    'Program': encoding_dict_program,
}

# Apply custom encoding to the categorical columns
for column, mapping in column_encodings.items():
    encoded = data2[column].map(mapping)
    # `Series.map` turns every label that is missing from the dictionary into NaN
    # without any warning; stop here and name the offending labels instead of
    # letting NaN reach the model.
    unmapped = data2.loc[encoded.isna(), column].unique()
    if len(unmapped) > 0:
        raise ValueError(
            f"Column {column!r} contains values with no encoding: {unmapped.tolist()}"
        )
    data2[column] = encoded

# Split the data into training and testing sets
X2 = data2.drop(['Sub Program'], axis=1)  # Features
y2 = data2['Sub Program']  # Target variable

# 67% / 33% split with a fixed seed so the partition is reproducible.
X_train2, X_test2, y_train2, y_test2 = train_test_split(X2, y2, test_size=0.33, random_state=42)


In [None]:
# Preview the first rows of the encoded sub-program training features.
X_train2.head()

In [None]:
# Preview the first rows of the encoded sub-program test features.
X_test2.head()

In [None]:

# Check the data types in X_train2; after the encoding step every feature
# column is expected to be numeric.
X_train2.dtypes

In [None]:
# Column order of the sub-program table: four demographic columns, the ten
# service-interest columns, 'Program', and the target column 'Sub Program'.
col_names = [
    'Kasarian',
    'Edad',
    'Antas na tinapos',
    'Uri ng trabaho',
    'Serbisyong Pangedukasyon',
    'Pagsasanay Pangkabuhayan (Livelihood)',
    'Pagtatanim',
    'Serbisyong Pangkalusugan',
    'Serbisyong Dental',
    'Kaalamang Pangkultura',
    'Values Formation at Moral Recovery',
    'Ayudang Pagkain (Food Assistance)',
    'Pagrerecycle',
    'Pagsasanay Ukol sa Teknolohiya',
    'Program',
    'Sub Program',
]

# Relabel the frame; pandas raises ValueError if the number of names does not
# match the number of columns.
df2.columns = col_names

# Only the last expression of a cell is displayed, so show the relabelled frame.
df2.head()

In [None]:
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import accuracy_score, classification_report, confusion_matrix

# Build a 100-tree forest with a fixed seed and train it on the sub-program
# training split. `fit` returns the estimator itself, so the calls are chained.
rfc2 = RandomForestClassifier(n_estimators=100, random_state=42).fit(X_train2, y_train2)

# Predict the held-out rows and compare the predictions with the true labels.
# NOTE(review): the generator cells in this notebook derive 'Sub Program' from
# the feature columns by fixed rules, so a perfect score may say little about
# generalization — confirm how this metric is meant to be read.
y_pred2 = rfc2.predict(X_test2)
accuracy = accuracy_score(y_test2, y_pred2)

# Check accuracy score
accuracy_message = 'Model accuracy score with 100 decision-trees: {0:0.4f}'
print(accuracy_message.format(accuracy))


Model accuracy score with 100 decision-trees: 1.0000


In [None]:
import joblib
from google.colab import files


# Serialize the sub-program classifier to 'subprogram6.pkl' in the working
# directory, then ask Colab to send that file to the browser as a download.
# NOTE(review): the file should be loaded with the same scikit-learn version that
# produced it — confirm the version used by whatever consumes this model.
joblib.dump(rfc2, 'subprogram6.pkl')
files.download('subprogram6.pkl')

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

# Walang Trabaho (Sub)

In [None]:
import itertools
import csv

# Every possible 0/1 answer pattern for the ten service-interest columns.
combinations = list(itertools.product([0, 1], repeat=10))

csv_file = "cesu17-below_subprogram_Walang_Trabaho.csv"

# Column titles, in the order the values are written on every row.
header = [
    "Kasarian",
    "Edad",
    "Antas na tinapos",
    "Uri ng trabaho",
    "Serbisyong Pangedukasyon",
    "Pagsasanay Pangkabuhayan (Livelihood)",
    "Pagtatanim",
    "Serbisyong Pangkalusugan",
    "Serbisyong Dental",
    "Kaalamang Pangkultura",
    "Values Formation at Moral Recovery",
    "Ayudang Pagkain (Food Assistance)",
    "Pagrerecycle",
    "Pagsasanay Ukol sa Teknolohiya",
    "Program",
    "Sub Program",
]

# Short names for the ten answer slots of a combination, in column order.
answer_names = (
    "serbisyong_pangedukasyon",
    "pagsasanay_pangkabuhayan",
    "pagtatanim",
    "serbisyong_pangkalusugan",
    "dental",
    "kultura",
    "values",
    "ayudang_pagkain",
    "recycle",
    "teknolohiya",
)

# Labelling rules, highest priority first: the first listed answer that equals 1
# decides the (program, sub-program) pair written for the row.
label_rules = [
    ("serbisyong_pangedukasyon", "Literacy", "Media and Basic Literacy"),
    ("teknolohiya", "Literacy", "ICT Literacy Program"),
    ("values", "Values Formation", "Personality Development"),
    ("kultura", "Cultural Enhancement", "Culture and Arts"),
    ("pagtatanim", "Environmental Stewardship", "Seminar & Tree Planting Activities"),
    ("recycle", "Environmental Stewardship", "Clean-up Drive"),
    ("serbisyong_pangkalusugan", "Health and Wellness", "Medical and Dental Mission"),
    ("ayudang_pagkain", "Socio-economic", "Food assistance"),
    ("pagsasanay_pangkabuhayan", "Socio-economic", "Training/seminar Program"),
    ("dental", "Health and Wellness", "Medical and Dental Mission"),
]
default_labels = ("Literacy", "Media and Basic Literacy")  # every answer is 0

# Age group and employment status are fixed for this file; gender and
# education level are enumerated.
constant_values = {
    "edad": "17-below",
    "trabaho": "Walang Trabaho",
}
gender_values = ["Babae", "Lalake"]
education_values = [
    "Hindi nakapagtapos ng Elementarya",
    "Elementarya",
    "Hindi nakapagtapos ng Sekundarya",
    "Sekundarya",
]

with open(csv_file, mode="w", newline="") as file:
    writer = csv.writer(file)
    writer.writerow(header)

    # Gender varies slowest, then education level, then the answer pattern.
    for kasarian_value, antas_value in itertools.product(gender_values, education_values):
        demographics = [
            kasarian_value,
            constant_values["edad"],
            antas_value,
            constant_values["trabaho"],
        ]

        for combo in combinations:
            answers = dict(zip(answer_names, combo))
            predict_value, sub_program = next(
                (
                    (program, sub)
                    for name, program, sub in label_rules
                    if answers[name] == 1
                ),
                default_labels,
            )

            # One row: demographic values, the ten 0/1 answers, then both labels.
            writer.writerow(demographics + list(combo) + [predict_value, sub_program])

print("CSV file created: " + csv_file)


CSV file created: cesu17-below_subprogram_Walang_Trabaho.csv


# May Trabaho (Sub)

In [None]:
import itertools
import csv

# Every possible 0/1 answer pattern for the ten service-interest columns.
combinations = list(itertools.product([0, 1], repeat=10))

csv_file = "cesu17-below_subprogram_May_Trabaho.csv"

# Column titles, in the order the values are written on every row.
header = [
    "Kasarian",
    "Edad",
    "Antas na tinapos",
    "Uri ng trabaho",
    "Serbisyong Pangedukasyon",
    "Pagsasanay Pangkabuhayan (Livelihood)",
    "Pagtatanim",
    "Serbisyong Pangkalusugan",
    "Serbisyong Dental",
    "Kaalamang Pangkultura",
    "Values Formation at Moral Recovery",
    "Ayudang Pagkain (Food Assistance)",
    "Pagrerecycle",
    "Pagsasanay Ukol sa Teknolohiya",
    "Program",
    "Sub Program",
]

# Short names for the ten answer slots of a combination, in column order.
answer_names = (
    "serbisyong_pangedukasyon",
    "pagsasanay_pangkabuhayan",
    "pagtatanim",
    "serbisyong_pangkalusugan",
    "dental",
    "kultura",
    "values",
    "ayudang_pagkain",
    "recycle",
    "teknolohiya",
)

# Labelling rules, highest priority first: the first listed answer that equals 1
# decides the (program, sub-program) pair written for the row.
label_rules = [
    ("teknolohiya", "Literacy", "ICT Literacy Program"),
    ("pagsasanay_pangkabuhayan", "Socio-economic", "Training/seminar Program"),
    ("serbisyong_pangedukasyon", "Literacy", "Media and Basic Literacy"),
    ("values", "Values Formation", "Personality Development"),
    ("kultura", "Cultural Enhancement", "Culture and Arts"),
    ("pagtatanim", "Environmental Stewardship", "Seminar & Tree Planting Activities"),
    ("recycle", "Environmental Stewardship", "Clean-up Drive"),
    ("serbisyong_pangkalusugan", "Health and Wellness", "Medical and Dental Mission"),
    ("ayudang_pagkain", "Socio-economic", "Food assistance"),
    ("dental", "Health and Wellness", "Medical and Dental Mission"),
]
default_labels = ("Literacy", "ICT Literacy Program")  # every answer is 0

# Age group and employment status are fixed for this file; gender and
# education level are enumerated.
constant_values = {
    "edad": "17-below",
    "trabaho": "May Trabaho",
}
gender_values = ["Babae", "Lalake"]
education_values = [
    "Hindi nakapagtapos ng Elementarya",
    "Elementarya",
    "Hindi nakapagtapos ng Sekundarya",
    "Sekundarya",
]

with open(csv_file, mode="w", newline="") as file:
    writer = csv.writer(file)
    writer.writerow(header)

    # Gender varies slowest, then education level, then the answer pattern.
    for kasarian_value, antas_value in itertools.product(gender_values, education_values):
        demographics = [
            kasarian_value,
            constant_values["edad"],
            antas_value,
            constant_values["trabaho"],
        ]

        for combo in combinations:
            answers = dict(zip(answer_names, combo))
            predict_value, sub_program = next(
                (
                    (program, sub)
                    for name, program, sub in label_rules
                    if answers[name] == 1
                ),
                default_labels,
            )

            # One row: demographic values, the ten 0/1 answers, then both labels.
            writer.writerow(demographics + list(combo) + [predict_value, sub_program])

print("CSV file created: " + csv_file)


CSV file created: cesu17-below_subprogram_May_Trabaho.csv


# Checking the dataset for missing values

In [None]:
import pandas as pd
# Dataset to audit for missing values.
file_path = "/content/cesu_subprogram_v6.csv"
# NOTE(review): this rebinds `df`, which earlier cells use for the program
# table — confirm nothing run afterwards still expects the earlier frame.
df = pd.read_csv(file_path)
# Boolean frame with the same shape as `df`: True wherever a cell is NaN.
nan_check = df.isna()

In [None]:
# Column-wise NaN tally; the grand total is the sum of the per-column counts.
nan_count_per_column = nan_check.sum()
nan_count_total = nan_count_per_column.sum()

print("NaN count per column:", nan_count_per_column, sep="\n")

print("\nTotal NaN count in the DataFrame:", nan_count_total)


In [None]:
# Boolean mask over the rows: True when at least one column of the row is NaN.
rows_with_nan = nan_check.any(axis="columns")

# Index labels of the rows selected by the mask.
rows_with_nan_indexes = df.index[rows_with_nan]

# Heading and index, each on its own line.
print("Rows with NaN values:", rows_with_nan_indexes, sep="\n")


Rows with NaN values:
Int64Index([], dtype='int64')


In [None]:
# Boolean mask over the rows: True when at least one column of the row is NaN.
rows_with_nan = nan_check.any(axis="columns")

# Index labels of the rows selected by the mask.
rows_with_nan_indexes = df.index[rows_with_nan]

# Heading and index, each on its own line.
print("Rows with NaN values:", rows_with_nan_indexes, sep="\n")

# For every affected row, name the columns whose value is NaN. Each
# `nan_columns` is that row's boolean flags, so indexing it with itself keeps
# only the entries that are True.
for row_index, nan_columns in nan_check.loc[rows_with_nan].iterrows():
    print(f"NaN columns in row {row_index}:")
    print(nan_columns[nan_columns].index)


Rows with NaN values:
Int64Index([], dtype='int64')


In [None]:

#FOR 17-below WALANG TRABAHO

                if serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
                    sub_program = "Media and Basic Literacy"
                elif teknolohiya == 1:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"
                elif values == 1:
                    predict_value = "Values Formation"
                    sub_program = "Personality Development"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
                    sub_program = "Culture and Arts"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Seminar & Tree Planting Activities"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Clean-up Drive"

                elif serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"

                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Food assistance"

                elif pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Training/seminar Program"
                elif dental == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                else:
                    predict_value = "Literacy"
                    sub_program = "Media and Basic Literacy"

#FOR 17-below MAY TRABAHO

                if teknolohiya == 1:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"
                elif pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Training/seminar Program"
                elif serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
                    sub_program = "Media and Basic Literacy"
                elif values == 1:
                    predict_value = "Values Formation"
                    sub_program = "Personality Development"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
                    sub_program = "Culture and Arts"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Seminar & Tree Planting Activities"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Clean-up Drive"
                elif serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Food assistance"
                elif dental == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                else:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"



#FOR 18-24 WALANG TRABAHO
	"Hindi nakapagtapos ng Kolehiyo",
	"Kolehiyo"

		            if pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Livelihood Program"
                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Food assistance"
                elif teknolohiya == 1:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"
                elif serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
                    sub_program = "Basic Training/Seminar Program"
                elif serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Seminar & Tree Planting Activities"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Environmental Conservation and Sustainability"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
                    sub_program = "Culture and Arts"
                elif values == 1:
                    predict_value = "Values Formation"
                    sub_program = "Personality Development"
                elif dental == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                else:
                    predict_value = "Socio-economic"
                    sub_program = "Livelihood Program"

#FOR 18-24 MAY TRABAHO
	"Hindi nakapagtapos ng Kolehiyo",
	"Kolehiyo"


                if teknolohiya == 1:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"
                elif serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Bloodletting Activity"
                elif pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Training/seminar Program"
                elif serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
                    sub_program = "Financial Literacy"
                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Feeding Program"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Seminar & Tree Planting Activities"
                elif dental == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Environmental Conservation and Sustainability"
                elif values == 1:
                    predict_value = "Values Formation"
                    sub_program = "Spiritual Wellness"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
                    sub_program = "Culture and Arts"
                else:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"


#FOR 25-34 WALANG TRABAHO
	"Masters Degree",

		           if pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Livelihood Program"
                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Food assistance"
                elif teknolohiya == 1:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"
                elif serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Basic Food Safety and Sanitation with First Aid"
                elif serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
                    sub_program = "Training/Seminar Program"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Seminar & Tree Planting Activities"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Environmental Conservation and Sustainability"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
                    sub_program = "Culture and Arts"
                elif values == 1:
                    predict_value = "Values Formation"
                    sub_program = "Spiritual Wellness"
                elif dental == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                else:
                    predict_value = "Socio-economic"
                    sub_program = "Livelihood Program"

#FOR 25-34 MAY TRABAHO
	"Masters Degree",

		            if serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif teknolohiya == 1:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"
                elif dental == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Training/seminar Program"
                elif serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
                    sub_program = "Financial Literacy"
                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Feeding program"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Seminar & Tree Planting Activities"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Environmental Conservation and Sustainability"
                elif values == 1:
                    predict_value = "Values Formation"
                    sub_program = "Spiritual Wellness"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
                    sub_program = "Culture and Arts"
                else:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"


# FOR 35-44 WALANG TRABAHO (ages 35-44, unemployed)
	"Masters Degree",
  "Doctorate Degree",

		            if pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Livelihood Program"
                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Food Assistance"
                elif serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif teknolohiya == 1:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"
                elif serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
                    sub_program = "Training/Seminar Program"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Seminar & Tree Planting Activities"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Environmental Conservation and Sustainability"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
                    sub_program = "Culture and Arts"
                elif values == 1:
                    predict_value = "Values Formation"
                    sub_program = "Spiritual Wellness"
                elif dental == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                else:
                    predict_value = "Socio-economic"
                    sub_program = "Livelihood Program"

# FOR 35-44 MAY TRABAHO (ages 35-44, employed)
	      "Masters Degree",
        "Doctorate Degree",

		            if serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif teknolohiya == 1:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"
                elif dental == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
                    sub_program = "Financial Literacy"
                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Feeding Program"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Seminar & Tree Planting Activities"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Environmental Conservation and Sustainability"
                elif pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Training/seminar Program"
                elif values == 1:
                    predict_value = "Values Formation"
                    sub_program = "Values Formation Program"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
                    sub_program = "Culture and Arts"
                else:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"

# FOR 45-54 WALANG TRABAHO (ages 45-54, unemployed)

	"Masters Degree",
        "Doctorate Degree",

                if pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Livelihood Program"
                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Food assistance"
                elif serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif teknolohiya == 1:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"
                elif serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
                    sub_program = "Basic Training/Seminar Program"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Seminar & Tree Planting Activities"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Environmental Conservation and Sustainability"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
                    sub_program = "Culture and Arts"
                elif values == 1:
                    predict_value = "Values Formation"
                    sub_program = "Values Formation Program"
                elif dental == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                else:
                    predict_value = "Socio-economic"
                    sub_program = "Livelihood Program"



# FOR 45-54 MAY TRABAHO (ages 45-54, employed)
	"Masters Degree",
        "Doctorate Degree",

		            if serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif teknolohiya == 1:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"
                elif dental == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
                    sub_program = "Financial Literacy"
                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Feeding Program"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Seminar & Tree Planting Activities"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Environmental Conservation and Sustainability"
                elif pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Training/seminar Program"
                elif values == 1:
                    predict_value = "Values Formation"
                    sub_program = "Values Formation Program"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
                    sub_program = "Culture and Arts"
                else:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"


# FOR 55-64 WALANG TRABAHO (ages 55-64, unemployed)

        "Masters Degree",
        "Doctorate Degree",


                if serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Food assistance"
                elif dental == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Livelihood Program"
                elif teknolohiya == 1:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"
                elif serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
                    sub_program = "Basic Training/Seminar Program"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Seminar & Tree Planting Activities"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Environmental Conservation and Sustainability"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
                    sub_program = "Culture and Arts"
                elif values == 1:
                    predict_value = "Values Formation"
                    sub_program = "Values Formation Program"
                else:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"

# FOR 55-64 MAY TRABAHO (ages 55-64, employed)

 		            if serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif teknolohiya == 1:
                    predict_value = "Literacy"
                    sub_program = "ICT Literacy Program"
                elif dental == 1:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"
                elif serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
                    sub_program = "Financial Literacy"
                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Feeding Program"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Seminar & Tree Planting Activities"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
                    sub_program = "Environmental Conservation and Sustainability"
                elif pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
                    sub_program = "Training/seminar Program"
                elif values == 1:
                    predict_value = "Values Formation"
                    sub_program = "Values Formation Program"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
                    sub_program = "Culture and Arts"
                else:
                    predict_value = "Health and Wellness"
                    sub_program = "Medical and Dental Mission"


# FOR 65-ABOVE WALANG TRABAHO (ages 65 and above, unemployed)

        "Masters Degree",
        "Doctorate Degree",


                if serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
			              sub_program = "Medical and Dental Mission"
                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
			              sub_program = "Food assistance"
                elif dental == 1:
                    predict_value = "Health and Wellness"
			              sub_program = "Medical and Dental Mission"
                elif pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
			              sub_program = "Livelihood Program"
                elif teknolohiya == 1:
                    predict_value = "Literacy"
			              sub_program = "ICT Literacy Program"
                elif serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
			              sub_program = "Basic Training/Seminar Program"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
			              sub_program = "Seminar & Tree Planting Activities"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
			              sub_program = "Environmental Conservation and Sustainability"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
			              sub_program = "Culture and Arts"
                elif values == 1:
                    predict_value = "Values Formation"
			              sub_program = "Values Formation Program"
                else:
                    predict_value = "Health and Wellness"
			              sub_program = "Medical and Dental Mission"


# FOR 65-ABOVE MAY TRABAHO (ages 65 and above, employed)

 		            if serbisyong_pangkalusugan == 1:
                    predict_value = "Health and Wellness"
			              sub_program = "Medical and Dental Mission"
                elif teknolohiya == 1:
                    predict_value = "Literacy"
			              sub_program = "ICT Literacy Program"
                elif dental == 1:
                    predict_value = "Health and Wellness"
			              sub_program = "Medical and Dental Mission"
                elif serbisyong_pangedukasyon == 1:
                    predict_value = "Literacy"
			              sub_program = "Financial Literacy"
                elif ayudang_pagkain == 1:
                    predict_value = "Socio-economic"
			              sub_program = "Feeding Program"
                elif pagtatanim == 1:
                    predict_value = "Environmental Stewardship"
			              sub_program = "Seminar & Tree Planting Activities"
                elif recycle == 1:
                    predict_value = "Environmental Stewardship"
			              sub_program = "Environmental Conservation and Sustainability"
                elif pagsasanay_pangkabuhayan == 1:
                    predict_value = "Socio-economic"
			              sub_program = "Livelihood Program"
                elif values == 1:
                    predict_value = "Values Formation"
			              sub_program = "Values Formation Program"
                elif kultura == 1:
                    predict_value = "Cultural Enhancement"
			              sub_program = "Culture and Arts"
                else:
                    predict_value = "Health and Wellness"
			              sub_program = "Medical and Dental Mission"






# FOR SPLITTING MODEL


In [1]:
import os
import shutil

# Split the pickled model into several smaller files so each piece stays
# under upload/size limits. Concatenating the parts in order reproduces the
# original file byte-for-byte.

# Input and output file paths
input_file_path = '/content/trained_modelCESU6.pkl'
output_directory = 'split_model_parts'

# Number of parts to produce, and the read buffer used while copying
num_parts = 3
copy_chunk_size = 1024 * 1024  # 1 MiB keeps memory use bounded for large models

# Create the output directory if it doesn't exist
os.makedirs(output_directory, exist_ok=True)

# Every part receives `split_size` bytes; the final part additionally takes
# the remainder so no trailing bytes are lost when the size is not divisible.
total_size = os.path.getsize(input_file_path)
split_size = total_size // num_parts

with open(input_file_path, 'rb') as f_in:
    for part_num in range(num_parts):
        part_path = os.path.join(output_directory, f'part_{part_num + 1}.pkl')
        is_last_part = part_num == num_parts - 1
        bytes_left = total_size - split_size * part_num if is_last_part else split_size
        with open(part_path, 'wb') as f_out:
            # shutil.copyfileobj(f_in, f_out, n) treats n as a *buffer size*,
            # not a byte limit, so it would copy the whole file into part 1
            # and leave the other parts empty. Copy a bounded byte count instead.
            while bytes_left > 0:
                chunk = f_in.read(min(copy_chunk_size, bytes_left))
                if not chunk:
                    # Unexpected EOF (file shrank while reading): stop this part.
                    break
                f_out.write(chunk)
                bytes_left -= len(chunk)

print('Model file split into parts.')


Model file split into parts.


In [2]:
# Use this shell command to combine the parts (run it inside split_model_parts/):

#cat part_1.pkl part_2.pkl part_3.pkl > combined_modelCESU6.pkl



Model file parts combined.
