In [1]:
import os

In [2]:
# Step up one directory level; presumably this moves from the notebook's folder to the
# project root so that relative paths such as config/config.yaml and params.yaml resolve.
# NOTE(review): not idempotent - re-running this cell moves up one more level each time,
# so run it exactly once per kernel session.
os.chdir("../")

In [3]:
%pwd

'c:\\Users\\ben jazia\\OneDrive\\Documents\\GitHub\\Chicken-Disease-MLOps project\\Chicken-Disease-Classification-Project'

In [4]:
from dataclasses import dataclass
from pathlib import Path


@dataclass(frozen=True)
class PrepareBaseModelConfig:
    """Immutable settings for the "prepare base model" pipeline stage.

    The path fields are filled from the ``prepare_base_model`` section of the
    config file and the ``params_*`` fields from the params file (see
    ``ConfigurationManager.get_prepare_base_model_config``).
    """
    # Directory created for this stage before the config object is built.
    root_dir: Path
    # Destination of the untouched VGG16 model saved by get_base_model().
    base_model_path: Path
    # Destination of the model with the new classification head (update_base_model()).
    updated_base_model_path: Path
    # Passed to VGG16 as ``input_shape``.
    params_image_size: list
    # Learning rate handed to the SGD optimizer when the full model is compiled.
    params_learning_rate: float
    # Passed to VGG16 as ``include_top``.
    params_include_top: bool
    # Passed to VGG16 as ``weights``.
    params_weights: str
    # Number of units in the final softmax Dense layer.
    params_classes: int

In [5]:
from cnnChickenDiseaseClassifier.constants import *
from cnnChickenDiseaseClassifier.utils.common import read_yaml, create_directories

### Now, the ConfigurationManager class
In a clean design, you only have one ConfigurationManager class in your project (in src/.../config/configuration.py).

That class knows how to read both:
config.yaml (for paths & artifacts)
params.yaml (for hyperparameters)

At the data ingestion stage, we only needed get_data_ingestion_config(), so we showed just that method.
At the base model stage, we expanded the same class to also include get_prepare_base_model_config().

So what looks like “two classes” is actually the same file/class evolving as we add new stages. Our ConfigurationManager will eventually have multiple methods, one per pipeline stage

so in config/configuration.py, we will just copy the get_prepare_base_model_config method.

In [None]:
class ConfigurationManager:
    """Single entry point for the project's YAML-driven settings.

    Reads the config file (paths & artifacts) and the params file
    (hyperparameters) once, then exposes one ``get_*_config`` method per
    pipeline stage.
    """

    # NOTE: __init__ is unchanged from the data-ingestion stage. It is repeated here only
    # so the notebook is self-contained; the real work of this stage is the new
    # get_prepare_base_model_config method below.
    def __init__(
        self,
        config_filepath = CONFIG_FILE_PATH,
        params_filepath = PARAMS_FILE_PATH):
        """Load both YAML files and create the artifacts root directory."""
        self.config = read_yaml(config_filepath)
        self.params = read_yaml(params_filepath)
        create_directories([self.config.artifacts_root])

    def get_prepare_base_model_config(self) -> PrepareBaseModelConfig:
        """Build the settings object for the "prepare base model" stage.

        Creates the stage's root directory as a side effect, then combines the
        stage paths from the config file with the hyperparameters from the
        params file.
        """
        stage = self.config.prepare_base_model
        hyperparams = self.params

        # The stage directory must exist before any model file is written into it.
        create_directories([stage.root_dir])

        return PrepareBaseModelConfig(
            root_dir=Path(stage.root_dir),
            base_model_path=Path(stage.base_model_path),
            updated_base_model_path=Path(stage.updated_base_model_path),
            params_image_size=hyperparams.IMAGE_SIZE,
            params_learning_rate=hyperparams.LEARNING_RATE,
            params_include_top=hyperparams.INCLUDE_TOP,
            params_weights=hyperparams.WEIGHTS,
            params_classes=hyperparams.CLASSES,
        )

In [8]:
import os
import urllib.request as request
from zipfile import ZipFile
import tensorflow as tf

In [None]:

# the component
class PrepareBaseModel:
    """Pipeline component that prepares the VGG16 model for transfer learning.

    ``get_base_model`` instantiates and saves the VGG16 base model;
    ``update_base_model`` attaches a new softmax classification head to it,
    compiles the result and saves it as well.
    """

    def __init__(self, config: PrepareBaseModelConfig):
        """Store the stage configuration (model paths, image size, learning rate, ...)."""
        self.config = config

    def get_base_model(self):
        """Instantiate VGG16 from Keras Applications and save it to ``base_model_path``.

        Image size, weights and whether to keep the original classification head
        all come from the configuration. The model is kept on ``self.model`` for
        ``update_base_model``.
        """
        self.model = tf.keras.applications.vgg16.VGG16(
            input_shape=self.config.params_image_size,
            weights=self.config.params_weights,
            include_top=self.config.params_include_top
        )

        self.save_model(path=self.config.base_model_path, model=self.model)

    @staticmethod  # uses only its arguments, so no instance is needed
    def _prepare_full_model(model, classes, freeze_all, freeze_till, learning_rate):
        """Attach a softmax head to ``model``, freeze layers as requested and compile.

        Args:
            model: Keras model used as the feature extractor.
            classes: Number of units of the final softmax Dense layer.
            freeze_all: If truthy, every layer of ``model`` is made non-trainable.
            freeze_till: Used only when ``freeze_all`` is falsy. If a positive
                integer, all layers except the last ``freeze_till`` ones are
                frozen; ``None`` or a non-positive value freezes nothing.
            learning_rate: Learning rate for the SGD optimizer.

        Returns:
            The compiled model (categorical cross-entropy loss, accuracy metric).
            Its summary is printed as a side effect.
        """
        if freeze_all:
            # Setting ``trainable`` on the model propagates to all of its layers,
            # so a single assignment is enough.
            model.trainable = False
        elif (freeze_till is not None) and (freeze_till > 0):
            # Freeze each layer individually. Assigning to ``model.trainable``
            # here would freeze the whole model, including the last
            # ``freeze_till`` layers that are meant to stay trainable.
            for layer in model.layers[:-freeze_till]:
                layer.trainable = False

        # Flatten the base model's output so it can feed a Dense layer.
        flatten_in = tf.keras.layers.Flatten()(model.output)
        # New classification head: one softmax unit per class.
        prediction = tf.keras.layers.Dense(
            units=classes,
            activation="softmax"
        )(flatten_in)

        full_model = tf.keras.models.Model(
            inputs=model.input,
            outputs=prediction
        )

        full_model.compile(
            optimizer=tf.keras.optimizers.SGD(learning_rate=learning_rate),
            loss=tf.keras.losses.CategoricalCrossentropy(),
            metrics=["accuracy"]
        )

        full_model.summary()
        return full_model

    def update_base_model(self):
        """Build the full model on top of a fully frozen base and save it.

        Requires ``get_base_model`` to have been called first, because it reads
        ``self.model``. The result is kept on ``self.full_model`` and written to
        ``updated_base_model_path``.
        """
        self.full_model = self._prepare_full_model(
            model=self.model,
            classes=self.config.params_classes,
            freeze_all=True,
            freeze_till=None,
            learning_rate=self.config.params_learning_rate
        )

        self.save_model(path=self.config.updated_base_model_path, model=self.full_model)

    @staticmethod
    def save_model(path: Path, model: tf.keras.Model):
        """Save ``model`` to ``path`` using ``model.save``."""
        model.save(path)

In [10]:

# Run the stage end to end: load the configuration, build and save the VGG16 base
# model, then attach the new classification head and save the updated model.
# Any exception propagates unchanged; the former ``try/except ... raise e`` wrapper
# only re-raised the same exception and added nothing.
config = ConfigurationManager()
prepare_base_model_config = config.get_prepare_base_model_config()
prepare_base_model = PrepareBaseModel(config=prepare_base_model_config)
prepare_base_model.get_base_model()
prepare_base_model.update_base_model()

[2025-09-11 15:07:50,090: INFO: common: yaml file: config\config.yaml loaded successfully]
[2025-09-11 15:07:50,105: INFO: common: yaml file: params.yaml loaded successfully]
[2025-09-11 15:07:50,107: INFO: common: created directory at: artifacts]
[2025-09-11 15:07:50,109: INFO: common: created directory at: artifacts/prepare_base_model]
Downloading data from https://storage.googleapis.com/tensorflow/keras-applications/vgg16/vgg16_weights_tf_dim_ordering_tf_kernels_notop.h5
[1m58889256/58889256[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m351s[0m 6us/step


