For the base model we will use VGG16 from Keras Applications and fine-tune it.

In [1]:
# Show the working directory before changing it.
%pwd
import os 
# Switch the kernel's working directory to the project checkout.
# NOTE(review): this is an absolute, machine-specific Windows path; the notebook will not
# run elsewhere until it is edited — consider deriving it from a configurable location.
os.chdir(r"c:\vs\ml\chest-cancer-classification-using-mlflow-dvc")
# Show the working directory again to confirm the change took effect.
%pwd

'c:\\vs\\ml\\chest-cancer-classification-using-mlflow-dvc'

In [2]:
import sys
from pathlib import Path

# Add the project's src directory to the Python path so project packages can be imported.
# NOTE(review): the path is absolute and machine-specific; adjust it for other checkouts.
project_root = Path(r"c:\vs\ml\chest-cancer-classification-using-mlflow-dvc\src")
# Guard the append so re-running this cell does not pile up duplicate sys.path entries.
if str(project_root) not in sys.path:
    sys.path.append(str(project_root))

I switched the optimizer from SGD to Adam for better results.

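Unfroze the last 4 VGG16 layers (freeze_till=4) so they train together with the new head. The original estimate was ~3-4M trainable parameters; the run at the end of this notebook reports 13,503,236 trainable parameters in total.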

Added intermediate Dense layer (256 units) - Better feature learning

Added Dropout layers (0.5 and 0.3) - Prevents overfitting

In [8]:
#entity
from dataclasses import dataclass
from pathlib import Path

@dataclass(frozen=True)
class PrepareBaseModelConfig:
    """Immutable settings bundle for the prepare-base-model stage.

    The three path fields locate the stage's artifacts; the ``params_*`` fields
    carry the model hyperparameters. Instances are frozen, so fields cannot be
    reassigned after construction.
    """

    # --- artifact locations ---
    root_dir: Path                  # directory belonging to this stage
    base_model_path: Path           # where the base model is saved
    updated_base_model_path: Path   # where the model with the new head is saved

    # --- model hyperparameters ---
    params_image_size: list         # input shape handed to the base network
    params_learning_rate: float     # learning rate for the optimizer
    params_include_top: bool        # whether the base network keeps its own top layers
    params_weights: str             # weights identifier for the base network
    params_classes: int             # number of output units in the final layer

In [9]:

from cnnClassifier.constants import *
from cnnClassifier.utils.common import read_yaml, create_directories

class ConfigurationManager:
    """Reads the config and params YAML files and hands out stage configurations."""

    def __init__(
        self,
        config_filepath = CONFIG_FILE_PATH,
        params_filepath = PARAMS_FILE_PATH):
        """Load both YAML files and set up the artifacts root directory.

        Args:
            config_filepath: Location of the configuration YAML
                (defaults to ``CONFIG_FILE_PATH``).
            params_filepath: Location of the parameters YAML
                (defaults to ``PARAMS_FILE_PATH``).
        """
        self.config = read_yaml(config_filepath)
        self.params = read_yaml(params_filepath)

        # The artifacts root is handed to create_directories up front, before any stage runs.
        artifacts_root = self.config.artifacts_root
        create_directories([artifacts_root])

    def get_prepare_base_model_config(self) -> PrepareBaseModelConfig:
        """Assemble the settings for the prepare-base-model stage.

        Passes the stage's root directory to ``create_directories`` and combines
        the stage's paths from the config file with the hyperparameters from the
        params file.

        Returns:
            PrepareBaseModelConfig: Paths wrapped in ``Path``; hyperparameters
            passed through as read from the params file.
        """
        stage = self.config.prepare_base_model

        create_directories([stage.root_dir])

        hyper = self.params
        return PrepareBaseModelConfig(
            root_dir=Path(stage.root_dir),
            base_model_path=Path(stage.base_model_path),
            updated_base_model_path=Path(stage.updated_base_model_path),
            params_image_size=hyper.IMAGE_SIZE,
            params_learning_rate=hyper.LEARNING_RATE,
            params_include_top=hyper.INCLUDE_TOP,
            params_weights=hyper.WEIGHTS,
            params_classes=hyper.CLASSES,
        )

In [10]:
#component
import os 
import tensorflow as tf 
import urllib.request as request
from zipfile import ZipFile
class PrepareBaseModel:
    """Builds the VGG16 base network and a classifier model stacked on top of it.

    Typical use: call ``get_base_model()`` first (it sets ``self.model``), then
    ``update_base_model()`` (it reads ``self.model`` and sets ``self.full_model``).
    Both steps save their model to the path given in the config.
    """

    def __init__(self, config: PrepareBaseModelConfig):
        """Keep a reference to the stage configuration."""
        self.config = config

    def get_base_model(self):
        """Instantiate VGG16 from the configured parameters and save it to ``base_model_path``."""
        cfg = self.config
        self.model = tf.keras.applications.vgg16.VGG16(
            input_shape=cfg.params_image_size,
            weights=cfg.params_weights,
            include_top=cfg.params_include_top,
        )

        self.save_model(path=cfg.base_model_path, model=self.model)

    @staticmethod
    def _prepare_full_model(model, classes, freeze_all, freeze_till, learning_rate):
        """Attach a classification head to ``model`` and compile the result.

        Args:
            model: Base Keras model whose output feeds the new head.
            classes: Number of units in the final softmax layer.
            freeze_all: When truthy, the whole base model is made non-trainable.
            freeze_till: When ``freeze_all`` is falsy and this is a positive
                number, every base layer except the last ``freeze_till`` is
                frozen. ``None`` or a non-positive value leaves all base layers
                trainable.
            learning_rate: Learning rate given to the Adam optimizer.

        Returns:
            The compiled model (base model plus new head).
        """
        # Model-wide switch first: everything off when freeze_all is set, otherwise everything on.
        model.trainable = not freeze_all

        # Partial fine-tuning: re-freeze all but the trailing `freeze_till` layers.
        partial_finetune = (
            (not freeze_all) and (freeze_till is not None) and (freeze_till > 0)
        )
        if partial_finetune:
            for frozen_layer in model.layers[:-freeze_till]:
                frozen_layer.trainable = False

        # Classification head: flatten -> dropout -> dense(256, relu) -> dropout -> softmax.
        keras_layers = tf.keras.layers
        features = keras_layers.Flatten()(model.output)
        features = keras_layers.Dropout(0.5)(features)
        features = keras_layers.Dense(units=256, activation="relu")(features)
        features = keras_layers.Dropout(0.3)(features)
        class_probs = keras_layers.Dense(units=classes, activation="softmax")(features)

        full_model = tf.keras.models.Model(inputs=model.input, outputs=class_probs)

        # Adam optimizer with categorical cross-entropy, tracking accuracy.
        adam = tf.keras.optimizers.Adam(learning_rate=learning_rate)
        cross_entropy = tf.keras.losses.CategoricalCrossentropy()
        full_model.compile(optimizer=adam, loss=cross_entropy, metrics=["accuracy"])

        full_model.summary()

        def _param_total(weights):
            # Sum of element counts over the given weight tensors.
            return sum([tf.size(w).numpy() for w in weights])

        # Report how many parameters will and will not be updated during training.
        trainable_params = _param_total(full_model.trainable_weights)
        non_trainable_params = _param_total(full_model.non_trainable_weights)
        banner = '='*60
        print(f"\n{banner}")
        print(f"Trainable parameters: {trainable_params:,}")
        print(f"Non-trainable parameters: {non_trainable_params:,}")
        print(f"{banner}\n")

        return full_model

    def update_base_model(self):
        """Build the full model from ``self.model`` and save it to ``updated_base_model_path``.

        The last 4 layers of the base model are left trainable
        (``freeze_all=False``, ``freeze_till=4``).
        """
        cfg = self.config
        self.full_model = self._prepare_full_model(
            model=self.model,
            classes=cfg.params_classes,
            freeze_all=False,
            freeze_till=4,
            learning_rate=cfg.params_learning_rate,
        )

        self.save_model(path=cfg.updated_base_model_path, model=self.full_model)

    @staticmethod
    def save_model(path: Path, model: tf.keras.Model):
        """Save ``model`` to ``path`` via the model's own ``save`` method."""
        model.save(path)


In [11]:
# Run the stage end to end: load the configuration, build and save the base model,
# then build and save the updated model with the new classification head.
# No try/except wrapper is used: catching an exception only to re-raise it adds nothing,
# so any error simply propagates with its traceback.
config = ConfigurationManager()
prepare_base_model_config = config.get_prepare_base_model_config()
prepare_base_model = PrepareBaseModel(config=prepare_base_model_config)
prepare_base_model.get_base_model()
prepare_base_model.update_base_model()

[2025-10-04 02:44:17,301: INFO: common: yaml file: config\config.yaml loaded successfully]
[2025-10-04 02:44:17,317: INFO: common: yaml file: params.yaml loaded successfully]
[2025-10-04 02:44:17,323: INFO: common: created directory at: artifacts]
[2025-10-04 02:44:17,327: INFO: common: created directory at: artifacts/prepare_base_model]



Trainable parameters: 13,503,236
Non-trainable parameters: 7,635,264

