In [1]:
import torch
import torch.nn as nn
import torch.optim as optim
from torch.utils.data import Dataset, DataLoader

In [2]:
load = torch.load(r'/home/smitesh22/Data/DEM_slope_tensorv2.pt')

In [3]:
class DEM_Dataset(Dataset):
    def __init__(self, data):
        self.filename = list(data.keys())
        self.data = data
        
    def __len__(self):
        return len(self.filename)
    
    def __getitem__(self, index):
        filename = self.filename[index]
        data = self.data[filename]
        return data

In [4]:
data = DEM_Dataset(load)

In [5]:
data_loader = DataLoader(data, batch_size=2, shuffle=True)

In [6]:
class AutoEncoder(nn.Module):
    def __init__(self):
        
        super().__init__()
        
        self.encoder = nn.Sequential( # input : 3601*3601
            nn.Conv2d(1, 32, kernel_size=(15, 15), stride=4, padding=1),
            nn.ReLU(),
            nn.Conv2d(32, 64, kernel_size=(8, 8), stride=4, padding=1),
            nn.ReLU(),
            nn.Conv2d(64, 128, kernel_size=(4, 4), stride=2, padding=1),
            nn.ReLU(),
            nn.Conv2d(128, 128, kernel_size=(4, 4), stride=2, padding=1),
            nn.ReLU(),
            
        )
        
        self.decoder = nn.Sequential(
            nn.ConvTranspose2d(128, 128, kernel_size=(4, 4), stride=2, padding=1, output_padding=0),
            nn.ReLU(),
            nn.ConvTranspose2d(128, 64, kernel_size=(4, 4), stride=2, padding=1, output_padding=0),
            nn.ReLU(),
            nn.ConvTranspose2d(64, 32, kernel_size=(8, 8), stride=4, padding=1, output_padding=0),
            nn.ReLU(),
            nn.ConvTranspose2d(32, 1, kernel_size=(15, 15), stride=4, padding=1, output_padding=0),
            nn.Sigmoid(),  # Output is between 0 and 1
        )
        
    def forward(self, x):
        x = self.encoder(x)
        x = self.decoder(x)
        return x
            

        
        
        
    def dimensions(self, x):
        print(f"----------ENCODER----------")
        print(f"Input shape : {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.encoder[0](x)
        print(f"After 1st Conv2d: {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.encoder[1](x)
        print(f"After 1st ReLU: {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.encoder[2](x)
        print(f"After 2nd Conv2d: {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.encoder[3](x)
        print(f"After 2nd ReLU: {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.encoder[4](x)
        print(f"After 3rd Conv2d: {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.encoder[5](x)
        print(f"After 3rd ReLU: {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.encoder[5](x)
        print(f"After 4th Conv2d: {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.encoder[6](x)
        print(f"After 4th ReLU: {x.shape[1], x.shape[2], x.shape[3]}")
        
        print("---------DECODER------------")
        x= self.decoder[0](x)
        print(f"After 1st Transpose: {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.decoder[1](x)
        print(f"After 1st ReLU: {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.decoder[2](x)
        print(f"After 2nd Transpose: {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.decoder[3](x)
        print(f"After 2nd ReLU: {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.decoder[4](x)
        print(f"After 3rd Transpose: {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.decoder[5](x)
        print(f"After 3rd ReLU: {x.shape[1], x.shape[2], x.shape[3]}")
        x = self.decoder[6](x)
        print(f"Decoder output : {x.shape[1], x.shape[2], x.shape[3]}")

In [7]:
model = AutoEncoder()

In [8]:
dummy_input = torch.randn(5, 1, 3601, 3601)

In [9]:
model.dimensions(dummy_input)

----------ENCODER----------
Input shape : (1, 3601, 3601)
After 1st Conv2d: (32, 898, 898)
After 1st ReLU: (32, 898, 898)
After 2nd Conv2d: (64, 224, 224)
After 2nd ReLU: (64, 224, 224)
After 3rd Conv2d: (128, 112, 112)
After 3rd ReLU: (128, 112, 112)
After 4th Conv2d: (128, 112, 112)
After 4th ReLU: (128, 56, 56)
---------DECODER------------
After 1st Transpose: (128, 112, 112)
After 1st ReLU: (128, 112, 112)
After 2nd Transpose: (64, 224, 224)
After 2nd ReLU: (64, 224, 224)
After 3rd Transpose: (32, 898, 898)
After 3rd ReLU: (32, 898, 898)
Decoder output : (1, 3601, 3601)


In [None]:
criterion = nn.MSELoss()
optimizer = optim.Adam(model.parameters(), lr=0.001)

num_epochs = 10  # Set the number of training epochs
for epoch in range(num_epochs):
    model.train()
    for batch_idx, batch_data in enumerate(data_loader):
        # Move the batch data to the GPU if available
        optimizer.zero_grad()
        outputs = model(batch_data)
        loss = criterion(outputs, batch_data)
        loss.backward()
        optimizer.step()
        
        if batch_idx % 10 == 0:
            print(f"Epoch {epoch+1}/{num_epochs}, Batch {batch_idx}/{len(data_loader)}, Loss: {loss.item():.4f}")
