# pytorch profile with tensorboard

ref: [PyTorch Profiler With TensorBoard — PyTorch Tutorials 1.13.1+cu117 documentation](https://pytorch.org/tutorials/intermediate/tensorboard_profiler_tutorial.html)

``` python
pip install tensorboard
pip install torch_tb_profiler
tensorboard --logdir=./log
```

In [21]:
import torch
import torch.nn
import torch.optim
import torch.profiler
import torch.utils.data
import torchvision.datasets
import torchvision.models
import torchvision.transforms as T

In [22]:
transform = T.Compose(
    [T.Resize(224),
     T.ToTensor(),
     T.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))])
train_set = torchvision.datasets.CIFAR10(root='./data', train=True, download=True, transform=transform)
train_loader = torch.utils.data.DataLoader(train_set, batch_size=32, shuffle=True)

Files already downloaded and verified


In [23]:
device = torch.device("cuda:0")
model = torchvision.models.resnet18(pretrained=True).cuda(device)
criterion = torch.nn.CrossEntropyLoss().cuda(device)
optimizer = torch.optim.SGD(model.parameters(), lr=0.001, momentum=0.9)
model.train()



ResNet(
  (conv1): Conv2d(3, 64, kernel_size=(7, 7), stride=(2, 2), padding=(3, 3), bias=False)
  (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (relu): ReLU(inplace=True)
  (maxpool): MaxPool2d(kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)
  (layer1): Sequential(
    (0): BasicBlock(
      (conv1): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
      (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (relu): ReLU(inplace=True)
      (conv2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
      (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    )
    (1): BasicBlock(
      (conv1): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
      (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (relu): ReLU(inplace=True)
  

In [24]:
def train(data):
    inputs, labels = data[0].to(device=device), data[1].to(device=device)
    print(inputs.shape)
    outputs = model(inputs)
    loss = criterion(outputs, labels)
    optimizer.zero_grad()
    loss.backward()
    optimizer.step()

In [25]:
with torch.profiler.profile(
        schedule=torch.profiler.schedule(wait=1, warmup=1, active=3, repeat=2),
        on_trace_ready=torch.profiler.tensorboard_trace_handler('./log/resnet18'),
        record_shapes=True,
        profile_memory=True,
        with_stack=True
) as prof:
    for step, batch_data in enumerate(train_loader):
        if step >= (1 + 1 + 3) * 2:
            break
        train(batch_data)
        prof.step()  # Need to call this at the end of each step to notify profiler of steps' boundary.

torch.Size([32, 3, 224, 224])
torch.Size([32, 3, 224, 224])


STAGE:2023-02-21 07:07:08 1222713:1222713 ActivityProfilerController.cpp:294] Completed Stage: Warm Up


torch.Size([32, 3, 224, 224])
torch.Size([32, 3, 224, 224])
torch.Size([32, 3, 224, 224])


STAGE:2023-02-21 07:07:08 1222713:1222713 ActivityProfilerController.cpp:300] Completed Stage: Collection
STAGE:2023-02-21 07:07:10 1222713:1222713 output_json.cpp:417] Completed Stage: Post Processing


torch.Size([32, 3, 224, 224])
torch.Size([32, 3, 224, 224])


STAGE:2023-02-21 07:07:10 1222713:1222713 ActivityProfilerController.cpp:294] Completed Stage: Warm Up


torch.Size([32, 3, 224, 224])
torch.Size([32, 3, 224, 224])
torch.Size([32, 3, 224, 224])


STAGE:2023-02-21 07:07:11 1222713:1222713 ActivityProfilerController.cpp:300] Completed Stage: Collection
STAGE:2023-02-21 07:07:13 1222713:1222713 output_json.cpp:417] Completed Stage: Post Processing


In [26]:

from torch.utils.tensorboard import SummaryWriter
# from torchsummary import summary
# summary(model, input_size=(3, 224, 224))
writer=SummaryWriter('./log')
img = torch.rand([32, 3, 224, 224], dtype=torch.float32).to(device=device)
writer.add_graph(model, input_to_model=img)