How does torch.fx work with activation checkpointing?

Frank_Leeeee · May 30, 2022, 9:51am

I am wondering how we can use torch.utils.checkpoint together with torch.fx.

A simple example is given below:

import torch
import torch.nn as nn
import torch.fx as fx
from torch.utils.checkpoint import checkpoint

class MyModule(torch.nn.Module):
    """Small three-layer block: one shared linear layer feeding two parallel linears.

    The two parallel outputs are summed and the result is transposed
    (dimensions 1 and 0 swapped) before being returned.
    """

    def __init__(self):
        super().__init__()
        # Submodules are registered in this order; all map 2 features -> 2 features.
        self.linear1 = torch.nn.Linear(2, 2)
        self.linear2 = torch.nn.Linear(2, 2)
        self.linear3 = torch.nn.Linear(2, 2)

    def _transform(self, x):
        """Return ``x`` with dimensions 1 and 0 swapped."""
        swapped = x.transpose(1, 0)
        return swapped

    def forward(self, x):
        """Apply ``linear1``, sum the ``linear2``/``linear3`` branches, then transpose."""
        hidden = self.linear1(x)
        left_branch = self.linear2(hidden)
        right_branch = self.linear3(hidden)
        return self._transform(left_branch + right_branch)
    
class NestedModule(torch.nn.Module):
    """Wraps a ``MyModule`` whose forward is run through ``checkpoint``, followed by a linear layer."""

    def __init__(self):
        super().__init__()
        self.my_mod = MyModule()
        self.linear4 = torch.nn.Linear(2, 2)

    def forward(self, x):
        """Run ``my_mod`` via ``torch.utils.checkpoint.checkpoint``, then apply ``linear4``."""
        checkpointed = checkpoint(self.my_mod, x)
        projected = self.linear4(checkpointed)
        return projected
    
# Instantiate the model and symbolically trace it with torch.fx.
nested_mod = NestedModule()
gm = fx.symbolic_trace(nested_mod)
# Regenerate the traced module's Python code from its graph, then print the module
# (the printed forward code is what is being inspected here).
gm.recompile()
print(gm)

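The generated code ignores the checkpoint logic: the `checkpoint` call does not appear in the traced `forward`, and the layers of `my_mod` are called directly instead.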

def forward(self, x):
    my_mod_linear1 = self.my_mod.linear1(x);  x = None
    my_mod_linear2 = self.my_mod.linear2(my_mod_linear1)
    my_mod_linear3 = self.my_mod.linear3(my_mod_linear1);  my_mod_linear1 = None
    add = my_mod_linear2 + my_mod_linear3;  my_mod_linear2 = my_mod_linear3 = None
    transpose = add.transpose(1, 0);  add = None
    linear4 = self.linear4(transpose);  transpose = None
    return linear4

Radulescu_Petru · February 12, 2025, 8:24pm

@Frank_Leeeee Did you manage to find something that works?

Frank_Leeeee · February 13, 2025, 3:38am

Hi, I ended up writing my own codegen.

github.com/hpcaitech/ColossalAI

colossalai/fx/codegen/activation_checkpoint_codegen.py

main

from typing import Any, Dict, Iterable, List, Tuple

import torch

import colossalai

try:
    from torch.fx.graph import (
        CodeGen,
        PythonCode,
        _custom_builtins,
        _CustomBuiltin,
        _format_target,
        _is_from_torch,
        _Namespace,
        _origin_type_map,
        inplace_methods,
        magic_methods,
    )
    from torch.fx.node import Argument, Node, _get_qualified_name, _type_repr, map_arg

This file has been truncated. show original