pytorch3d/files/implicitron_config_system.py


# coding: utf-8

# In[ ]:


# Copyright (c) Meta Platforms, Inc. and affiliates. All rights reserved.


# # Implicitron's config system

# Implicitron's components are all based on a unified hierarchical configuration system.
# This allows configurable variables and all defaults to be defined separately for each new component.
# All configs relevant to an experiment are then automatically composed into a single configuration file that fully specifies the experiment.
# An especially important feature is extension points where users can insert their own sub-classes of Implicitron's base components.
#
# The file which defines this system is [here](https://github.com/facebookresearch/pytorch3d/blob/main/pytorch3d/implicitron/tools/config.py) in the PyTorch3D repo.
# The Implicitron volumes tutorial contains a simple example of using the config system.
# This tutorial provides detailed hands-on experience in using and modifying Implicitron's configurable components.
#

# ## 0. Install and import modules
#
# Ensure `torch` and `torchvision` are installed. If `pytorch3d` is not installed, install it using the following cell:

# In[ ]:


import os
import sys
import torch
need_pytorch3d=False
try:
    import pytorch3d
except ModuleNotFoundError:
    need_pytorch3d=True
if need_pytorch3d:
    if torch.__version__.startswith("2.2.") and sys.platform.startswith("linux"):
        # We try to install PyTorch3D via a released wheel.
        pyt_version_str=torch.__version__.split("+")[0].replace(".", "")
        version_str="".join([
            f"py3{sys.version_info.minor}_cu",
            torch.version.cuda.replace(".",""),
            f"_pyt{pyt_version_str}"
        ])
        get_ipython().system('pip install fvcore iopath')
        get_ipython().system('pip install --no-index --no-cache-dir pytorch3d -f https://dl.fbaipublicfiles.com/pytorch3d/packaging/wheels/{version_str}/download.html')
    else:
        # We try to install PyTorch3D from source.
        get_ipython().system("pip install 'git+https://github.com/facebookresearch/pytorch3d.git@stable'")


# Ensure omegaconf is installed. If not, run this cell. (It should not be necessary to restart the runtime.)

# In[ ]:


get_ipython().system('pip install omegaconf')


# In[ ]:


from dataclasses import dataclass
from typing import Optional, Tuple

import torch
from omegaconf import DictConfig, OmegaConf
from pytorch3d.implicitron.tools.config import (
    Configurable,
    ReplaceableBase,
    expand_args_fields,
    get_default_args,
    registry,
    run_auto_creation,
)


# ## 1. Introducing dataclasses
#
# [Type hints](https://docs.python.org/3/library/typing.html) give a taxonomy of types in Python. [Dataclasses](https://docs.python.org/3/library/dataclasses.html) let you create a class based on a list of members which have names, types and possibly default values. The `__init__` function is created automatically, and calls a `__post_init__` function if present as a final step. For example

# In[ ]:


@dataclass
class MyDataclass:
    a: int
    b: int = 8
    c: Optional[Tuple[int, ...]] = None

    def __post_init__(self):
        print(f"created with a = {self.a}")
        self.d = 2 * self.b


# In[ ]:


my_dataclass_instance = MyDataclass(a=18)
assert my_dataclass_instance.d == 16


# 👷 Note that the `dataclass` decorator here is function which modifies the definition of the class itself.
# It runs immediately after the definition.
# Our config system requires that implicitron library code contains classes whose modified versions need to be aware of user-defined implementations.
# Therefore we need the modification of the class to be delayed. We don't use a decorator.
#

# ## 2. Introducing omegaconf and OmegaConf.structured
#
# The [omegaconf](https://github.com/omry/omegaconf/) library provides a DictConfig class which is like a `dict` with str keys, but with extra features for ease-of-use as a configuration system.

# In[ ]:


dc = DictConfig({"a": 2, "b": True, "c": None, "d": "hello"})
assert dc.a == dc["a"] == 2


# OmegaConf has a serialization to and from yaml. The [Hydra](https://hydra.cc/) library relies on this for its configuration files.

# In[ ]:


print(OmegaConf.to_yaml(dc))
assert OmegaConf.create(OmegaConf.to_yaml(dc)) == dc


# OmegaConf.structured provides a DictConfig from a dataclass or instance of a dataclass. Unlike a normal DictConfig, it is type-checked and only known keys can be added.

# In[ ]:


structured = OmegaConf.structured(MyDataclass)
assert isinstance(structured, DictConfig)
print(structured)
print()
print(OmegaConf.to_yaml(structured))


# `structured` knows it is missing a value for `a`.

# Such an object has members compatible with the dataclass, so an initialisation can be performed as follows.

# In[ ]:


structured.a = 21
my_dataclass_instance2 = MyDataclass(**structured)
print(my_dataclass_instance2)


# You can also call OmegaConf.structured on an instance.

# In[ ]:


structured_from_instance = OmegaConf.structured(my_dataclass_instance)
my_dataclass_instance3 = MyDataclass(**structured_from_instance)
print(my_dataclass_instance3)


# ## 3. Our approach to OmegaConf.structured
#
# We provide functions which are equivalent to `OmegaConf.structured` but support more features.
# To achieve the above using our functions, the following is used.
# Note that we indicate configurable classes using a special base class `Configurable`, not a decorator.

# In[ ]:


class MyConfigurable(Configurable):
    a: int
    b: int = 8
    c: Optional[Tuple[int, ...]] = None

    def __post_init__(self):
        print(f"created with a = {self.a}")
        self.d = 2 * self.b


# In[ ]:


# The expand_args_fields function modifies the class like @dataclasses.dataclass.
# If it has not been called on a Configurable object before it has been instantiated, it will
# be called automatically.
expand_args_fields(MyConfigurable)
my_configurable_instance = MyConfigurable(a=18)
assert my_configurable_instance.d == 16


# In[ ]:


# get_default_args also calls expand_args_fields automatically
our_structured = get_default_args(MyConfigurable)
assert isinstance(our_structured, DictConfig)
print(OmegaConf.to_yaml(our_structured))


# In[ ]:


our_structured.a = 21
print(MyConfigurable(**our_structured))


# ## 4. First enhancement: nested types 🪺
#
# Our system allows Configurable classes to contain each other.
# One thing to remember: add a call to `run_auto_creation` in `__post_init__`.

# In[ ]:


class Inner(Configurable):
    a: int = 8
    b: bool = True
    c: Tuple[int, ...] = (2, 3, 4, 6)


class Outer(Configurable):
    inner: Inner
    x: str = "hello"
    xx: bool = False

    def __post_init__(self):
        run_auto_creation(self)


# In[ ]:


outer_dc = get_default_args(Outer)
print(OmegaConf.to_yaml(outer_dc))


# In[ ]:


outer = Outer(**outer_dc)
assert isinstance(outer, Outer)
assert isinstance(outer.inner, Inner)
print(vars(outer))
print(outer.inner)


# Note how inner_args is an extra member of outer. `run_auto_creation(self)` is equivalent to
# ```
#     self.inner = Inner(**self.inner_args)
# ```

# ## 5. Second enhancement: pluggable/replaceable components 🔌
#
# If a class uses `ReplaceableBase` as a base class instead of `Configurable`, we call it a replaceable.
# It indicates that it is designed for child classes to use in its place.
# We might use `NotImplementedError` to indicate functionality which subclasses are expected to implement.
# The system maintains a global `registry` containing subclasses of each ReplaceableBase.
# The subclasses register themselves with it with a decorator.
#
# A configurable class (i.e. a class which uses our system, i.e. a child of `Configurable` or `ReplaceableBase`) which contains a ReplaceableBase must also
# contain a corresponding class_type field of type `str` which indicates which concrete child class to use.

# In[ ]:


class InnerBase(ReplaceableBase):
    def say_something(self):
        raise NotImplementedError


@registry.register
class Inner1(InnerBase):
    a: int = 1
    b: str = "h"

    def say_something(self):
        print("hello from an Inner1")


@registry.register
class Inner2(InnerBase):
    a: int = 2

    def say_something(self):
        print("hello from an Inner2")


# In[ ]:


class Out(Configurable):
    inner: InnerBase
    inner_class_type: str = "Inner1"
    x: int = 19

    def __post_init__(self):
        run_auto_creation(self)

    def talk(self):
        self.inner.say_something()


# In[ ]:


Out_dc = get_default_args(Out)
print(OmegaConf.to_yaml(Out_dc))


# In[ ]:


Out_dc.inner_class_type = "Inner2"
out = Out(**Out_dc)
print(out.inner)


# In[ ]:


out.talk()


# Note in this case there are many `args` members. It is usually fine to ignore them in the code. They are needed for the config.

# In[ ]:


print(vars(out))


# ## 6. Example with torch.nn.Module  🔥
# Typically in implicitron, we use this system in combination with [`Module`](https://pytorch.org/docs/stable/generated/torch.nn.Module.html)s.
# Note in this case it is necessary to call `Module.__init__` explicitly in `__post_init__`.

# In[ ]:


class MyLinear(torch.nn.Module, Configurable):
    d_in: int = 2
    d_out: int = 200

    def __post_init__(self):
        super().__init__()
        self.linear = torch.nn.Linear(in_features=self.d_in, out_features=self.d_out)

    def forward(self, x):
        return self.linear.forward(x)


# In[ ]:


my_linear = MyLinear()
input = torch.zeros(2)
output = my_linear(input)
print("output shape:", output.shape)


# `my_linear` has all the usual features of a Module.
# E.g. it can be saved and loaded with `torch.save` and `torch.load`.
# It has parameters:

# In[ ]:


for name, value in my_linear.named_parameters():
    print(name, value.shape)


# ## 7. Example of implementing your own pluggable component
# Let's say I am using a library with `Out` like in section **5** but I want to implement my own child of InnerBase.
# All I need to do is register its definition, but I need to do this before expand_args_fields is explicitly or implicitly called on Out.

# In[ ]:


@registry.register
class UserImplementedInner(InnerBase):
    a: int = 200

    def say_something(self):
        print("hello from the user")


# At this point, we need to redefine the class Out.
# Otherwise if it has already been expanded without UserImplementedInner, then the following would not work,
# because the implementations known to a class are fixed when it is expanded.
#
# If you are running experiments from a script, the thing to remember here is that you must import your own modules, which register your own implementations,
# before you *use* the library classes.

# In[ ]:


class Out(Configurable):
    inner: InnerBase
    inner_class_type: str = "Inner1"
    x: int = 19

    def __post_init__(self):
        run_auto_creation(self)

    def talk(self):
        self.inner.say_something()


# In[ ]:


out2 = Out(inner_class_type="UserImplementedInner")
print(out2.inner)


# ## 8: Example of making a subcomponent pluggable
#
# Let's look what needs to happen if we have a subcomponent which we make pluggable, to allow users to supply their own.

# In[ ]:


class SubComponent(Configurable):
    x: float = 0.25

    def apply(self, a: float) -> float:
        return a + self.x


class LargeComponent(Configurable):
    repeats: int = 4
    subcomponent: SubComponent

    def __post_init__(self):
        run_auto_creation(self)

    def apply(self, a: float) -> float:
        for _ in range(self.repeats):
            a = self.subcomponent.apply(a)
        return a


# In[ ]:


large_component = LargeComponent()
assert large_component.apply(3) == 4
print(OmegaConf.to_yaml(LargeComponent))


# Made generic:

# In[ ]:


class SubComponentBase(ReplaceableBase):
    def apply(self, a: float) -> float:
        raise NotImplementedError


@registry.register
class SubComponent(SubComponentBase):
    x: float = 0.25

    def apply(self, a: float) -> float:
        return a + self.x


class LargeComponent(Configurable):
    repeats: int = 4
    subcomponent: SubComponentBase
    subcomponent_class_type: str = "SubComponent"

    def __post_init__(self):
        run_auto_creation(self)

    def apply(self, a: float) -> float:
        for _ in range(self.repeats):
            a = self.subcomponent.apply(a)
        return a


# In[ ]:


large_component = LargeComponent()
assert large_component.apply(3) == 4
print(OmegaConf.to_yaml(LargeComponent))


# The following things had to change:
# * The base class SubComponentBase was defined.
# * SubComponent gained a `@registry.register` decoration and had its base class changed to the new one.
# * `subcomponent_class_type` was added as a member of the outer class.
# * In any saved configuration yaml files, the key `subcomponent_args` had to be changed to `subcomponent_SubComponent_args`.

# ## Appendix: gotchas ⚠️
#
# * Omitting to define `__post_init__` or not calling `run_auto_creation` in it.
# * Omitting a type annotation on a field. For example, writing
# ```
#     subcomponent_class_type = "SubComponent"
# ```
# instead of
# ```
#     subcomponent_class_type: str = "SubComponent"
# ```
#
#