Source code for towhee.models.utils.window_partition3d

# original code from https://github.com/SwinTransformer/Video-Swin-Transformer
# modified by Zilliz.

from functools import reduce
from operator import mul


[docs]def window_partition(x, window_size):
    """
    Args:
        x (`torch.Tensor`):
            Tensor with size of (b, d, h, w, c). b is batch size. d is time dimension size. h and w is frame size.
            c is channel size.
        window_size (`tuple[int]`):
            3d window size
    Returns:
        windows (`torch.Tensor`):
            Window partitioned tensor with size (B*num_windows, window_size*window_size, C)
    """
    b, d, h, w, c = x.shape
    x = x.view(b, d // window_size[0], window_size[0],
               h // window_size[1], window_size[1], w // window_size[2], window_size[2], c)
    windows = x.permute(0, 1, 3, 5, 2, 4, 6, 7).contiguous().view(-1, reduce(mul, window_size), c)
    return windows