From d93cd84ccdb338572fe978c08bd95ca93bee11cc Mon Sep 17 00:00:00 2001
From: Phil Wang
Date: Thu, 31 Mar 2022 15:22:24 -0700
Subject: [PATCH] let windowed tokens exchange information across heads a la talking heads prior to pointwise attention in sep-vit

---
 setup.py               | 2 +-
 vit_pytorch/sep_vit.py | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/setup.py b/setup.py
index 2e8a2a2..df44508 100644
--- a/setup.py
+++ b/setup.py
@@ -3,7 +3,7 @@ from setuptools import setup, find_packages
 setup(
   name = 'vit-pytorch',
   packages = find_packages(exclude=['examples']),
-  version = '0.32.1',
+  version = '0.32.2',
   license='MIT',
   description = 'Vision Transformer (ViT) - Pytorch',
   author = 'Phil Wang',
diff --git a/vit_pytorch/sep_vit.py b/vit_pytorch/sep_vit.py
index 0750609..4b16270 100644
--- a/vit_pytorch/sep_vit.py
+++ b/vit_pytorch/sep_vit.py
@@ -103,7 +103,7 @@ class DSSA(nn.Module):
             nn.LayerNorm(dim_head),
             nn.GELU(),
             Rearrange('b h n c -> b (h c) n'),
-            nn.Conv1d(inner_dim, inner_dim * 2, 1, groups = heads),
+            nn.Conv1d(inner_dim, inner_dim * 2, 1),
             Rearrange('b (h c) n -> b h n c', h = heads),
         )
 