diff --git a/models.py b/models.py index 3fe61b4..2967903 100644 --- a/models.py +++ b/models.py @@ -894,7 +894,7 @@ class PoolFormerBlock(nn.Module): self.norm1 = norm_layer(dim) #self.token_mixer = Pooling(pool_size=pool_size) # self.token_mixer = FNetBlock() - self.window_size = 8 + self.window_size = 4 self.attn_mask = None self.token_mixer = WindowAttention(dim=dim, window_size=to_2tuple(self.window_size), num_heads=4) self.norm2 = norm_layer(dim)