Skip to content

Commit 719048d

Browse files
committed
some better defaults for scalable vit
1 parent d27721a commit 719048d

File tree

2 files changed, with 15 additions and 15 deletions.

setup.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@
  setup(
  name = 'vit-pytorch',
  packages = find_packages(exclude=['examples']),
- version = '0.28.0',
+ version = '0.28.1',
  license='MIT',
  description = 'Vision Transformer (ViT) - Pytorch',
  author = 'Phil Wang',

vit_pytorch/scalable_vit.py

Lines changed: 14 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -81,8 +81,8 @@ def __init__(
  self,
  dim,
  heads = 8,
- dim_key = 64,
- dim_value = 64,
+ dim_key = 32,
+ dim_value = 32,
  dropout = 0.,
  reduction_factor = 1
  ):
@@ -132,8 +132,8 @@ def __init__(
  dim,
  window_size,
  heads = 8,
- dim_key = 64,
- dim_value = 64,
+ dim_key = 32,
+ dim_value = 32,
  dropout = 0.
  ):
  super().__init__()
@@ -199,12 +199,12 @@ def __init__(
  heads = 8,
  ff_expansion_factor = 4,
  dropout = 0.,
- ssa_dim_key = 64,
- ssa_dim_value = 64,
+ ssa_dim_key = 32,
+ ssa_dim_value = 32,
  ssa_reduction_factor = 1,
- iwsa_dim_key = 64,
- iwsa_dim_value = 64,
- iwsa_window_size = 64,
+ iwsa_dim_key = 32,
+ iwsa_dim_value = 32,
+ iwsa_window_size = None,
  norm_output = True
  ):
  super().__init__()
@@ -244,12 +244,12 @@ def __init__(
  depth,
  heads,
  reduction_factor,
+ window_size = None,
+ iwsa_dim_key = 32,
+ iwsa_dim_value = 32,
+ ssa_dim_key = 32,
+ ssa_dim_value = 32,
  ff_expansion_factor = 4,
- iwsa_dim_key = 64,
- iwsa_dim_value = 64,
- window_size = 64,
- ssa_dim_key = 64,
- ssa_dim_value = 64,
  channels = 3,
  dropout = 0.
  ):

0 commit comments

Comments
 (0)