We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 72faca1 commit 1474331 (Copy full SHA for 1474331)
timm/models/dependencyvit.py
@@ -48,7 +48,7 @@ def __init__(
48
self.scale = self.head_dim ** -0.5
49
self.track_dependency_mask = False
50
self.dependency_mask = None
51
- self.head_selector_temperature = 0.1 # appendix D.1, causes nan when 0.1, 0 when 10.0
+ self.head_selector_temperature = 1.0 # appendix D.1, causes nan when 0.1, 0 when 10.0
52
53
self.head_selector = nn.Linear(dim, num_heads)
54
0 commit comments