You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
reasoning_steps=2, # N in the paper - the number of forward evals for the last network (highest hierarchy) above
73
74
relative_period: int|tuple[int, ...] =2, # the relative period for each network evaluation call to the one just previous - in the paper, they do 2 networks with a period of 2
75
+
min_reasoning_steps=1,
76
+
max_reasoning_steps=10,
74
77
ignore_index=-1
75
78
):
76
79
super().__init__()
@@ -124,6 +127,18 @@ def __init__(
124
127
125
128
self.to_pred=Linear(dim, num_tokens, bias=False)
126
129
130
+
# Q(continue|halt) for their adaptive computation time setup
0 commit comments