2 files changed: +0 additions, -4 deletions.
lines changed Original file line number Diff line number Diff line change @@ -249,12 +249,10 @@ def __init__(self, model_args: TransformerModelArgs):
249
249
self .register_buffer (
250
250
"expert_bias" ,
251
251
torch .zeros (num_experts , dtype = torch .float32 ),
252
- persistent = True ,
253
252
)
254
253
self .register_buffer (
255
254
"tokens_per_expert" ,
256
255
torch .zeros (num_experts , dtype = torch .float32 ),
257
- persistent = True ,
258
256
)
259
257
else :
260
258
self .expert_bias = None
@@ -290,12 +290,10 @@ def __init__(self, model_args: DeepSeekV3ModelArgs):
             self.register_buffer(
                 "expert_bias",
                 torch.zeros(num_experts, dtype=torch.float32),
-                persistent=True,
             )
             self.register_buffer(
                 "tokens_per_expert",
                 torch.zeros(num_experts, dtype=torch.float32),
-                persistent=True,
             )
         else:
             self.expert_bias = None
You can’t perform that action at this time.
0 commit comments