We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent fc5974d, commit 3575636. Copy full SHA for 3575636
keras_hub/src/models/smollm3/smollm3_causal_lm.py
@@ -70,9 +70,10 @@ def call_with_cache(
70
x = self.backbone.token_embedding(token_ids)
71
72
# Each decoder layer has a cache; we update them separately.
73
- position_embeddings = self.backbone.rotary_embedding(x, start_index=cache_update_index)
+
74
updated_cache = []
75
for i in range(self.backbone.num_layers):
76
+ position_embeddings = self.backbone.rotary_embedding(x, start_index=cache_update_index)
77
current_cache = cache[:, i, ...]
78
x, next_cache = self.backbone.transformer_layers[i](
79
x,
0 commit comments