We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ec66a75, commit 762857c (Copy full SHA for 762857c)
jetstream_pt/third_party/llama/model_exportable.py
@@ -232,7 +232,7 @@ def forward(
232
), f"Number of caches ({len(caches)}) and layers ({len(self.layers)}) dont match"
233
end = None if start is None else (start + input_pos) % self.env.cache_len
234
for layer, cache in zip(self.layers, caches):
235
- with jax.named_scope("TransformerBlock"):
+ with jax.named_scope("TransformerBlock_Layer_" + str(layer.layer_id)):
236
h = layer(
237
h,
238
freqs_cis,
0 commit comments