Ctrl+K
- state.param_states.decoder.decoder.pre_cross_attention_layer_norm.scale.v
- state.param_states.decoder.decoder.pre_mlp_layer_norm.scale.v
- state.param_states.decoder.decoder.pre_self_attention_layer_norm.scale.v
- state.param_states.decoder.decoder.relpos_bias.rel_embedding.v
- state.param_states.decoder.decoder_norm.scale.v
- state.param_states.decoder.logits_dense.kernel.v
- state.param_states.encoder.encoder.pre_attention_layer_norm.scale.v
- state.param_states.encoder.encoder.pre_mlp_layer_norm.scale.v
- state.param_states.encoder.encoder.relpos_bias.rel_embedding.v
- state.param_states.encoder.encoder_norm.scale.v
- state.param_states.token_embedder.embedding.v
- target.decoder.decoder.encoder_decoder_attention.key.kernel
- target.decoder.decoder.encoder_decoder_attention.out.kernel
- target.decoder.decoder.encoder_decoder_attention.query.kernel
- target.decoder.decoder.encoder_decoder_attention.value.kernel
- target.decoder.decoder.mlp.wi_0.kernel
- target.decoder.decoder.mlp.wi_1.kernel
- target.decoder.decoder.mlp.wo.kernel
- target.decoder.decoder.pre_cross_attention_layer_norm.scale
- target.decoder.decoder.pre_mlp_layer_norm.scale
- target.decoder.decoder.pre_self_attention_layer_norm.scale
- target.decoder.decoder.relpos_bias.rel_embedding
- target.decoder.decoder.self_attention.key.kernel
- target.decoder.decoder.self_attention.out.kernel
- target.decoder.decoder.self_attention.query.kernel
- target.decoder.decoder.self_attention.value.kernel
- target.decoder.decoder_norm.scale
- target.decoder.logits_dense.kernel
- target.encoder.encoder.attention.key.kernel
- target.encoder.encoder.attention.out.kernel
- target.encoder.encoder.attention.query.kernel
- target.encoder.encoder.attention.value.kernel
- target.encoder.encoder.mlp.wi_0.kernel
- target.encoder.encoder.mlp.wi_1.kernel
- target.encoder.encoder.mlp.wo.kernel
- target.encoder.encoder.pre_attention_layer_norm.scale
- target.encoder.encoder.pre_mlp_layer_norm.scale
- target.encoder.encoder.relpos_bias.rel_embedding
- target.encoder.encoder_norm.scale
- target.token_embedder.embedding
-
16.7 kB