We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent a4c0214, commit d135da4 (Copy full SHA for d135da4)
ai_edge_torch/generative/examples/gemma/gemma2.py
@@ -247,6 +247,9 @@ def get_block_config(idx: int) -> cfg.TransformerBlockConfig:
247
rotary_base=10000,
248
rotary_percentage=1.0,
249
qkv_transpose_before_split=True,
250
+ # The safetensors from HF do not use the interleaved qkv format, so
251
+ # we need to disable interleaving here in the model config.
252
+ qkv_fused_interleaved=False,
253
logit_softcap=50.0,
254
sliding_window_size=4096,
255
attn_type=(
0 commit comments