We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
n_rot
1 parent 43fe07c commit dbd8828 · Copy full SHA for dbd8828
convert-persimmon-to-gguf.py
@@ -88,7 +88,8 @@ def main():
88
gguf_writer.add_embedding_length(hidden_size)
89
gguf_writer.add_block_count(block_count)
90
gguf_writer.add_feed_forward_length(hparams.ffn_hidden_size)
91
- gguf_writer.add_rope_dimension_count(hidden_size // head_count)
+ # ref: https://github.com/ggerganov/llama.cpp/pull/4889/commits/eea19039fc52ea2dbd1aab45b59ab4e3e29a3443
92
+ gguf_writer.add_rope_dimension_count(hidden_size // head_count // 2)
93
gguf_writer.add_head_count(head_count)
94
gguf_writer.add_head_count_kv(head_count_kv)
95
gguf_writer.add_rope_freq_base(hparams.rotary_emb_base)
0 commit comments