We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
--special
1 parent e02b597, commit 3807c3d (Copy full SHA for 3807c3d)
examples/server/server.cpp
@@ -1182,7 +1182,7 @@ struct server_context {
1182
1183
bool process_token(completion_token_output & result, server_slot & slot) {
1184
// remember which tokens were sampled - used for repetition penalties during sampling
1185
- const std::string token_str = llama_token_to_piece(ctx, result.tok, false);
+ const std::string token_str = llama_token_to_piece(ctx, result.tok, params.special);
1186
slot.sampled = result.tok;
1187
1188
// search stop word and delete it
0 commit comments