You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
printf(" -gaw N, --grp-attn-w N set the group attention width to extend context size through self-extend(default: 512), used together with group attention factor `--grp-attn-n`\n");
2198
2198
printf(" --chat-template JINJA_TEMPLATE\n");
2199
2199
printf(" set custom jinja chat template (default: template taken from model's metadata)\n");
2200
-
printf(" Note: only commonly used templates are accepted, since we don't have jinja parser\n");
2200
+
printf(" only commonly used templates are accepted:\n");
if (sparams.chat_template.empty()) { // custom chat template is not supplied
2802
+
// if a custom chat template is not supplied, we will use the one that comes with the model (if any)
2803
+
if (sparams.chat_template.empty()) {
2802
2804
if (!ctx_server.validate_model_chat_template()) {
2803
2805
LOG_ERROR("The chat template that comes with this model is not yet supported, falling back to chatml. This may cause the model to output suboptimal responses", {});
2804
2806
sparams.chat_template = "chatml";
2805
2807
}
2806
2808
}
2807
2809
2810
+
// print sample chat example to make it clear which template is used
2811
+
{
2812
+
json chat;
2813
+
chat.push_back({{"role", "system"}, {"content", "You are a helpful assistant"}});
0 commit comments