2024-09-25 15:08:29 +00:00
|
|
|
#include "tool-call.h"
|
|
|
|
#include "json-schema-to-grammar.h"
|
|
|
|
#include <algorithm>
|
|
|
|
#include <fstream>
|
|
|
|
#include <map>
|
|
|
|
#include <regex>
|
|
|
|
#include <sstream>
|
|
|
|
#include <string>
|
|
|
|
#include <unordered_map>
|
|
|
|
#include <unordered_set>
|
|
|
|
#include <vector>
|
|
|
|
|
|
|
|
// File-wide shorthand for nlohmann's ordered_json type (object keys keep insertion order).
using json = nlohmann::ordered_json;
|
|
|
|
|
2024-10-01 22:12:24 +00:00
|
|
|
/**
 * Guesses the tool call style from marker strings found in the chat template source.
 *
 * Markers are tested in a fixed priority order and the first hit wins; when none of
 * them is present, UnknownToolCallStyle is returned.
 */
llama_tool_call_style llama_tool_call_style_detect(const minja::chat_template & chat_template) {
    const auto & template_text = chat_template.source();
    const auto mentions = [&template_text](const char * marker) {
        return template_text.find(marker) != std::string::npos;
    };

    if (mentions("<tool_call>")) {
        return Hermes2Pro;
    }
    if (mentions(">>>all")) {
        return FunctionaryV3Llama3;
    }
    if (mentions("<|start_header_id|>") && mentions("<function=")) {
        return FunctionaryV3Llama31;
    }
    if (mentions("<|start_header_id|>ipython<|end_header_id|>")) {
        // Templates that also mention the python tag are treated as Llama 3.1, the others as Llama 3.2.
        return mentions("<|python_tag|>") ? Llama31 : Llama32;
    }
    if (mentions("<|START_OF_TURN_TOKEN|><|CHATBOT_TOKEN|>")) {
        return CommandRPlus;
    }
    return UnknownToolCallStyle;
}
|
|
|
|
|
2024-09-25 15:08:29 +00:00
|
|
|
static bool parse_json(std::string::const_iterator & it, const std::string::const_iterator & end, json & out) {
|
|
|
|
// // https://json.nlohmann.me/features/parsing/sax_interface/
|
|
|
|
struct json_error_locator : public nlohmann::json_sax<json> {
|
|
|
|
std::size_t position;
|
|
|
|
bool found_error;
|
|
|
|
|
2024-09-26 02:42:05 +00:00
|
|
|
json_error_locator() : position(0), found_error(false) {}
|
|
|
|
|
2024-09-26 05:50:51 +00:00
|
|
|
bool parse_error(std::size_t position, const std::string &, const json::exception &) override {
|
2024-09-25 15:08:29 +00:00
|
|
|
this->position = position - 1;
|
|
|
|
this->found_error = true;
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
bool null() override { return true; }
|
|
|
|
bool boolean(bool) override { return true; }
|
|
|
|
bool number_integer(number_integer_t) override { return true; }
|
|
|
|
bool number_unsigned(number_unsigned_t) override { return true; }
|
|
|
|
bool number_float(number_float_t, const string_t &) override { return true; }
|
|
|
|
bool string(string_t &) override { return true; }
|
|
|
|
bool binary(binary_t &) override { return true; }
|
|
|
|
bool start_object(std::size_t) override { return true; }
|
|
|
|
bool key(string_t &) override { return true; }
|
|
|
|
bool end_object() override { return true; }
|
|
|
|
bool start_array(std::size_t) override { return true; }
|
|
|
|
bool end_array() override { return true; }
|
|
|
|
};
|
|
|
|
json_error_locator err_loc;
|
|
|
|
json::sax_parse(it, end, &err_loc);
|
|
|
|
|
|
|
|
std::string::const_iterator temptative_end;
|
|
|
|
if (err_loc.found_error) {
|
|
|
|
temptative_end = it + err_loc.position;
|
|
|
|
} else {
|
|
|
|
temptative_end = end;
|
|
|
|
}
|
2024-09-26 02:42:05 +00:00
|
|
|
std::string json_sub {it, temptative_end};
|
2024-09-25 15:08:29 +00:00
|
|
|
try {
|
|
|
|
out = json::parse(json_sub);
|
|
|
|
it = temptative_end;
|
|
|
|
return true;
|
2024-09-26 05:50:51 +00:00
|
|
|
} catch (const std::exception &) {
|
2024-09-25 15:08:29 +00:00
|
|
|
return false;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-09-28 17:30:59 +00:00
|
|
|
/**
|
|
|
|
* Takes a prefix regex that must have 1 group to capture the function name, a closing suffix, and expects json parameters in between.
|
|
|
|
* Aggregates the prefix, suffix and in-between text into the content.
|
|
|
|
*/
|
|
|
|
static llama_tool_calls parse_json_tool_calls(const json & tools, const std::string& input, const std::regex & function_regex, const std::regex & close_regex, bool check_names) {
|
|
|
|
std::smatch match;
|
|
|
|
|
|
|
|
llama_tool_calls result;
|
|
|
|
auto end = input.end();
|
|
|
|
auto it = input.begin();
|
|
|
|
|
|
|
|
std::unordered_set<std::string> tool_names;
|
|
|
|
if (check_names) {
|
|
|
|
for (const auto & tool : tools) {
|
|
|
|
if (tool.contains("type") && tool["type"] == "function") {
|
|
|
|
tool_names.insert(tool["function"]["name"]);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
while (it != end) {
|
|
|
|
std::sregex_iterator rend;
|
|
|
|
std::sregex_iterator rit(it, end, function_regex);
|
|
|
|
if (rit == rend) {
|
|
|
|
result.content += std::string(it, end);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
auto name = rit->str(1);
|
|
|
|
if (check_names && tool_names.find(name) == tool_names.end()) {
|
|
|
|
result.content += std::string(it, rit->suffix().first);
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
result.content += std::string(it, rit->prefix().second);
|
|
|
|
it = rit->suffix().first;
|
|
|
|
|
|
|
|
|
|
|
|
json arguments;
|
|
|
|
if (!parse_json(it, end, arguments)) {
|
|
|
|
throw std::runtime_error("Failed to parse json tool call arguments");
|
|
|
|
}
|
|
|
|
if (!std::regex_search(it, end, match, close_regex)) {
|
|
|
|
throw std::runtime_error("Malformed input, missing closing pattern");
|
|
|
|
}
|
|
|
|
it = match.suffix().first;
|
|
|
|
result.tool_calls.push_back({name, arguments.dump()});
|
|
|
|
}
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2024-09-25 15:08:29 +00:00
|
|
|
/**
 * Parses Hermes-style output: optional content followed by one or more
 * <tool_call>{"name": ..., "arguments": ...}</tool_call> sections.
 *
 * The text before the first <tool_call> becomes the content. If no <tool_call> is found, or
 * anything goes wrong while parsing (invalid JSON, missing closing tag, ...), the whole input
 * is returned as content with no tool calls.
 */
static llama_tool_calls parse_hermes_tool_calls(const std::string& input) {
    try {
        // Compiled once, like the regexes of the other parsers in this file.
        static const std::regex start_pattern(R"([\n\s]*<tool_call>)");
        static const std::regex middle_pattern(R"([\n\s]*</tool_call>[\n\s]*<tool_call>)");
        static const std::regex end_pattern(R"([\n\s]*</tool_call>[\n\s]*$)");

        auto end = input.end();
        std::sregex_iterator rend;
        std::sregex_iterator rit(input.begin(), end, start_pattern);
        if (rit == rend) {
            return {input, {}};
        }

        llama_tool_calls result;
        result.content = rit->prefix();

        auto it = rit->suffix().first;
        while (it != end) {
            json call;
            if (!parse_json(it, end, call)) {
                throw std::runtime_error("Failed to parse json tool call");
            }
            result.tool_calls.push_back({
                call["name"],
                call["arguments"].dump(),
            });

            // Either another call follows (</tool_call> ... <tool_call>) or this must be the final </tool_call>.
            rit = {it, end, middle_pattern};
            if (rit != rend) {
                it = rit->suffix().first;
            } else {
                rit = {it, end, end_pattern};
                if (rit == rend) {
                    throw std::runtime_error("Malformed input, missing </tool_call>");
                }
                break;
            }
        }
        return result;
    } catch (const std::exception &) {
        // Best effort: on any parsing problem, hand the raw text back as content.
        return {input, {}};
    }
}
|
|
|
|
|
2024-09-28 17:30:59 +00:00
|
|
|
/**
 * Parses Llama 3.x style tool calls.
 *
 * When `allow_python_tag` is set and the input contains <|python_tag|>, everything after the tag
 * is returned as the "code" argument of a single "ipython" call, and the text before the tag as content.
 * Otherwise, calls of the form {"name": "...", "parameters": {...}} (at the start of the input or
 * after a newline) are extracted via parse_json_tool_calls, without checking names against `tools`.
 */
static llama_tool_calls parse_llama_3_tool_calls(const json & tools, const std::string& input, bool allow_python_tag) {
    if (allow_python_tag) {
        static std::regex python_tag_regex(R"(<\|python_tag\|>([\s\S\n]*)$)");
        std::smatch tag_match;
        if (std::regex_search(input, tag_match, python_tag_regex)) {
            json code_args;
            code_args["code"] = tag_match[1].str();

            llama_tool_calls python_call;
            python_call.content = tag_match.prefix().str();
            python_call.tool_calls.push_back({"ipython", code_args.dump()});
            return python_call;
        }
    }

    static std::regex function_regex("(?:^|\\n)\\{\"name\": \"([^\"]+)\", \"parameters\": ");
    static std::regex close_regex("\\}");
    const bool check_names = false;
    return parse_json_tool_calls(tools, input, function_regex, close_regex, check_names);
}
|
2024-09-25 15:08:29 +00:00
|
|
|
|
2024-09-27 06:06:33 +00:00
|
|
|
/**
 * Parses Functionary v3 (Llama 3.1 flavour) tool calls.
 *
 * This version of Functionary still supports the llama 3.1 tool call format for the python tool:
 * if the input contains <|python_tag|>, everything after it becomes the "code" argument of a single
 * "ipython" call. Otherwise calls of the form <function=NAME>{json}</function> are extracted via
 * parse_json_tool_calls, without checking names against `tools`.
 */
static llama_tool_calls parse_functionary_v3_llama_3_1_tool_calls(const json & tools, const std::string& input) {
    static std::regex python_tag_regex(R"(<\|python_tag\|>([\s\S\n]*)$)");
    std::smatch tag_match;
    if (std::regex_search(input, tag_match, python_tag_regex)) {
        json code_args;
        code_args["code"] = tag_match[1].str();

        llama_tool_calls python_call;
        python_call.content = tag_match.prefix().str();
        python_call.tool_calls.push_back({"ipython", code_args.dump()});
        return python_call;
    }

    static std::regex function_regex(R"(<function=(\w+)>)");
    static std::regex close_regex(R"(</function>)");
    const bool check_names = false;
    return parse_json_tool_calls(tools, input, function_regex, close_regex, check_names);
}
|
|
|
|
|
2024-09-27 06:06:33 +00:00
|
|
|
/**
 * Parses Functionary v3 tool calls: an optional ">>>" followed by a word and a newline opens a
 * call, then JSON arguments, closed by either the end of the input or the next ">>>".
 * Captured names are checked against `tools` (check_names is true).
 */
static llama_tool_calls parse_functionary_v3_tool_calls(const json & tools, const std::string& input) {
    static std::regex call_open_regex(R"((?:>>>)?(\w+)\n)");
    static std::regex call_close_regex(R"($|(?=>>>))");
    const bool check_names = true;
    return parse_json_tool_calls(tools, input, call_open_regex, call_close_regex, check_names);
}
|
|
|
|
|
2024-09-26 16:19:29 +00:00
|
|
|
/**
 * Dispatches to the parser matching `style`.
 *
 * @param style tool call style (see llama_tool_call_style_detect).
 * @param tools tool definitions, forwarded to the parsers that take them.
 * @param input raw model output.
 * @throws std::runtime_error for styles that have no parser here.
 */
llama_tool_calls parse_tool_calls(llama_tool_call_style style, const json & tools, const std::string& input) {
    switch (style) {
        case llama_tool_call_style::Llama31:
        case llama_tool_call_style::Llama32: {
            // Only the Llama 3.1 style accepts the <|python_tag|> form.
            const bool allow_python_tag = (style == llama_tool_call_style::Llama31);
            return parse_llama_3_tool_calls(tools, input, allow_python_tag);
        }
        case llama_tool_call_style::FunctionaryV3Llama3:
            return parse_functionary_v3_tool_calls(tools, input);
        case llama_tool_call_style::FunctionaryV3Llama31:
            return parse_functionary_v3_llama_3_1_tool_calls(tools, input);
        case llama_tool_call_style::Hermes2Pro:
            return parse_hermes_tool_calls(input);
        default:
            break;
    }
    throw std::runtime_error("Unsupported tool call style");
}
|
|
|
|
|
|
|
|
/**
 * Builds the tool call handler (grammar, grammar trigger words, extra stop words and rendered prompt)
 * for the given tool call style.
 *
 * @param style               tool call style to generate the grammar / prompt for.
 * @param tmpl                chat template used to render the prompt.
 * @param allow_content       when true, trigger words are registered on the handler
 *                            (presumably so the grammar only applies once one of them is seen;
 *                            confirm against the code that consumes grammar_trigger_words).
 * @param parallel_tool_calls when true, the Functionary and Hermes grammars accept several calls
 *                            in a row (not used by the Llama 3.x branch).
 * @param messages            chat messages passed to the template.
 * @param tools               tool definitions; each entry must have a "function" object with
 *                            "name" and "parameters".
 * @return the populated handler.
 * @throws std::runtime_error for unsupported styles; nlohmann json exceptions if a tool entry lacks
 *         one of the required keys.
 */
llama_tool_call_handler llama_tool_call_handler_init(
    llama_tool_call_style style,
    const minja::chat_template & tmpl,
    bool allow_content,
    bool parallel_tool_calls,
    const nlohmann::ordered_json & messages,
    const nlohmann::ordered_json & tools)
{
    llama_tool_call_handler handler;

    switch (style) {
        case llama_tool_call_style::Llama31:
        case llama_tool_call_style::Llama32: {
            static const auto builtin_tools = json {"wolfram_alpha", "brave_search"};
            // builtin_tools is a JSON *array*: json::contains() only looks up object keys and would
            // always return false here, so membership has to be tested element by element.
            const auto is_builtin_tool = [](const std::string & tool_name) {
                return std::any_of(builtin_tools.begin(), builtin_tools.end(), [&tool_name](const json & builtin) {
                    return builtin.is_string() && builtin.get<std::string>() == tool_name;
                });
            };

            auto uses_python_tag = style == llama_tool_call_style::Llama31;

            // Technically we should only trigger on `"\n{\"name\": \"" + name + "\""` for each tool name,
            // but Llama-3.2-3B (and 1B) struggles to output valid tool calls so we're "guiding" it strongly as soon
            // as it seems to be outputting some JSON.
            // TODO: make this conditional on a very small model (e.g. 1B / 3B).
            auto eagerly_match_any_json = style == llama_tool_call_style::Llama32;

            handler.grammar = build_grammar([&](const llama_grammar_builder & builder) {
                std::vector<std::string> tool_rules;
                // All python-tag tools share one rule and one trigger word: add them only once.
                bool python_tag_rule_added = false;

                for (const auto & tool : tools) {
                    const auto & function = tool.at("function");
                    std::string name = function.at("name");
                    auto parameters = function.at("parameters");
                    builder.resolve_refs(parameters);
                    if (uses_python_tag && (name == "ipython" || is_builtin_tool(name))) {
                        if (!python_tag_rule_added) {
                            python_tag_rule_added = true;
                            tool_rules.push_back(builder.add_rule("ipython-call", "\"<|python_tag|>\" .*"));
                            if (allow_content) {
                                handler.grammar_trigger_words.push_back("<|python_tag|>");
                            }
                        }
                    } else {
                        //"<|start_header_id|>assistant<|end_header_id|>\n\n{\"name\": \"" + name + "\", " +
                        tool_rules.push_back(
                            builder.add_rule(
                                name + "-call",
                                "\"\\n\"? \"{\\\"name\\\": \\\"" + name + "\\\", \\\"parameters\\\": \" " +
                                    builder.add_schema(name + "-args", parameters) +
                                " \"}\""));
                        if (allow_content && !eagerly_match_any_json) {
                            handler.grammar_trigger_words.push_back("\n{\"name\": \"" + name + "\"");
                        }
                    }
                }

                if (allow_content && eagerly_match_any_json) {
                    handler.grammar_trigger_words.push_back("\n{\"");
                    handler.grammar_trigger_words.push_back("{\"");
                }

                builder.add_rule("root", join(tool_rules.begin(), tool_rules.end(), " | "));
            });
            handler.additional_stop_words.push_back("<|eom_id|>");
            handler.prompt = tmpl.apply(messages, tools, /* add_generation_prompt= */ true, {
                {"builtin_tools", builtin_tools},
            });
            break;
        }
        case llama_tool_call_style::FunctionaryV3Llama3: {
            // >>>all\nlet's call functions>>>fn1\n{"arg1": 1...}\n>>>fn2\n{"arg1": 1...}...
            // Using ">>>f1\n", ">>>f2\n"... as trigger words for the grammar
            handler.grammar = build_grammar([&](const llama_grammar_builder & builder) {
                std::vector<std::string> first_tool_rules;
                std::vector<std::string> subsequent_tool_rules;
                for (const auto & tool : tools) {
                    const auto & function = tool.at("function");
                    std::string name = function.at("name");
                    auto parameters = function.at("parameters");
                    // Same preparation as in the Llama 3.x and Hermes branches.
                    builder.resolve_refs(parameters);
                    auto args_rule = builder.add_schema(name + "-args", parameters);
                    first_tool_rules.push_back(builder.add_rule(name + "-call", "\"" + name + "\\n\" " + args_rule));
                    subsequent_tool_rules.push_back(builder.add_rule(name + "-call2", "\">>>" + name + "\\n\" " + args_rule));
                    if (allow_content) {
                        handler.grammar_trigger_words.push_back(name + "\n");
                        handler.grammar_trigger_words.push_back(">>>" + name + "\n");
                    }
                }
                auto first_rule = builder.add_rule("first_tool_call", join(first_tool_rules.begin(), first_tool_rules.end(), " | ")) + " space";
                if (parallel_tool_calls) {
                    auto subsequent_rule = builder.add_rule("subsequent_tool_call", join(subsequent_tool_rules.begin(), subsequent_tool_rules.end(), " | ")) + " space";
                    builder.add_rule("root", first_rule + " (" + subsequent_rule + ")*");
                } else {
                    builder.add_rule("root", first_rule);
                }
            });
            handler.prompt = tmpl.apply(messages, tools, /* add_generation_prompt= */ true);
            // handler.parser = parse_functionary_3_2_tool_calls;
            break;
        }
        case llama_tool_call_style::FunctionaryV3Llama31: {
            // ./tests/chat/templates/meetkai-functionary-medium-v3.1.jinja
            // https://github.com/MeetKai/functionary/blob/main/tests/prompt_test_v3-llama3.1.txt
            // TODO: handle tool {type: code_interpreter} as python
            handler.grammar = build_grammar([&](const llama_grammar_builder & builder) {
                std::vector<std::string> tool_rules;
                for (const auto & tool : tools) {
                    const auto & function = tool.at("function");
                    std::string name = function.at("name");
                    auto parameters = function.at("parameters");
                    if (name == "python") {
                        tool_rules.push_back(builder.add_rule("python-call", "\"<|python_tag|>\" .*"));
                        if (allow_content) {
                            handler.grammar_trigger_words.push_back("<|python_tag|>");
                        }
                    } else {
                        // Same preparation as in the Llama 3.x and Hermes branches.
                        builder.resolve_refs(parameters);
                        tool_rules.push_back(builder.add_rule(name + "-call", "\"<function=" + name + ">\" " + builder.add_schema(name + "-args", parameters) + " \"</function>\" space"));
                    }
                }
                auto tool_call = builder.add_rule("tool_call", join(tool_rules.begin(), tool_rules.end(), " | ")) + " space";
                builder.add_rule("root", parallel_tool_calls ? "(" + tool_call + ")+" : tool_call);
                if (allow_content) {
                    handler.grammar_trigger_words.push_back("<function=");
                }
            });
            handler.prompt = tmpl.apply(messages, tools, /* add_generation_prompt= */ true);
            // handler.parser = parse_functionary_3_2_tool_calls;
            break;
        }
        case llama_tool_call_style::Hermes2Pro: {
            // NousResearchHermesPro_2
            // (content)?(<tool_call>{"name": "foo", "arguments": {"a": 1}}</tool_call>)*
            handler.grammar = build_grammar([&](const llama_grammar_builder & builder) {
                std::vector<std::string> tool_rules;
                for (const auto & tool : tools) {
                    const auto & function = tool.at("function");
                    std::string name = function.at("name");
                    auto parameters = function.at("parameters");
                    builder.resolve_refs(parameters);
                    tool_rules.push_back(builder.add_schema(name + "-call", {
                        {"type", "object"},
                        {"properties", json {
                            {"name", json {{"const", name}}},
                            {"arguments", parameters},
                        }},
                        {"required", json::array({"name", "arguments"})},
                    }));
                }

                auto tool_call = "\"<tool_call>\" space " + builder.add_rule("tool_call", join(tool_rules.begin(), tool_rules.end(), " | ")) + " \"</tool_call>\" space";
                builder.add_rule("root", parallel_tool_calls ? "(" + tool_call + ")+" : tool_call);
                if (allow_content) {
                    handler.grammar_trigger_words.push_back("<tool_call>");
                }
            });
            handler.prompt = tmpl.apply(messages, tools, /* add_generation_prompt= */ true);
            break;
        }
        default:
            throw std::runtime_error("Unsupported tool call style");
    }
    return handler;
}
|