#pragma once

#include "ggml.h"
#include "common.h"
#include "chat-template.hpp"

#include <string>
#include <vector>

// Change JSON_ASSERT from assert() to GGML_ASSERT:
#define JSON_ASSERT GGML_ASSERT
#include "json.hpp"
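
// Supported tool-call styles (as detected from a chat template).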
enum llama_tool_call_style {
    UnknownToolCallStyle,
    Llama31,
    Llama32,
    FunctionaryV3Llama3,
    FunctionaryV3Llama31,
    Hermes2Pro,
    CommandRPlus,
};
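
// A single tool call extracted from model output: the target function's name
// and its arguments (as a raw string).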
struct llama_tool_call {
    std::string name;
    std::string arguments;
};
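
// Result of parsing a model response: any plain-text content plus the tool
// calls extracted from it.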
struct llama_tool_calls {
    std::string content;
    std::vector<llama_tool_call> tool_calls;
};
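
// Output of llama_tool_call_handler_init(): the prompt to feed the model, a
// grammar, the words that trigger that grammar, and additional stop words.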
struct llama_tool_call_handler {
    std::string prompt;
    std::string grammar;
    std::vector<std::string> grammar_trigger_words;
    std::vector<std::string> additional_stop_words;
};
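
// Detect which tool-call style a given chat template expects.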
llama_tool_call_style llama_tool_call_style_detect(const minja::chat_template & chat_template);
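
// Parse raw model output into plain content and tool calls, according to the
// given style and tool definitions.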
llama_tool_calls parse_tool_calls(llama_tool_call_style style, const nlohmann::ordered_json & tools, const std::string & input);
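
// Build the prompt, grammar, trigger words and stop words needed to request
// tool calls for the given style, template, messages and tools.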
llama_tool_call_handler llama_tool_call_handler_init(
    llama_tool_call_style style,
    const minja::chat_template & tmpl,
    bool allow_content,
    bool parallel_tool_calls,
    const nlohmann::ordered_json & messages,
    const nlohmann::ordered_json & tools);
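
// Example usage (a minimal sketch; `tmpl`, `messages`, `tools` and
// `generated_text` are placeholders for caller-provided values, not part of
// this header):
//
//   llama_tool_call_style style = llama_tool_call_style_detect(tmpl);
//   llama_tool_call_handler handler = llama_tool_call_handler_init(
//       style, tmpl, /* allow_content= */ true, /* parallel_tool_calls= */ false,
//       messages, tools);
//   // ...run generation with handler.prompt, handler.grammar,
//   //    handler.grammar_trigger_words and handler.additional_stop_words...
//   llama_tool_calls result = parse_tool_calls(style, tools, generated_text);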