mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-13 04:00:16 +00:00
50 lines
1.3 KiB
C++
50 lines
1.3 KiB
C++
#pragma once
|
|
|
|
#include "ggml.h"
|
|
#include "common.h"
|
|
#include "chat-template.hpp"
|
|
// Change JSON_ASSERT from assert() to GGML_ASSERT:
|
|
#define JSON_ASSERT GGML_ASSERT
|
|
#include "json.hpp"
|
|
|
|
enum llama_tool_call_style {
|
|
UnknownToolCallStyle,
|
|
Generic,
|
|
Llama31,
|
|
Llama32,
|
|
FunctionaryV3Llama3,
|
|
FunctionaryV3Llama31,
|
|
Hermes2Pro,
|
|
CommandRPlus,
|
|
};
|
|
|
|
struct llama_tool_call {
|
|
std::string name;
|
|
std::string arguments;
|
|
};
|
|
|
|
struct llama_tool_calls {
|
|
std::string content;
|
|
std::vector<llama_tool_call> tool_calls;
|
|
};
|
|
|
|
struct llama_tool_call_handler {
|
|
std::string prompt;
|
|
std::string grammar;
|
|
std::vector<std::string> grammar_trigger_words;
|
|
std::vector<std::string> additional_stop_words;
|
|
};
|
|
|
|
llama_tool_call_style llama_tool_call_style_detect(const minja::chat_template & chat_template);
|
|
|
|
llama_tool_calls parse_tool_calls(llama_tool_call_style style, const nlohmann::ordered_json & tools, const std::string& input);
|
|
|
|
llama_tool_call_handler llama_tool_call_handler_init(
|
|
llama_tool_call_style style,
|
|
const minja::chat_template & tmpl,
|
|
bool allow_content,
|
|
bool parallel_tool_calls,
|
|
const nlohmann::ordered_json & messages,
|
|
const nlohmann::ordered_json & tools,
|
|
const nlohmann::ordered_json & json_schema = {});
|