mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2024-12-29 04:44:34 +00:00
speculative : minor fixup
This commit is contained in:
parent
f27ddc57d7
commit
ccc8f63f9f
@ -41,8 +41,9 @@ int main(int argc, char ** argv) {
|
|||||||
|
|
||||||
// load the target model
|
// load the target model
|
||||||
common_init_result llama_init_tgt = common_init_from_params(params);
|
common_init_result llama_init_tgt = common_init_from_params(params);
|
||||||
|
|
||||||
model_tgt = llama_init_tgt.model;
|
model_tgt = llama_init_tgt.model;
|
||||||
ctx_tgt = llama_init_tgt.context;
|
ctx_tgt = llama_init_tgt.context;
|
||||||
|
|
||||||
// load the draft model
|
// load the draft model
|
||||||
params.model = params.model_draft;
|
params.model = params.model_draft;
|
||||||
@ -53,8 +54,9 @@ int main(int argc, char ** argv) {
|
|||||||
|
|
||||||
params.cpuparams_batch.n_threads = params.draft_cpuparams_batch.n_threads;
|
params.cpuparams_batch.n_threads = params.draft_cpuparams_batch.n_threads;
|
||||||
common_init_result llama_init_dft = common_init_from_params(params);
|
common_init_result llama_init_dft = common_init_from_params(params);
|
||||||
|
|
||||||
model_dft = llama_init_dft.model;
|
model_dft = llama_init_dft.model;
|
||||||
ctx_dft = llama_init_dft.context;
|
ctx_dft = llama_init_dft.context;
|
||||||
|
|
||||||
if (!common_speculative_are_compatible(ctx_tgt, ctx_dft)) {
|
if (!common_speculative_are_compatible(ctx_tgt, ctx_dft)) {
|
||||||
return 1;
|
return 1;
|
||||||
|
@ -70,7 +70,7 @@ int main(void) {
|
|||||||
|
|
||||||
// non-existence arg in specific example (--draft cannot be used outside llama-speculative)
|
// non-existence arg in specific example (--draft cannot be used outside llama-speculative)
|
||||||
argv = {"binary_name", "--draft", "123"};
|
argv = {"binary_name", "--draft", "123"};
|
||||||
assert(false == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_SERVER));
|
assert(false == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_EMBEDDING));
|
||||||
|
|
||||||
|
|
||||||
printf("test-arg-parser: test valid usage\n\n");
|
printf("test-arg-parser: test valid usage\n\n");
|
||||||
|
Loading…
Reference in New Issue
Block a user