diff --git a/examples/speculative-simple/speculative-simple.cpp b/examples/speculative-simple/speculative-simple.cpp index 6dee64834..fb63435ab 100644 --- a/examples/speculative-simple/speculative-simple.cpp +++ b/examples/speculative-simple/speculative-simple.cpp @@ -41,8 +41,9 @@ int main(int argc, char ** argv) { // load the target model common_init_result llama_init_tgt = common_init_from_params(params); + model_tgt = llama_init_tgt.model; - ctx_tgt = llama_init_tgt.context; + ctx_tgt = llama_init_tgt.context; // load the draft model params.model = params.model_draft; @@ -53,8 +54,9 @@ int main(int argc, char ** argv) { params.cpuparams_batch.n_threads = params.draft_cpuparams_batch.n_threads; common_init_result llama_init_dft = common_init_from_params(params); + model_dft = llama_init_dft.model; - ctx_dft = llama_init_dft.context; + ctx_dft = llama_init_dft.context; if (!common_speculative_are_compatible(ctx_tgt, ctx_dft)) { return 1; diff --git a/tests/test-arg-parser.cpp b/tests/test-arg-parser.cpp index 3665238b5..93850b037 100644 --- a/tests/test-arg-parser.cpp +++ b/tests/test-arg-parser.cpp @@ -70,7 +70,7 @@ int main(void) { // non-existence arg in specific example (--draft cannot be used outside llama-speculative) argv = {"binary_name", "--draft", "123"}; - assert(false == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_SERVER)); + assert(false == common_params_parse(argv.size(), list_str_to_char(argv).data(), params, LLAMA_EXAMPLE_EMBEDDING)); printf("test-arg-parser: test valid usage\n\n");