server : return error on too large embedding input (#7389)

This commit is contained in:
Georgi Gerganov 2024-05-20 08:56:05 +03:00 committed by GitHub
parent 2789baf480
commit e932094d58
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -1981,8 +1981,7 @@ struct server_context {
 slot.state = SLOT_STATE_PROCESSING;
 slot.command = SLOT_COMMAND_NONE;
 slot.release();
-slot.print_timings();
-send_final_response(slot);
+send_error(slot, "input is too large to process. increase the physical batch size", ERROR_TYPE_SERVER);
 continue;
 }
 } else {