mirror of
https://github.com/ggerganov/llama.cpp.git
synced 2025-01-12 19:50:17 +00:00
ci: server: tests python env on github container ubuntu latest / fix n_predict (#6935)
* ci: server: fix python env
* ci: server: fix server tests after #6638
* ci: server: fix windows is not building PR branch
This commit is contained in:
parent
928e0b7013
commit
b7368332e2
31
.github/workflows/server.yml
vendored
31
.github/workflows/server.yml
vendored
@ -41,24 +41,16 @@ jobs:
|
|||||||
sanitizer: ""
|
sanitizer: ""
|
||||||
fail-fast: false # While -DLLAMA_SANITIZE_THREAD=ON is broken
|
fail-fast: false # While -DLLAMA_SANITIZE_THREAD=ON is broken
|
||||||
|
|
||||||
container:
|
|
||||||
image: ubuntu:latest
|
|
||||||
ports:
|
|
||||||
- 8888
|
|
||||||
options: --cpus 4
|
|
||||||
|
|
||||||
steps:
|
steps:
|
||||||
- name: Dependencies
|
- name: Dependencies
|
||||||
id: depends
|
id: depends
|
||||||
run: |
|
run: |
|
||||||
apt-get update
|
sudo apt-get update
|
||||||
apt-get -y install \
|
sudo apt-get -y install \
|
||||||
build-essential \
|
build-essential \
|
||||||
xxd \
|
xxd \
|
||||||
git \
|
git \
|
||||||
cmake \
|
cmake \
|
||||||
python3-pip \
|
|
||||||
python3-venv \
|
|
||||||
curl \
|
curl \
|
||||||
wget \
|
wget \
|
||||||
language-pack-en \
|
language-pack-en \
|
||||||
@ -71,6 +63,17 @@ jobs:
|
|||||||
fetch-depth: 0
|
fetch-depth: 0
|
||||||
ref: ${{ github.event.inputs.sha || github.event.pull_request.head.sha || github.sha || github.head_ref || github.ref_name }}
|
ref: ${{ github.event.inputs.sha || github.event.pull_request.head.sha || github.sha || github.head_ref || github.ref_name }}
|
||||||
|
|
||||||
|
- name: Python setup
|
||||||
|
id: setup_python
|
||||||
|
uses: actions/setup-python@v5
|
||||||
|
with:
|
||||||
|
python-version: '3.11'
|
||||||
|
|
||||||
|
- name: Tests dependencies
|
||||||
|
id: test_dependencies
|
||||||
|
run: |
|
||||||
|
pip install -r examples/server/tests/requirements.txt
|
||||||
|
|
||||||
- name: Verify server deps
|
- name: Verify server deps
|
||||||
id: verify_server_deps
|
id: verify_server_deps
|
||||||
run: |
|
run: |
|
||||||
@ -101,13 +104,6 @@ jobs:
|
|||||||
-DLLAMA_SANITIZE_${{ matrix.sanitizer }}=ON ;
|
-DLLAMA_SANITIZE_${{ matrix.sanitizer }}=ON ;
|
||||||
cmake --build . --config ${{ matrix.build_type }} -j $(nproc) --target server
|
cmake --build . --config ${{ matrix.build_type }} -j $(nproc) --target server
|
||||||
|
|
||||||
- name: Setup python env
|
|
||||||
id: pipenv
|
|
||||||
run: |
|
|
||||||
cd examples/server/tests
|
|
||||||
python3 -m venv venv
|
|
||||||
. venv/bin/activate
|
|
||||||
pip install -r requirements.txt
|
|
||||||
|
|
||||||
- name: Tests
|
- name: Tests
|
||||||
id: server_integration_tests
|
id: server_integration_tests
|
||||||
@ -133,6 +129,7 @@ jobs:
|
|||||||
uses: actions/checkout@v4
|
uses: actions/checkout@v4
|
||||||
with:
|
with:
|
||||||
fetch-depth: 0
|
fetch-depth: 0
|
||||||
|
ref: ${{ github.event.inputs.sha || github.event.pull_request.head.sha || github.sha || github.head_ref || github.ref_name }}
|
||||||
|
|
||||||
- name: libCURL
|
- name: libCURL
|
||||||
id: get_libcurl
|
id: get_libcurl
|
||||||
|
@ -1208,7 +1208,7 @@ struct server_context {
|
|||||||
}
|
}
|
||||||
|
|
||||||
auto n_ctx_train = llama_n_ctx_train(model);
|
auto n_ctx_train = llama_n_ctx_train(model);
|
||||||
if (slot.params.n_predict < 1 && slot.ga_n == 1
|
if (slot.params.n_predict < 1 && slot.n_predict < 1 && slot.ga_n == 1
|
||||||
&& slot.n_prompt_tokens + slot.n_decoded >= n_ctx_train) {
|
&& slot.n_prompt_tokens + slot.n_decoded >= n_ctx_train) {
|
||||||
LOG_WARNING("n_predict is not set and self-context extend is disabled."
|
LOG_WARNING("n_predict is not set and self-context extend is disabled."
|
||||||
" Limiting generated tokens to n_ctx_train to avoid EOS-less generation infinite loop", {
|
" Limiting generated tokens to n_ctx_train to avoid EOS-less generation infinite loop", {
|
||||||
|
Loading…
Reference in New Issue
Block a user