tool-call: script to prefetch models used in server tests
commit dd6d0241a7
parent 7fde6d0091
scripts/fetch_server_test_models.py (new file, 67 lines)
@@ -0,0 +1,67 @@
'''
    This script fetches all the models used in the server tests.

    This is useful for slow tests that use larger models, to avoid them timing out on the model downloads.

    It is meant to be run from the root of the repository.

    Example:
        python scripts/fetch_server_test_models.py
        ( cd examples/server/tests && ./tests.sh --tags=slow )
'''
import glob
import os
import re
import subprocess

from behave.parser import Parser
from pydantic import BaseModel


class HuggingFaceModel(BaseModel):
    hf_repo: str
    hf_file: str

    class Config:
        frozen = True


# Unique (repo, file) pairs referenced by the Gherkin feature files.
models = set()

model_file_re = re.compile(r'a model file ([^\s\n\r]+) from HF repo ([^\s\n\r]+)')


def process_step(step):
    if (match := model_file_re.search(step.name)):
        (hf_file, hf_repo) = match.groups()
        models.add(HuggingFaceModel(hf_repo=hf_repo, hf_file=hf_file))


feature_files = glob.glob(
    os.path.join(
        os.path.dirname(__file__),
        '../examples/server/tests/features/*.feature'))

for feature_file in feature_files:
    with open(feature_file, 'r') as file:
        feature = Parser().parse(file.read())
        if not feature:
            continue

        if feature.background:
            for step in feature.background.steps:
                process_step(step)

        for scenario in feature.walk_scenarios(with_outlines=True):
            for step in scenario.steps:
                process_step(step)

cli_path = os.environ.get(
    'LLAMA_SERVER_BIN_PATH',
    os.path.join(
        os.path.dirname(__file__),
        '../build/bin/Release/llama-cli.exe' if os.name == 'nt' else '../build/bin/llama-cli'))

for m in models:
    # Skip placeholder values left by scenario outlines, e.g. <hf_repo>.
    if '<' in m.hf_repo or '<' in m.hf_file:
        continue
    print(f'# Ensuring model at {m.hf_repo} / {m.hf_file} is fetched')
    subprocess.check_call([cli_path, '-hfr', m.hf_repo, '-hff', m.hf_file, '-fa', '-n', '1', '-p', 'Hey', '--no-warmup'])
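
To make the feature-walking step concrete, here is a minimal sketch that exercises the same behave calls the script uses (Parser().parse(...), feature.background.steps, feature.walk_scenarios(with_outlines=True), step.name); the feature text itself is a made-up stand-in for the real files under examples/server/tests/features/:

from behave.parser import Parser

# Hypothetical feature text, shaped like the server test features.
feature_text = '''\
Feature: demo
  Background:
    Given a model file stories260K.gguf from HF repo ggml-org/models
  Scenario: smoke
    Then the server is healthy
'''

feature = Parser().parse(feature_text)
for step in feature.background.steps:
    print(step.name)  # a model file stories260K.gguf from HF repo ggml-org/models
for scenario in feature.walk_scenarios(with_outlines=True):
    for step in scenario.steps:
        print(step.name)  # the server is healthy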
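
And a sketch of what a single fetch amounts to: the regex pulls the file/repo pair out of a step name, and the script hands that pair to llama-cli. The step text and the default non-Windows binary path here are illustrative assumptions, not values taken from the actual feature files:

import re

model_file_re = re.compile(r'a model file ([^\s\n\r]+) from HF repo ([^\s\n\r]+)')

# Hypothetical step name, in the shape the regex expects.
step_name = 'a model file stories260K.gguf from HF repo ggml-org/models'
hf_file, hf_repo = model_file_re.search(step_name).groups()

# Equivalent of one subprocess.check_call(...) in the script, assuming
# the default build path rather than a LLAMA_SERVER_BIN_PATH override.
cmd = ['../build/bin/llama-cli', '-hfr', hf_repo, '-hff', hf_file,
       '-fa', '-n', '1', '-p', 'Hey', '--no-warmup']
print(' '.join(cmd))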