feat: add LocalAI support #217

Workflow file for this run

	name: CI

	on:
	pull_request:
	branches: [main]

	jobs:
	build:
	runs-on: ubuntu-latest

	strategy:
	matrix:
	python-version:
	- "3.10"
	- "3.11"
	- "3.12"

	steps:
	- uses: actions/checkout@v4

	- name: Install UV
	run: curl -LsSf https://astral.sh/uv/install.sh \| sh

	- name: Source Cargo Environment
	run: source $HOME/.cargo/env

	- name: Set up Python ${{ matrix.python-version }}
	run: uv python install ${{ matrix.python-version }}

	- name: Ruff
	run: \|
	uvx ruff check -v
	uvx ruff format --check -v

	- name: Run tests
	run: uv run pytest tests -m 'not integration'

	# This integration tests the OpenAI API, using Ollama to host models.
	# This lets us test PRs from forks which can't access secrets like API keys.
	ollama:
	runs-on: ubuntu-latest

	strategy:
	matrix:
	python-version:
	# Only test the latest python version.
	- "3.12"
	ollama-model:
	# For quicker CI, use a smaller, tool-capable model than the default.
	- "qwen2.5:0.5b"

	steps:
	- uses: actions/checkout@v4

	- name: Install UV
	run: curl -LsSf https://astral.sh/uv/install.sh \| sh

	- name: Source Cargo Environment
	run: source $HOME/.cargo/env

	- name: Set up Python
	run: uv python install ${{ matrix.python-version }}

	- name: Install Ollama
	run: curl -fsSL https://ollama.com/install.sh \| sh

	- name: Start Ollama
	run: \|
	# Run the background, in a way that survives to the next step
	nohup ollama serve > ollama.log 2>&1 &

	# Block using the ready endpoint
	time curl --retry 5 --retry-connrefused --retry-delay 1 -sf http://localhost:11434 \|\| (cat ollama.log && exit 1)

	# Tests use OpenAI which does not have a mechanism to pull models. Run a
	# simple prompt to (pull and) test the model first.
	- name: Test Ollama model
	run: ollama run $OLLAMA_MODEL hello \|\| (cat ollama.log && exit 1)
	env:
	OLLAMA_MODEL: ${{ matrix.ollama-model }}

	- name: Run Ollama tests
	run: uv run pytest tests -m integration -k ollama \|\| (cat ollama.log && exit 1)
	env:
	OLLAMA_MODEL: ${{ matrix.ollama-model }}

	# This integration tests the OpenAI API, using LocalAI to host models.
	# This lets us test PRs from forks which can't access secrets like API keys.
	localai:
	runs-on: ubuntu-latest

	strategy:
	matrix:
	python-version:
	# Only test the latest python version.
	- "3.12"

	steps:
	- uses: actions/checkout@v4

	- name: Install UV
	run: curl -LsSf https://astral.sh/uv/install.sh \| sh

	- name: Source Cargo Environment
	run: source $HOME/.cargo/env

	- name: Set up Python
	run: uv python install ${{ matrix.python-version }}

	- name: Download LocalAI
	run: gh release download -R mudler/LocalAI -p local-ai-Linux-x86_64
	env:
	GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}

	- name: Install LocalAI
	run: \|
	mv local-ai-Linux-x86_64 /usr/local/bin/local-ai
	chmod +x /usr/local/bin/local-ai

	- name: Start LocalAI
	run: \|
	# Run the background, in a way that survives to the next step
	nohup local-ai run > localai.log 2>&1 &

	# Note: we don't `local-ai run` with the `LOCALAI_MODELS` env var
	# because the it would introduce a race. The below check would pass
	# before the model is downloaded.

	# Block using the ready endpoint
	time curl --retry 5 --retry-connrefused --retry-delay 1 -sf http://localhost:8080/readyz \|\| (cat localai && exit 1)

	# Tests use OpenAI which does not have a mechanism to install models.
	# This blocks until the model is installed to prevent failures.
	- name: Install LocalAI model
	run: \|
	# Use the default model until we find a small one that passes tests.
	LOCALAI_MODEL=$(uv run python -c "from src.exchange.providers.localai import LOCALAI_MODEL; print(LOCALAI_MODEL)")
	local-ai models install $LOCALAI_MODEL \|\| (cat localai && exit 1)

	- name: Run LocalAI tests
	run: uv run pytest tests -m integration -k localai \|\| (cat localai && exit 1)

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

feat: add LocalAI support #217

Workflow file

feat: add LocalAI support #217

Jobs

Run details

Workflow file for this run