Skip to content

refactor: remove --multi-retrieval CLI option #64

refactor: remove --multi-retrieval CLI option

refactor: remove --multi-retrieval CLI option #64

name: Test API Server
on:
push:
branches:
- dev
- main
- release-*
- feat-*
- ci-*
- refactor-*
- fix-*
- test-*
paths:
- '.github/workflows/test_api_server.yml'
- '**/Cargo.toml'
- '**/*.rs'
- '**/*.sh'
- '**/.cargo/config.toml'
- 'tests/*.hurl'
pull_request:
branches:
- dev
- main
types: [opened, synchronize, reopened]
paths:
- '.github/workflows/**'
- '**/Cargo.toml'
- '**/*.rs'
- '**/*.sh'
- 'tests/*.hurl'
jobs:
test-api-server:
runs-on: ubuntu-latest
strategy:
matrix:
wasmedge_version: [0.14.1]
steps:
- name: Clone project
id: checkout
uses: actions/checkout@v3
- name: Install Rust-nightly
uses: actions-rust-lang/setup-rust-toolchain@v1
with:
toolchain: nightly
target: wasm32-wasip1
components: rustfmt, clippy
- name: Install Rust-stable
uses: actions-rust-lang/setup-rust-toolchain@v1
with:
target: wasm32-wasip1
- name: Install WasmEdge
run: |
curl -sSf https://raw.githubusercontent.com/WasmEdge/WasmEdge/master/utils/install_v2.sh | bash -s -- -v ${{ matrix.wasmedge_version }}
ls -al $HOME/.wasmedge/bin
- name: Install Hurl
run: |
curl --location --remote-name https://github.com/Orange-OpenSource/hurl/releases/download/5.0.1/hurl_5.0.1_amd64.deb
sudo apt update && sudo apt install ./hurl_5.0.1_amd64.deb
- name: Install Qdrant and download snapshot
run: |
# Download Qdrant
curl -LO https://github.com/qdrant/qdrant/releases/download/v1.11.4/qdrant-x86_64-unknown-linux-musl.tar.gz
tar -xvf qdrant-x86_64-unknown-linux-musl.tar.gz
rm qdrant-x86_64-unknown-linux-musl.tar.gz
# Download snapshot
curl -LO https://huggingface.co/datasets/gaianet/paris/resolve/main/paris_768_nomic-embed-text-v1.5-f16.snapshot
mv paris_768_nomic-embed-text-v1.5-f16.snapshot default.snapshot
ls -al
- name: Build rag-api-server on linux
env:
RUSTFLAGS: "--cfg wasmedge --cfg tokio_unstable"
run: |
cargo build -p rag-api-server --release
cp target/wasm32-wasip1/release/rag-api-server.wasm ./rag-api-server.wasm
- name: Download models
run: |
curl -LO https://huggingface.co/second-state/Qwen2-1.5B-Instruct-GGUF/resolve/main/Qwen2-1.5B-Instruct-Q3_K_M.gguf
curl -LO https://huggingface.co/second-state/Nomic-embed-text-v1.5-Embedding-GGUF/resolve/main/nomic-embed-text-v1.5-f16.gguf
- name: Start rag-api-server for testing chat completions
run: |
nohup $HOME/.wasmedge/bin/wasmedge --dir .:. --nn-preload default:GGML:AUTO:Qwen2-1.5B-Instruct-Q3_K_M.gguf --nn-preload embedding:GGML:AUTO:nomic-embed-text-v1.5-f16.gguf rag-api-server.wasm --model-name Qwen2-1.5B-Instruct,nomic-embed-text-v1.5 --ctx-size 4096,512 --batch-size 16,512 --prompt-template chatml,embedding --rag-policy last-user-message --socket-addr 0.0.0.0:9069 > ./start-llamaedge.log 2>&1 &
sleep 30
cat start-llamaedge.log
- name: Run test_chat.hurl
run: |
hurl --test --jobs 1 ./tests/test_chat.hurl
- name: Run test_embeddings.hurl
run: |
hurl --test --jobs 1 ./tests/test_embeddings.hurl
- name: Start Qdrant
run: |
nohup ./qdrant > ./start-qdrant.log 2>&1 &
sleep 5
cat start-qdrant.log
- name: Import the default.snapshot file to Qdrant
run: |
curl -s -X POST http://localhost:6333/collections/default/snapshots/upload?priority=snapshot -H 'Content-Type:multipart/form-data' -F '[email protected]'
- name: Run test_rag.hurl
run: |
hurl --test --jobs 1 ./tests/test_rag.hurl
- name: Stop rag-api-server for testing chat completions
run: |
pkill -f wasmedge
- name: Stop Qdrant
run: |
pkill -f qdrant