# Patch summary: adds three steps to the API-server test workflow --
# "Install Qdrant" (download and unpack the v1.11.4 musl release tarball),
# "Start Qdrant" (launch ./qdrant in the background, logging to
# start-qdrant.log), and "Stop Qdrant" (pkill the process at the end).
# NOTE(review): the leading indentation inside the hunks was reconstructed
# assuming the usual GitHub Actions layout (steps at 6 spaces, step keys at 8,
# script lines at 10) -- confirm against the target file before applying.
diff --git a/.github/workflows/test_api_server.yml b/.github/workflows/test_api_server.yml
index a2fb962..f495a53 100644
--- a/.github/workflows/test_api_server.yml
+++ b/.github/workflows/test_api_server.yml
@@ -61,6 +61,13 @@ jobs:
           curl --location --remote-name https://github.com/Orange-OpenSource/hurl/releases/download/5.0.1/hurl_5.0.1_amd64.deb
           sudo apt update && sudo apt install ./hurl_5.0.1_amd64.deb
 
+      - name: Install Qdrant
+        run: |
+          curl -LO https://github.com/qdrant/qdrant/releases/download/v1.11.4/qdrant-x86_64-unknown-linux-musl.tar.gz
+          tar -xzf qdrant-x86_64-unknown-linux-musl.tar.gz -C .
+          rm qdrant-x86_64-unknown-linux-musl.tar.gz
+          ls -al
+
       - name: Build rag-api-server on linux
         env:
           RUSTFLAGS: "--cfg wasmedge --cfg tokio_unstable"
@@ -73,6 +80,12 @@ jobs:
           curl -LO https://huggingface.co/second-state/Qwen2-1.5B-Instruct-GGUF/resolve/main/Qwen2-1.5B-Instruct-Q3_K_M.gguf
           curl -LO https://huggingface.co/second-state/Nomic-embed-text-v1.5-Embedding-GGUF/resolve/main/nomic-embed-text-v1.5-f16.gguf
 
+      - name: Start Qdrant
+        run: |
+          nohup ./qdrant > ./start-qdrant.log 2>&1 &
+          sleep 2
+          cat start-qdrant.log
+
       - name: Start rag-api-server for testing chat completions
         run: |
           nohup $HOME/.wasmedge/bin/wasmedge --dir .:. --nn-preload default:GGML:AUTO:Qwen2-1.5B-Instruct-Q3_K_M.gguf --nn-preload embedding:GGML:AUTO:nomic-embed-text-v1.5-f16.gguf rag-api-server.wasm --model-name Qwen2-1.5B-Instruct,nomic-embed-text-v1.5 --ctx-size 4096,512 --batch-size 16,512 --prompt-template chatml,embedding --socket-addr 0.0.0.0:8080 > ./start-llamaedge.log 2>&1 &
@@ -90,3 +103,7 @@ jobs:
       - name: Stop rag-api-server for testing chat completions
         run: |
           pkill -f wasmedge
+
+      - name: Stop Qdrant
+        run: |
+          pkill -f qdrant