From 6a2c824d7903c66187d2a9a3bdcb4dc0c7b0b0e4 Mon Sep 17 00:00:00 2001
From: Xin Liu
Date: Fri, 20 Sep 2024 13:38:59 +0900
Subject: [PATCH] ci(test_api_server): update workflow

Signed-off-by: Xin Liu
---
Review note: the trailing ")" after -F 'snapshot=@default.snapshot' in the
"Import the default.snapshot file to Qdrant" step was removed (an unmatched
")" is a shell syntax error), and the upload URL is now quoted because it
contains "?". Line counts are unchanged, so the hunk headers still hold; the
post-image hash on the "index" line was not recomputed. Indentation was
reconstructed and should be checked against the target workflow file.

 .github/workflows/test_api_server.yml | 24 +++++++++++++++++-------
 1 file changed, 17 insertions(+), 7 deletions(-)

diff --git a/.github/workflows/test_api_server.yml b/.github/workflows/test_api_server.yml
index f495a53..174f32f 100644
--- a/.github/workflows/test_api_server.yml
+++ b/.github/workflows/test_api_server.yml
@@ -61,11 +61,17 @@ jobs:
           curl --location --remote-name https://github.com/Orange-OpenSource/hurl/releases/download/5.0.1/hurl_5.0.1_amd64.deb
           sudo apt update && sudo apt install ./hurl_5.0.1_amd64.deb
 
-      - name: Install Qdrant
+      - name: Install Qdrant and download snapshot
         run: |
+          # Download Qdrant
           curl -LO https://github.com/qdrant/qdrant/releases/download/v1.11.4/qdrant-x86_64-unknown-linux-musl.tar.gz
           tar -xzf qdrant-x86_64-unknown-linux-musl.tar.gz -C .
           rm qdrant-x86_64-unknown-linux-musl.tar.gz
+
+          # Download snapshot
+          curl -LO https://huggingface.co/datasets/gaianet/paris/resolve/main/paris_768_nomic-embed-text-v1.5-f16.snapshot
+          tar -xzOf paris_768_nomic-embed-text-v1.5-f16.snapshot > default.snapshot
+
           ls -al
 
       - name: Build rag-api-server on linux
@@ -80,12 +86,6 @@ jobs:
           curl -LO https://huggingface.co/second-state/Qwen2-1.5B-Instruct-GGUF/resolve/main/Qwen2-1.5B-Instruct-Q3_K_M.gguf
           curl -LO https://huggingface.co/second-state/Nomic-embed-text-v1.5-Embedding-GGUF/resolve/main/nomic-embed-text-v1.5-f16.gguf
 
-      - name: Start Qdrant
-        run: |
-          nohup ./qdrant > ./start-qdrant.log 2>&1 &
-          sleep 2
-          cat start-qdrant.log
-
       - name: Start rag-api-server for testing chat completions
         run: |
           nohup $HOME/.wasmedge/bin/wasmedge --dir .:. --nn-preload default:GGML:AUTO:Qwen2-1.5B-Instruct-Q3_K_M.gguf --nn-preload embedding:GGML:AUTO:nomic-embed-text-v1.5-f16.gguf rag-api-server.wasm --model-name Qwen2-1.5B-Instruct,nomic-embed-text-v1.5 --ctx-size 4096,512 --batch-size 16,512 --prompt-template chatml,embedding --socket-addr 0.0.0.0:8080 > ./start-llamaedge.log 2>&1 &
@@ -100,6 +100,16 @@ jobs:
         run: |
           hurl --test --jobs 1 ./tests/test_embeddings.hurl
 
+      - name: Start Qdrant
+        run: |
+          nohup ./qdrant > ./start-qdrant.log 2>&1 &
+          sleep 5
+          cat start-qdrant.log
+
+      - name: Import the default.snapshot file to Qdrant
+        run: |
+          curl -s -X POST 'http://localhost:6333/collections/default/snapshots/upload?priority=snapshot' -H 'Content-Type:multipart/form-data' -F 'snapshot=@default.snapshot'
+
       - name: Stop rag-api-server for testing chat completions
         run: |
           pkill -f wasmedge