-
Notifications
You must be signed in to change notification settings - Fork 9
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
ci(test_api_server): update workflow
Signed-off-by: Xin Liu <[email protected]>
- Loading branch information
Showing
1 changed file
with
17 additions
and
7 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -61,11 +61,17 @@ jobs: | |
curl --location --remote-name https://github.com/Orange-OpenSource/hurl/releases/download/5.0.1/hurl_5.0.1_amd64.deb | ||
sudo apt update && sudo apt install ./hurl_5.0.1_amd64.deb | ||
- name: Install Qdrant | ||
- name: Install Qdrant and download snapshot | ||
run: | | ||
# Download Qdrant | ||
curl -LO https://github.com/qdrant/qdrant/releases/download/v1.11.4/qdrant-x86_64-unknown-linux-musl.tar.gz | ||
tar -xzf qdrant-x86_64-unknown-linux-musl.tar.gz -C . | ||
rm qdrant-x86_64-unknown-linux-musl.tar.gz | ||
# Download snapshot | ||
curl -LO https://huggingface.co/datasets/gaianet/paris/resolve/main/paris_768_nomic-embed-text-v1.5-f16.snapshot | ||
tar -xzOf paris_768_nomic-embed-text-v1.5-f16.snapshot > default.snapshot | ||
ls -al | ||
- name: Build rag-api-server on linux | ||
|
@@ -80,12 +86,6 @@ jobs: | |
curl -LO https://huggingface.co/second-state/Qwen2-1.5B-Instruct-GGUF/resolve/main/Qwen2-1.5B-Instruct-Q3_K_M.gguf | ||
curl -LO https://huggingface.co/second-state/Nomic-embed-text-v1.5-Embedding-GGUF/resolve/main/nomic-embed-text-v1.5-f16.gguf | ||
- name: Start Qdrant | ||
run: | | ||
nohup ./qdrant > ./start-qdrant.log 2>&1 & | ||
sleep 2 | ||
cat start-qdrant.log | ||
- name: Start rag-api-server for testing chat completions | ||
run: | | ||
nohup $HOME/.wasmedge/bin/wasmedge --dir .:. --nn-preload default:GGML:AUTO:Qwen2-1.5B-Instruct-Q3_K_M.gguf --nn-preload embedding:GGML:AUTO:nomic-embed-text-v1.5-f16.gguf rag-api-server.wasm --model-name Qwen2-1.5B-Instruct,nomic-embed-text-v1.5 --ctx-size 4096,512 --batch-size 16,512 --prompt-template chatml,embedding --socket-addr 0.0.0.0:8080 > ./start-llamaedge.log 2>&1 & | ||
|
@@ -100,6 +100,16 @@ jobs: | |
run: | | ||
hurl --test --jobs 1 ./tests/test_embeddings.hurl | ||
- name: Start Qdrant | ||
run: | | ||
nohup ./qdrant > ./start-qdrant.log 2>&1 & | ||
sleep 5 | ||
cat start-qdrant.log | ||
- name: Import the default.snapshot file to Qdrant | ||
run: | | ||
curl -s -X POST http://localhost:6333/collections/default/snapshots/upload?priority=snapshot -H 'Content-Type:multipart/form-data' -F 'snapshot=@default.snapshot' | ||
- name: Stop rag-api-server for testing chat completions | ||
run: | | ||
pkill -f wasmedge | ||
|