ci.yml
prepare:
  steps:
    - name: Clone repository
      # Clone on the first run; if the repository already exists, fall back to pulling
      # the latest changes ('||' rather than a pipe, so the pull only runs when the clone fails).
      command: git clone https://github.com/ggerganov/llama.cpp.git || (cd llama.cpp && git pull)
    - name: Clean
      command: cd llama.cpp && make clean
    - name: Build llama.cpp
      # Build with CUDA support when the NVIDIA cuBLAS environment variable is present,
      # otherwise fall back to a CPU-only build.
      command: cd llama.cpp && if [ -v NV_LIBCUBLAS_VERSION ]; then echo 'Make for gpu' && LLAMA_CUDA=1 make; else echo 'Make for cpu' && make; fi
    - name: Download model
      # Skip the download if the quantized GGUF model is already present.
      command: "[ -f /home/user/app/llama.cpp/models/Meta-Llama-3.1-8B-Instruct-Q4_K_M.gguf ] || wget -P /home/user/app/llama.cpp/models https://huggingface.co/lmstudio-community/Meta-Llama-3.1-8B-Instruct-GGUF/resolve/main/Meta-Llama-3.1-8B-Instruct-Q4_K_M.gguf"
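
# Optional sanity check (a hedged sketch, not part of the original pipeline): the build
# step above takes the CUDA path when NV_LIBCUBLAS_VERSION is set, so listing the visible
# GPUs beforehand can help confirm which branch will actually run on a given machine.
#
#   command -v nvidia-smi && nvidia-smi -L || echo 'No NVIDIA GPU visible; CPU build will be used'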
test:
  steps: []
run:
  steps:
    - name: Run
      # Serve the model on port 3000 with a 30000-token context; offload 35 layers to the
      # GPU when CUDA is available, otherwise run on the CPU with 8 threads.
      command: cd llama.cpp && if [ -v NV_LIBCUBLAS_VERSION ]; then echo 'Starting gpu server' && ./llama-server -m ./models/Meta-Llama-3.1-8B-Instruct-Q4_K_M.gguf -c 30000 --port 3000 --host 0.0.0.0 -ngl 35; else echo 'Starting cpu server' && ./llama-server -m ./models/Meta-Llama-3.1-8B-Instruct-Q4_K_M.gguf -c 30000 --port 3000 --host 0.0.0.0 -t 8; fi
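
# Usage sketch (an assumption, not part of the original config): once the run step is up,
# llama-server exposes an OpenAI-compatible HTTP API on the host/port configured above, so
# a request like the following should return a chat completion. The prompt text is a
# placeholder; adjust the host and port if the values above change.
#
#   curl http://localhost:3000/v1/chat/completions \
#     -H "Content-Type: application/json" \
#     -d '{"messages": [{"role": "user", "content": "Hello!"}]}'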