Mihaiii committed on
Commit
080b892
·
verified ·
1 Parent(s): 115e01f

Upload 2 files

Browse files
Files changed (2) hide show
  1. Dockerfile +21 -0
  2. script.sh +8 -0
Dockerfile ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
# Image for the "trivia" web app: script.sh starts two llama.cpp servers
# (a ShieldGemma model and a Gemma 2 2B instruct model) in the background and
# then serves the Python app with uvicorn.

# Base image is pinned to one exact llama.cpp server build.
FROM ghcr.io/ggerganov/llama.cpp:server-cuda-7c27a19b2eb91bb0f43c7f7aec0386cec2dddc33

# OS tools: wget downloads the models, git clones the app, python3 + pip run it.
# Recommended packages are deliberately left enabled: HTTPS downloads may rely
# on ca-certificates being pulled in that way, and requirements.txt (not
# visible here) may need pip's recommended build tooling.
# The apt package lists are deleted in the same layer so they never reach the
# image.
RUN apt-get update \
    && apt-get install -y \
        git \
        python3 \
        python3-pip \
        wget \
    && rm -rf /var/lib/apt/lists/*

# NOTE(review): this relative WORKDIR resolves against the base image's working
# directory. script.sh invokes the server as ../llama-server, so this directory
# must stay exactly one level below the binary; confirm the base layout before
# switching to an absolute path.
WORKDIR llama.cpp

# Quantized GGUF model weights, one layer each so they are cached separately.
# NOTE(review): both URLs follow `main`; pin a revision for reproducible builds.
RUN wget -q https://huggingface.co/Mihaiii/shieldgemma-2b-Q5_K_M-GGUF/resolve/main/shieldgemma-2b-q5_k_m-imat.gguf
RUN wget -q https://huggingface.co/bartowski/gemma-2-2b-it-GGUF/resolve/main/gemma-2-2b-it-Q5_K_M.gguf

# Application source and its Python dependencies in a single layer.
# A shallow clone is enough because only the working tree is used, and
# --no-cache-dir keeps pip's download cache out of the image.
# pip runs from inside trivia/ so any relative paths in requirements.txt
# resolve exactly as before.
# NOTE(review): the clone follows the default branch; pin a commit or tag for
# reproducible builds.
RUN git clone --depth 1 https://github.com/Mihaiii/trivia.git \
    && cd trivia \
    && pip install --no-cache-dir -r requirements.txt

# The launcher is copied after the heavy layers so that editing it does not
# invalidate the model downloads or the dependency install.
COPY script.sh .

# Make the launcher executable. The working directory and the app directory
# are made world-writable (non-recursively), presumably so a non-root runtime
# user can create files there. TODO: confirm, and narrow to a dedicated user.
RUN chmod +x ./script.sh \
    && chmod 777 . ./trivia

# uvicorn (started by script.sh) listens on 0.0.0.0:7860; the two llama.cpp
# servers bind to 127.0.0.1 only and are not reachable from outside.
EXPOSE 7860

# The entrypoint hands CMD to `sh -c`, so `docker run <image> "<command>"`
# replaces the launcher with an arbitrary shell command.
ENTRYPOINT ["/bin/sh", "-c"]
CMD ["./script.sh"]
script.sh ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
#!/bin/bash
# Container launcher: starts two llama.cpp servers in the background, then
# runs the trivia web app in the foreground.
#
# Expects to run from the directory that holds both .gguf files and the
# trivia/ checkout, with the llama-server binary one level above it.

# ShieldGemma model, loopback only, port 8000.
../llama-server -m ./shieldgemma-2b-q5_k_m-imat.gguf -c 8192 -t 4 --port 8000 --host 127.0.0.1 --parallel 2 -cb &

# Gemma 2 2B instruct model, loopback only, port 7888.
# `-t` takes a value. It was previously given none, so `--port` was consumed
# as the thread count and the port setting was lost. It now uses 4 threads,
# the same as the server above.
../llama-server -m ./gemma-2-2b-it-Q5_K_M.gguf -c 8192 -t 4 --port 7888 --host 127.0.0.1 --parallel 2 -cb &

# Fixed grace period for the servers to start. This does not verify that
# either model has finished loading.
sleep 5

# Abort instead of launching uvicorn from the wrong directory if the app
# checkout is missing.
cd trivia || exit 1

# exec replaces this shell with uvicorn so that container stop signals are
# delivered to the app directly.
exec uvicorn app:app --port 7860 --host 0.0.0.0