MrAli committed on
Commit
361043a
·
verified ·
1 Parent(s): 511b17b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -17
app.py CHANGED
@@ -7,10 +7,8 @@ os.system("ulimit -l unlimited")
7
  app = FastAPI()
8
 
9
  hf_hub_download("TheBloke/deepseek-coder-1.3b-base-GGUF", "deepseek-coder-1.3b-base.Q5_K_M.gguf", local_dir="./")
10
- hf_hub_download("TheBloke/deepseek-coder-6.7B-base-GGUF", "deepseek-coder-6.7b-base.Q4_K_M.gguf", local_dir="./")
11
-
12
  model_l = Llama(model_path="./deepseek-coder-1.3b-base.Q5_K_M.gguf", n_ctx=16000, n_gpu_layers=0, n_threads=2, use_mlock=True)
13
- model_f = Llama(model_path="./deepseek-coder-6.7b-base.Q5_K_M.gguf", n_ctx=16000, n_gpu_layers=0, n_threads=2, use_mlock=True)
14
 
15
  @app.get("/check")
16
  async def index():
@@ -21,20 +19,13 @@ async def completion(request: Request):
21
  data = await request.json()
22
  prompt = data["prompt"]
23
  mode = data['mode']
24
- if mode == 'f':
25
- res = model_f(
26
- prompt,
27
- temperature=0.6,
28
- echo=False,
29
- max_tokens=41,
30
- )
31
- else:
32
- res = model_l(
33
- prompt,
34
- temperature=0.6,
35
- echo=False,
36
- max_tokens=41,
37
- )
38
  return {"responses": res["choices"]}
39
 
40
  if __name__ == "__main__":
 
7
  app = FastAPI()
8
 
9
  hf_hub_download("TheBloke/deepseek-coder-1.3b-base-GGUF", "deepseek-coder-1.3b-base.Q5_K_M.gguf", local_dir="./")
 
 
10
  model_l = Llama(model_path="./deepseek-coder-1.3b-base.Q5_K_M.gguf", n_ctx=16000, n_gpu_layers=0, n_threads=2, use_mlock=True)
11
+
12
 
13
  @app.get("/check")
14
  async def index():
 
19
  data = await request.json()
20
  prompt = data["prompt"]
21
  mode = data['mode']
22
+
23
+ res = model_l(
24
+ prompt,
25
+ temperature=0.6,
26
+ echo=False,
27
+ max_tokens=41,
28
+ )
 
 
 
 
 
 
 
29
  return {"responses": res["choices"]}
30
 
31
  if __name__ == "__main__":