arya-ai-model committed on
Commit
0512849
·
1 Parent(s): 6df1721

First commit

Browse files
Files changed (1) hide show
  1. app.py +5 -0
app.py CHANGED
@@ -1,8 +1,13 @@
 
1
  import torch
2
  from fastapi import FastAPI, HTTPException
3
  from pydantic import BaseModel
4
  from transformers import AutoTokenizer, AutoModelForCausalLM, GenerationConfig
5
 
 
 
 
 
6
  # Model setup
7
  MODEL_NAME = "deepseek-ai/deepseek-llm-7b-base"
8
  DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
 
1
+ import os
2
  import torch
3
  from fastapi import FastAPI, HTTPException
4
  from pydantic import BaseModel
5
  from transformers import AutoTokenizer, AutoModelForCausalLM, GenerationConfig
6
 
7
+ # Set custom cache directory
8
+ os.environ["HF_HOME"] = "/tmp/huggingface"
9
+ os.environ["TRANSFORMERS_CACHE"] = "/tmp/huggingface"
10
+
11
  # Model setup
12
  MODEL_NAME = "deepseek-ai/deepseek-llm-7b-base"
13
  DEVICE = "cuda" if torch.cuda.is_available() else "cpu"