Spaces:
Runtime error
Runtime error
Commit
·
0512849
1
Parent(s):
6df1721
First commit
Browse files
app.py
CHANGED
@@ -1,8 +1,13 @@
|
|
|
|
1 |
import torch
|
2 |
from fastapi import FastAPI, HTTPException
|
3 |
from pydantic import BaseModel
|
4 |
from transformers import AutoTokenizer, AutoModelForCausalLM, GenerationConfig
|
5 |
|
|
|
|
|
|
|
|
|
6 |
# Model setup
|
7 |
MODEL_NAME = "deepseek-ai/deepseek-llm-7b-base"
|
8 |
DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
|
|
|
1 |
+
import os
|
2 |
import torch
|
3 |
from fastapi import FastAPI, HTTPException
|
4 |
from pydantic import BaseModel
|
5 |
from transformers import AutoTokenizer, AutoModelForCausalLM, GenerationConfig
|
6 |
|
7 |
+
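# Set custom cache directory. NOTE(review): HF_HOME / TRANSFORMERS_CACHE appear to be read when transformers (via huggingface_hub) is imported, so these assignments likely need to run before the `from transformers import ...` line to take effect — confirm.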
|
8 |
+
os.environ["HF_HOME"] = "/tmp/huggingface"
|
9 |
+
os.environ["TRANSFORMERS_CACHE"] = "/tmp/huggingface"
|
10 |
+
|
11 |
# Model setup
|
12 |
MODEL_NAME = "deepseek-ai/deepseek-llm-7b-base"
|
13 |
DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
|