File size: 698 Bytes
2809bee
 
 
 
 
1ad1638
644ee1c
1ad1638
2809bee
 
 
 
 
 
 
 
 
 
 
1ad1638
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
from fastapi import FastAPI
from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline

# Use a lightweight Japanese model (a 3.6B checkpoint instead of a 7B one).
MODEL_NAME = "rinna/japanese-gpt-neox-3.6b"

app = FastAPI()

# The tokenizer and the causal-LM weights are loaded once, at import time,
# and wrapped in a single text-generation pipeline used by the /generate
# handler. The slow (non-fast) tokenizer implementation is requested
# explicitly via use_fast=False.
tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME, use_fast=False)
model = AutoModelForCausalLM.from_pretrained(MODEL_NAME)
generator = pipeline(
    task="text-generation",
    model=model,
    tokenizer=tokenizer,
)

@app.get("/")
def root():
    """Return a fixed status payload showing that the service is reachable."""
    # NOTE(review): the text names "DeepSeek" while MODEL_NAME points at a
    # rinna checkpoint — confirm the wording is intentional before changing
    # it, since clients may match on this string.
    status = {"message": "DeepSeek API is running!"}
    return status

@app.get("/generate")
def generate(prompt: str, max_length: int = 100):
    """Generate a sampled continuation of ``prompt`` with the shared pipeline.

    Args:
        prompt: Text the model should continue.
        max_length: Forwarded unchanged as the pipeline's ``max_length``
            generation argument (a token budget that, per the transformers
            generation docs, includes the prompt). Must be at least 1 and,
            when the model config reports ``max_position_embeddings``, no
            larger than that value.

    Returns:
        ``{"response": text}`` where ``text`` is the ``generated_text`` field
        of the first result returned by the pipeline.

    Raises:
        HTTPException: With status 422 when ``max_length`` is out of range.
    """
    # Local import keeps this handler self-contained; the module is already
    # loaded by the file's top-level ``from fastapi import FastAPI``.
    from fastapi import HTTPException

    # ``max_length`` comes straight from the query string, so reject values
    # the generator cannot honour instead of surfacing them as a 500.
    if max_length < 1:
        raise HTTPException(
            status_code=422,
            detail="max_length must be a positive integer",
        )

    # Only enforce an upper bound when the loaded model actually reports one.
    context_limit = getattr(generator.model.config, "max_position_embeddings", None)
    if isinstance(context_limit, int) and max_length > context_limit:
        raise HTTPException(
            status_code=422,
            detail=f"max_length must not exceed {context_limit}",
        )

    outputs = generator(prompt, max_length=max_length, do_sample=True)
    return {"response": outputs[0]["generated_text"]}