ethertech-healthcare-line-of-therapy-extractor

Sleeping

alpeshsonar committed on Sep 3, 2024

Commit

e1968b9

verified ·

1 Parent(s): 7065e35

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,15 +2,17 @@ import gradio as gr
 from transformers import T5Tokenizer, T5ForConditionalGeneration
 import torch
 from pydantic import BaseModel
 # Initialize FastAPI and Gradio
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 # Load the tokenizer and model once for use in both FastAPI and Gradio
 tokenizer = T5Tokenizer.from_pretrained("alpeshsonar/lot-t5-small-filter", legacy=False)
-model = T5ForConditionalGeneration.from_pretrained("alpeshsonar/lot-t5-small-filter").to(device)
 # Gradio interface
 def generate_text(input_text):
     inputs = tokenizer.encode("Extract lots from given text.\n" + input_text, return_tensors="pt").to(device)
     outputs = model.generate(inputs, max_new_tokens=1024)

 from transformers import T5Tokenizer, T5ForConditionalGeneration
 import torch
 from pydantic import BaseModel
+import spaces
 # Initialize FastAPI and Gradio
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 # Load the tokenizer and model once for use in both FastAPI and Gradio
 tokenizer = T5Tokenizer.from_pretrained("alpeshsonar/lot-t5-small-filter", legacy=False)
+model = T5ForConditionalGeneration.from_pretrained("alpeshsonar/lot-t5-small-filter", torch_dtype=torch.bfloat16).to(device)
 # Gradio interface
+@spaces.GPU(duration=360)
 def generate_text(input_text):
     inputs = tokenizer.encode("Extract lots from given text.\n" + input_text, return_tensors="pt").to(device)
     outputs = model.generate(inputs, max_new_tokens=1024)