rashedalhuniti committed on
Commit
9f16574
·
verified ·
1 Parent(s): 9e51e1d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -9
app.py CHANGED
@@ -1,13 +1,16 @@
1
  import gradio as gr
2
  from transformers import AutoModelForCausalLM, AutoTokenizer
3
- import torch
4
 
5
- # Load JAIS-13B model and tokenizer
6
- model_name = "InceptionAI/jais-13b"
7
- tokenizer = AutoTokenizer.from_pretrained(model_name)
8
- model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype=torch.float16, device_map="auto")
9
 
10
- def generate_response(prompt, max_length=512, temperature=0.7):
11
- inputs = tokenizer(prompt, return_tensors="pt").to("cuda")
12
- with torch.no_grad():
13
- output = model
 
 
 
 
 
 
1
  import gradio as gr
2
  from transformers import AutoModelForCausalLM, AutoTokenizer
 
3
 
4
+ # Load model and tokenizer
5
+ model = AutoModelForCausalLM.from_pretrained("inceptionai/jais-13b", trust_remote_code=True)
6
+ tokenizer = AutoTokenizer.from_pretrained("inceptionai/jais-13b", trust_remote_code=True)
 
7
 
8
+ def generate_text(prompt):
9
+ inputs = tokenizer(prompt, return_tensors="pt")
10
+ outputs = model.generate(**inputs)
11
+ return tokenizer.decode(outputs[0], skip_special_tokens=True)
12
+
13
+ # Create Gradio interface
14
+ interface = gr.Interface(fn=generate_text, inputs="text", outputs="text")
15
+
16
+ interface.launch()