Christoph Holthaus
committed on
Commit
·
9307da2
1
Parent(s):
bd16ace
dev
Browse files
app.py
CHANGED
@@ -4,6 +4,7 @@ from llama_cpp import Llama
|
|
4 |
from time import time
|
5 |
import gradio as gr
|
6 |
import psutil
|
|
|
7 |
|
8 |
# load like this - use the variable everywhere
|
9 |
model_path=os.getenv("MODEL_PATH")
|
@@ -30,11 +31,10 @@ print(f"DEBUG: Memory free: {psutil.virtual_memory().free / (1024.0 ** 3)} GiB")
|
|
30 |
print(f"DEBUG: Memory available: {psutil.virtual_memory().available / (1024.0 ** 3)} GiB")
|
31 |
print(f"DEBUG: Memory: {psutil.virtual_memory().total / (1024.0 ** 3)} GiB")
|
32 |
|
33 |
-
|
34 |
from threading import Thread
|
35 |
from typing import Iterator
|
36 |
|
37 |
-
import gradio as gr
|
38 |
import spaces
|
39 |
import torch
|
40 |
from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer
|
|
|
4 |
from time import time
|
5 |
import gradio as gr
|
6 |
import psutil
|
7 |
+
import os
|
8 |
|
9 |
# load like this - use the variable everywhere
|
10 |
model_path=os.getenv("MODEL_PATH")
|
|
|
31 |
print(f"DEBUG: Memory available: {psutil.virtual_memory().available / (1024.0 ** 3)} GiB")
|
32 |
print(f"DEBUG: Memory: {psutil.virtual_memory().total / (1024.0 ** 3)} GiB")
|
33 |
|
34 |
+
|
35 |
from threading import Thread
|
36 |
from typing import Iterator
|
37 |
|
|
|
38 |
import spaces
|
39 |
import torch
|
40 |
from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer
|