ford442 committed on
Commit f8d4d9e · 1 Parent(s): 68bb8b3

Update app.py

Files changed (1)
  1. app.py +12 -10
app.py CHANGED
@@ -18,17 +18,19 @@ from typing import Tuple
 from transformers import AutoTokenizer, AutoModelForCausalLM
 import paramiko
 
-os.system("chmod +x ./magma.sh")
-os.system("./magma.sh")
+os.system("chmod +x ./cusparselt.sh")
+os.system("./cusparselt.sh")
+os.system("chmod +x ./cudnn.sh")
+os.system("./cudnn.sh")
 
-torch.backends.cuda.matmul.allow_tf32 = True
-torch.backends.cuda.matmul.allow_bf16_reduced_precision_reduction = True
+torch.backends.cuda.matmul.allow_tf32 = False
+torch.backends.cuda.matmul.allow_bf16_reduced_precision_reduction = False
 torch.backends.cuda.matmul.allow_fp16_reduced_precision_reduction = False
-torch.backends.cudnn.allow_tf32 = True
+torch.backends.cudnn.allow_tf32 = False
 torch.backends.cudnn.deterministic = False
-torch.backends.cudnn.benchmark = True
+torch.backends.cudnn.benchmark = False
 torch.backends.cuda.preferred_blas_library="cublas"
-torch.backends.cuda.preferred_linalg_library="magma"
+torch.backends.cuda.preferred_linalg_library="cusolver"
 
 torch.set_float32_matmul_precision("highest")
 
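Note: this hunk swaps the MAGMA install script for cuSPARSELt and cuDNN setup scripts and flips every reduced-precision fast path off. Below is a minimal sketch of the resulting full-precision configuration, assuming a recent CUDA build of PyTorch; in current PyTorch, `preferred_blas_library` and `preferred_linalg_library` are setter functions, so the plain assignments in the diff rebind module attributes rather than calling them.

import torch

# Run matmuls and convolutions in true FP32: no TF32, no reduced-precision
# accumulation, no cuDNN autotuning (slower, but bit-stable across runs).
torch.backends.cuda.matmul.allow_tf32 = False
torch.backends.cuda.matmul.allow_bf16_reduced_precision_reduction = False
torch.backends.cuda.matmul.allow_fp16_reduced_precision_reduction = False
torch.backends.cudnn.allow_tf32 = False
torch.backends.cudnn.benchmark = False

# Called form of the backend selection (an assumption about the intent of
# the assignments in the diff); "cusolver" replaces the previous "magma".
torch.backends.cuda.preferred_blas_library("cublas")
torch.backends.cuda.preferred_linalg_library("cusolver")

torch.set_float32_matmul_precision("highest")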
@@ -123,7 +125,7 @@ def load_and_prepare_model(model_id):
 # Preload and compile both models
 models = {key: load_and_prepare_model(value) for key, value in MODEL_OPTIONS.items()}
 
-MAX_SEED = np.iinfo(np.int32).max
+MAX_SEED = np.iinfo(np.int64).max
 
 def upload_to_ftp(filename):
     try:
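Note: widening MAX_SEED from int32 to int64 grows the usable seed space from 2**31 - 1 to 2**63 - 1. That upper bound still fits torch.Generator.manual_seed, which takes a 64-bit seed; a quick sanity check:

import numpy as np
import torch

print(np.iinfo(np.int32).max)  # 2147483647
print(np.iinfo(np.int64).max)  # 9223372036854775807

# The full signed 64-bit maximum is still a valid torch seed.
torch.Generator(device='cpu').manual_seed(int(np.iinfo(np.int64).max))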
@@ -168,7 +170,7 @@ def generate(
     global models
     pipe = models[model_choice]
     seed = int(randomize_seed_fn(seed, randomize_seed))
-    generator = torch.Generator(device=device).manual_seed(seed)
+    generator = torch.Generator(device='cpu').manual_seed(seed)
 
     prompt, negative_prompt = apply_style(style_selection, prompt, negative_prompt)
 
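Note: generate() previously seeded a generator on the module-level `device`; it now uses a CPU generator. Diffusers-style pipelines generally accept a CPU generator even when the model runs on the GPU, and CPU-seeded noise is reproducible regardless of which accelerator is present. A sketch, with the latent shape purely illustrative:

import torch

seed = 12345
generator = torch.Generator(device='cpu').manual_seed(seed)

# Initial noise drawn on the CPU is the same on any machine with the same
# torch version, and can be moved to the accelerator afterwards.
latents = torch.randn(1, 4, 64, 64, generator=generator)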
@@ -220,7 +222,7 @@ def generate_cpu(
     pipe.to("cpu")
 
     seed = int(randomize_seed_fn(seed, randomize_seed))
-    generator = torch.Generator(device=device).manual_seed(seed)
+    generator = torch.Generator(device='cpu').manual_seed(seed)
 
     prompt, negative_prompt = apply_style(style_selection, prompt, negative_prompt)
 
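Note: in generate_cpu() the pipeline itself is moved to the CPU, so the generator's device now matches the tensors it seeds; pairing a CUDA generator with CPU tensors raises a device-mismatch error. Illustrative only:

import torch

generator = torch.Generator(device='cpu').manual_seed(0)
sample = torch.randn(1, 3, 8, 8, generator=generator)  # OK: generator and tensor both on CPU
# torch.randn(1, 3, 8, 8, generator=torch.Generator(device='cuda'))  # would fail: generator on the wrong device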