Update app.py
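Summary (from the diff below): removes the runtime `pip install --upgrade transformers` step and its status prints, trims the remaining startup prints, and fixes a syntax error in the final `launch()` call, which was missing its closing parenthesis.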
app.py
CHANGED
@@ -4,31 +4,20 @@ import torch
 from PIL import Image
 from transformers import AutoProcessor, AutoModelForCausalLM
 
-#
-try:
-    subprocess.run('pip install --upgrade transformers', check=True, shell=True)
-    print("Successfully upgraded transformers.")
-except subprocess.CalledProcessError as e:
-    print(f"Error upgrading transformers: {e}")
-    print("Continuing with the current version, but this may cause issues.")
-
-# Attempt to install flash-attn (optional, for performance)
+# Attempt to install flash-attn
 try:
     subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, check=True, shell=True)
-    print("Successfully installed flash-attn.")
 except subprocess.CalledProcessError as e:
     print(f"Error installing flash-attn: {e}")
     print("Continuing without flash-attn.")
 
 # Determine the device to use
 device = "cuda" if torch.cuda.is_available() else "cpu"
-print(f"Using device: {device}")
 
 # Load the base model and processor
 try:
     vision_language_model_base = AutoModelForCausalLM.from_pretrained('microsoft/Florence-2-base', trust_remote_code=True).to(device).eval()
     vision_language_processor_base = AutoProcessor.from_pretrained('microsoft/Florence-2-base', trust_remote_code=True)
-    print("Base model and processor loaded successfully.")
 except Exception as e:
     print(f"Error loading base model: {e}")
     vision_language_model_base = None
@@ -38,7 +27,6 @@ except Exception as e:
 try:
     vision_language_model_large = AutoModelForCausalLM.from_pretrained('microsoft/Florence-2-large', trust_remote_code=True).to(device).eval()
     vision_language_processor_large = AutoProcessor.from_pretrained('microsoft/Florence-2-large', trust_remote_code=True)
-    print("Large model and processor loaded successfully.")
 except Exception as e:
     print(f"Error loading large model: {e}")
     vision_language_model_large = None
@@ -113,4 +101,4 @@ image_description_interface = gr.Interface(
 )
 
 # Launch the interface
-image_description_interface.launch(debug=True
+image_description_interface.launch(debug=True)
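For context, here is a minimal sketch of how the loaded Florence-2 model/processor pairs are typically invoked for captioning, following the usage shown on the microsoft/Florence-2-large model card. The inference code of app.py (the elided lines 45-112) is not part of this diff, so the function name describe_image and the '<MORE_DETAILED_CAPTION>' task prompt are illustrative assumptions, not the app's actual code.

from PIL import Image

def describe_image(image: Image.Image, model, processor,
                   task_prompt: str = '<MORE_DETAILED_CAPTION>') -> str:
    """Caption `image` with a loaded Florence-2 model (hypothetical helper).

    Relies on the module-level `device` defined in app.py; `model` and
    `processor` are the pairs loaded above (base or large).
    """
    if model is None or processor is None:
        return "Model failed to load; see startup logs."
    # Florence-2 takes the task token as the text prompt alongside the image.
    inputs = processor(text=task_prompt, images=image, return_tensors="pt").to(device)
    generated_ids = model.generate(
        input_ids=inputs["input_ids"],
        pixel_values=inputs["pixel_values"],
        max_new_tokens=1024,
        num_beams=3,
    )
    # Keep special tokens so post_process_generation can parse the task output.
    generated_text = processor.batch_decode(generated_ids, skip_special_tokens=False)[0]
    # Returns a dict keyed by the task prompt, e.g. {'<MORE_DETAILED_CAPTION>': '...'}.
    parsed = processor.post_process_generation(
        generated_text, task=task_prompt, image_size=(image.width, image.height)
    )
    return parsed[task_prompt]

# Example: describe_image(img, vision_language_model_base, vision_language_processor_base)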