Spaces:

darknoon
/

chameleon

Build error

App Files Files Community

darknoon committed on Jul 11, 2024

Commit

7dbba05

1 Parent(s): 85c421c

fixing conversation formatting

Browse files

Files changed (1) hide show

app.py +58 -29

app.py CHANGED Viewed

@@ -10,54 +10,82 @@ import requests
 model_path = "facebook/chameleon-7b"
 # model = ChameleonForCausalLM.from_pretrained(model_path, torch_dtype=torch.bfloat16, low_cpu_mem_usage=True, device_map="auto")
 # processor = ChameleonProcessor.from_pretrained(model_path)
-model = AutoModelForCausalLM.from_pretrained(model_path, torch_dtype=torch.bfloat16, low_cpu_mem_usage=True, device_map="auto", use_auth_token=True)
 model.eval()
-processor = ChameleonProcessor.from_pretrained(model_path, use_auth_token=True)
 tokenizer = processor.tokenizer
-def load_example_image():
-    global image
-    if not image:
-        image = Image.open(requests.get("https://uploads4.wikiart.org/images/paul-klee/death-for-the-idea-1915.jpg!Large.jpg", stream=True).raw)
-    return image
 @spaces.GPU(duration=90)
 def respond(
     message,
-    history: list[tuple[str, str]],
     system_message,
     max_tokens,
     temperature,
     top_p,
 ):
-    # messages = [{"role": "system", "content": system_message}]
-    # for val in history:
-    #     if val[0]:
-    #         messages.append({"role": "user", "content": val[0]})
-    #     if val[1]:
-    #         messages.append({"role": "assistant", "content": val[1]})
-    # messages.append({"role": "user", "content": message})
     response = ""
-    prompt = "I'm very intrigued by this work of art:<image>Please tell me about the artist."
-    image = load_example_image()
-    inputs = processor(prompt, images=[image], return_tensors="pt").to(model.device, dtype=torch.bfloat16)
     streamer = TextIteratorStreamer(tokenizer)
     generation_kwargs = dict(inputs, streamer=streamer, max_new_tokens=20)
-    # launch generation in the background
-    thread = Thread(target=model.generate, kwargs=generation_kwargs)
-    thread.start()
-    partial_message = ""
-    for new_token in streamer:
-        partial_message += new_token
-        yield partial_message
 """
@@ -65,6 +93,7 @@ For information on how to customize the ChatInterface, peruse the gradio docs: h
 """
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
         gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
         gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
@@ -81,4 +110,4 @@ demo = gr.ChatInterface(
 if __name__ == "__main__":
-    demo.launch()

 model_path = "facebook/chameleon-7b"
 # model = ChameleonForCausalLM.from_pretrained(model_path, torch_dtype=torch.bfloat16, low_cpu_mem_usage=True, device_map="auto")
 # processor = ChameleonProcessor.from_pretrained(model_path)
+model = AutoModelForCausalLM.from_pretrained(model_path, torch_dtype=torch.bfloat16, low_cpu_mem_usage=True, device_map="auto")
 model.eval()
+processor = ChameleonProcessor.from_pretrained(model_path)
 tokenizer = processor.tokenizer
+multimodal_file = tuple[str, str]
+multimodal_message = list[str | multimodal_file] | multimodal_file
+# todo: verify this type with gr.ChatInterface
+message_t = str | multimodal_message
+history_t = list[tuple[str, str] | list[tuple[multimodal_message, multimodal_message]]]
def history_to_prompt(
        message,
        history: "history_t",
        eot_id = "<reserved08706>",
        image_placeholder = "<image>"
    ):
    """Flatten the chat history plus the new user message into one prompt.

    Each turn is iterated as a sequence of messages (user first, then
    assistant). Every message that is present is appended to the prompt
    followed by ``eot_id``.

    Args:
        message: The new user message; a ``str`` or a list of parts, where
            each part is a ``str`` or a 2-tuple whose first element is the
            image location.
        history: Previous turns, each an iterable of messages.
        eot_id: Token appended after every message.
        image_placeholder: Text inserted where an image appears.

    Returns:
        A ``(prompt, images)`` tuple: the assembled prompt string and the
        list of images opened for each placeholder, in order.
    """
    prompt = ""
    images = []
    # The new message becomes a final turn whose assistant slot is still empty.
    turns = list(history) + [(message, None)]
    for turn in turns:
        print("turn:", turn)
        # turn should be a tuple of user message and assistant message
        for part in turn:
            if part is None:
                # No reply yet: leave the prompt open for the model to continue.
                continue
            if isinstance(part, str):
                prompt += part
            elif isinstance(part, list):
                for item in part:
                    if isinstance(item, str):
                        prompt += item
                    elif isinstance(item, tuple):
                        # The second tuple element is not used for the prompt.
                        image_path, _alt = item
                        prompt += image_placeholder
                        # NOTE(review): the path is fetched as a URL — confirm
                        # that this is what the chat UI actually supplies.
                        image = Image.open(requests.get(image_path, stream=True).raw)
                        images.append(image)
            else:
                prompt += f"(unhandled message type: {part})"
            prompt += eot_id
    return prompt, images
 @spaces.GPU(duration=90)
 def respond(
     message,
+    history: history_t,
     system_message,
     max_tokens,
     temperature,
     top_p,
 ):
     response = ""
+    print(f"message: {message}\nhistory:\n\n{history}\n")
+    prompt, images = history_to_prompt(message, history)
+    print(f"prompt:\n\n{prompt}\n")
+    # prompt = "I'm very intrigued by this work of art:<image>Please tell me about the artist."
+    # image = Image.open(requests.get("https://uploads4.wikiart.org/images/paul-klee/death-for-the-idea-1915.jpg!Large.jpg", stream=True).raw)
+    # images = [image]
+    inputs = processor(prompt, images=images, return_tensors="pt").to(model.device, dtype=torch.bfloat16)
     streamer = TextIteratorStreamer(tokenizer)
     generation_kwargs = dict(inputs, streamer=streamer, max_new_tokens=20)
+    try:
+        # launch generation in the background
+        thread = Thread(target=model.generate, kwargs=generation_kwargs)
+        thread.start()
+        partial_message = ""
+        for new_token in streamer:
+            partial_message += new_token
+            yield partial_message
+    except e:
+        return f"Error: {e}"
 """
 """
 demo = gr.ChatInterface(
     respond,
+    multimodal=True,
     additional_inputs=[
         gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
         gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
 if __name__ == "__main__":
+    demo.launch(debug=True)