Spaces:

SharryOG
/

AI

Sleeping

SharryOG committed on Jun 23, 2024

Commit

db30e0b

verified ·

1 Parent(s): 8f8bf75

Create app.py

Files changed (1) hide show

app.py ADDED Viewed

+import gradio as gr
+#from transformers import AutoModelForCausalLM, AutoProcessor
+# Model/processor loading is currently disabled: both from_pretrained calls below are commented out, so model_id is not used by any code visible in this file.
+model_id = "microsoft/Phi-3-vision-128k-instruct"  # identifier the disabled from_pretrained calls below would receive
+#model = AutoModelForCausalLM.from_pretrained(model_id, device_map="cuda", trust_remote_code=True, torch_dtype="auto", _attn_implementation='flash_attention_2')
+#processor = AutoProcessor.from_pretrained(model_id, trust_remote_code=True)
+# Define the function to generate text
def generate_text(image, prompt):
    """Return placeholder output text for an image and a prompt.

    No model is invoked here; the function only echoes its inputs as a
    string so the result can be shown in a text output component.

    Args:
        image: The uploaded image object, or ``None`` when no image was
            provided. A plain string is also accepted and is used verbatim
            as the prefix of the result.
        prompt: The user's prompt. ``None`` is treated as an empty string.

    Returns:
        str: ``image + prompt`` when ``image`` is a string; just the prompt
        when ``image`` is ``None``; otherwise a short image tag
        (``"[image WxH] "`` when the object exposes a two-item ``size``,
        else ``"[image] "``) followed by the prompt.
    """
    prompt_text = "" if prompt is None else str(prompt)

    if image is None:
        return prompt_text
    if isinstance(image, str):
        # Plain string concatenation, same result as the previous code.
        return image + prompt_text

    # Image objects cannot be concatenated with str (the previous
    # ``image + prompt`` raised TypeError), so describe the image instead.
    size = getattr(image, "size", None)
    if isinstance(size, (tuple, list)) and len(size) == 2:
        width, height = size
        return f"[image {width}x{height}] {prompt_text}"
    return f"[image] {prompt_text}"
+# Create the Gradio application
# Input components, created in the same order the interface lists them:
# an image upload configured with type="pil", then a text box labelled "Prompt".
image_input = gr.Image(type="pil")
prompt_input = gr.Textbox(label="Prompt")

# Wire generate_text to the two inputs and a single text output.
demo = gr.Interface(
    fn=generate_text,
    inputs=[image_input, prompt_input],
    outputs=gr.Textbox(),
    title="Phi-3-Vision Model",
    description="Generate text based on an image and prompt using the Phi-3-Vision model.",
)

# Start the app at import/run time, with the share option enabled as before.
demo.launch(share=True)