Gemini-Image-Edit

Running

App Files Files Community

Wiuhh committed on Aug 14

Commit

153d837

verified ·

1 Parent(s): 41a4a34

Update app.py

Browse files

Files changed (1) hide show

app.py +138 -115

app.py CHANGED Viewed

@@ -10,154 +10,177 @@ import mimetypes
 from google import genai
 from google.genai import types
-# Aapki Gemini API Key yahan daal di gayi hai.
-GEMINI_API_KEY = "AIzaSyCrhWiAEQmCidtE2QZw3CTiLt7F8yv5M7A"
 def save_binary_file(file_name, data):
     with open(file_name, "wb") as f:
         f.write(data)
-def generate(text, file_name, model="gemini-2.0-flash-exp"):
-    # Client ko hardcoded API key se initialize karein.
-    client = genai.Client(api_key=GEMINI_API_KEY)
-    files = [
-        client.files.upload(file=file_name),
-    ]
-    contents = [
-        types.Content(
-            role="user",
-            parts=[
-                types.Part.from_uri(
-                    file_uri=files[0].uri,
-                    mime_type=files[0].mime_type,
-                ),
-                types.Part.from_text(text=text),
-            ],
-        ),
     ]
-    generate_content_config = types.GenerateContentConfig(
         temperature=1,
         top_p=0.95,
         top_k=40,
         max_output_tokens=8192,
-        response_modalities=[
-            "image",
-            "text",
-        ],
-        response_mime_type="text/plain",
     )
-    with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
-        temp_path = tmp.name
-        for chunk in client.models.generate_content_stream(
-            model=model,
-            contents=contents,
-            config=generate_content_config,
-        ):
-            if not chunk.candidates or not chunk.candidates[0].content or not chunk.candidates[0].content.parts:
-                continue
-            inline_data = chunk.candidates[0].content.parts[0].inline_data
-            if inline_data:
-                save_binary_file(temp_path, inline_data.data)
-                print(
-                    "File of mime type "
-                    f"{inline_data.mime_type} saved to: {temp_path} and prompt input :{text}"
-                )
-            else:
-                print(chunk.text)
-    del files
-    return temp_path
 def process_image_and_prompt(composite_pil, prompt):
-    # Save the composite image to a temporary file.
     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
         composite_path = tmp.name
-        composite_pil.save(composite_path)
     file_name = composite_path
     input_text = prompt
-    model = "gemini-2.0-flash-exp"
-    gemma_edited_image_path = generate(text=input_text, file_name=file_name, model=model)
-    print("image_path ", gemma_edited_image_path)
-    result_img = Image.open(gemma_edited_image_path)
-    if result_img.mode == "RGBA":
-        result_img = result_img.convert("RGB")
-    return [result_img]
-# Build a Blocks-based interface to include the custom HTML header.
-with gr.Blocks() as demo:
-    # HTML Header for the application.
-    gr.HTML(
     """
-    <div style='display: flex; align-items: center; justify-content: center; gap: 20px'>
-    <div style="background-color: var(--block-background-fill); border-radius: 8px">
-        <img src="https://www.gstatic.com/lamda/images/gemini_favicon_f069958c85030456e93de685481c559f160ea06b.png" style="width: 100px; height: 100px;">
-    </div>
-    <div>
-        <h1>Gen AI Image Editing</h1>
-        <p>Gemini using for Image Editing</p>
-        <p>Powered by <a href="https://gradio.app/">Gradio</a> ⚡️</p>
-        <p>Get an API Key <a href="https://aistudio.google.com/apikey">here</a></p>
-        <p>Follow me on Instagram: <a href="https://www.instagram.com/nihal_gazi_io/">nihal_gazi_io</a></p>
-        <p>Or contact me through Discord: <b><i>@nihal_gazi_io</i></b></p>
-    </div>
     </div>
     """
     )
-    # Define examples to be shown within the Gradio interface
     examples = [
-        # Each example is a list corresponding to the inputs:
-        # [Input Image, Prompt]
-        ["data/1.webp", 'change text to "AMEER"'],
-        ["data/2.webp", "remove the spoon from  hand only"],
-        ["data/3.webp", 'change text to "Make it "'],
-        ["data/1.jpg", "add  joker style only on face"],
-         ["data/1777043.jpg", "add  joker style only on face"],
-         ["data/2807615.jpg","add lipstick on lip only "],
-         ["data/76860.jpg", "add lipstick on lip only "],
-         ["data/2807615.jpg", "make it happy looking face only"],
     ]
-    gr.Markdown("Upload an image and enter a prompt to generate outputs in the gallery. Do not Use NFSW Images")
-    with gr.Row():
-        with gr.Column():
-            image_input = gr.Image(
-                type="pil",
-                label="Upload Image",
-                image_mode="RGBA"
-            )
-            # API Key Textbox ko yahan se hata diya gaya hai
-            prompt_input = gr.Textbox(
-                lines=2,
-                placeholder="Enter prompt here...",
-                label="Prompt"
-            )
-            submit_btn = gr.Button("Generate")
-        with gr.Column():
-            output_gallery = gr.Gallery(label="Generated Outputs")
-    # Set up the interaction.
     submit_btn.click(
         fn=process_image_and_prompt,
-        inputs=[image_input, prompt_input], # Inputs se API key hata di gayi hai
         outputs=output_gallery,
-    )
-    gr.Examples(
-        examples=examples,
-        inputs=[image_input, prompt_input], # Inputs se API key hata di gayi hai
-        label="Try these examples"
     )
-demo.launch(share=True)

 from google import genai
 from google.genai import types
+from dotenv import load_dotenv
+# Load environment variables (such as GEMINI_API_KEY) from the .env file
+load_dotenv()
+def get_api_key():
+    """Return the Gemini API key read from the GEMINI_API_KEY environment variable.
+
+    Raises:
+        gr.Error: if the variable is unset or empty.
+    """
+    key = os.environ.get("GEMINI_API_KEY")
+    if key:
+        return key
+    # No usable key: raise a Gradio error so the problem is shown in the app.
+    raise gr.Error("Gemini API Key nahi mili. Kripya apni .env file check karein.")
 def save_binary_file(file_name, data):
+    """Write `data` to `file_name` in binary mode, replacing any existing content."""
     with open(file_name, "wb") as f:
         f.write(data)
+def generate(text, file_name, model="gemini-1.5-flash-latest"):
+    """Ask a Gemini model to edit the image at `file_name` as described by `text`.
+
+    The image is uploaded through the Files API of the `google.genai` client,
+    sent to the model together with the prompt, and the image data returned
+    by the model is written to a new temporary file.
+
+    Args:
+        text: Editing instruction for the model.
+        file_name: Path of the input image on disk.
+        model: Name of the model to call. NOTE(review): the default is kept
+            for backward compatibility, but image output needs a model that
+            can return images - confirm which model callers should pass.
+
+    Returns:
+        Path of a temporary file (".png" suffix) holding the generated image.
+        The file is created with delete=False, so the caller must remove it.
+
+    Raises:
+        gr.Error: if the API key is missing or the model returned no image.
+    """
+    # `from google import genai` is the google-genai SDK, where every call goes
+    # through a Client instance. The module-level configure() /
+    # GenerativeModel() / upload_file() / delete_file() helpers belong to the
+    # legacy google.generativeai package and are not available on this module.
+    client = genai.Client(api_key=get_api_key())
+    uploaded_file = client.files.upload(file=file_name)
+    contents = [
+        types.Content(
+            role="user",
+            parts=[
+                types.Part.from_uri(
+                    file_uri=uploaded_file.uri,
+                    mime_type=uploaded_file.mime_type,
+                ),
+                types.Part.from_text(text=text),
+            ],
+        ),
     ]
+    generate_content_config = types.GenerateContentConfig(
         temperature=1,
         top_p=0.95,
         top_k=40,
         max_output_tokens=8192,
+        # Image output is requested via response_modalities, not by setting
+        # response_mime_type to an image type.
+        response_modalities=["image", "text"],
+        response_mime_type="text/plain",
     )
+    try:
+        image_data = None
+        text_parts = []
+        # The stream is consumed once, so text and image data are gathered in
+        # the same pass instead of iterating the response a second time.
+        for chunk in client.models.generate_content_stream(
+            model=model,
+            contents=contents,
+            config=generate_content_config,
+        ):
+            if not chunk.candidates or not chunk.candidates[0].content:
+                continue
+            for part in chunk.candidates[0].content.parts or []:
+                if part.inline_data and part.inline_data.data:
+                    # Presumably each inline part is a complete image (the
+                    # previous revision saved each one as its own file), so
+                    # keep the latest one rather than concatenating bytes.
+                    image_data = part.inline_data.data
+                elif part.text:
+                    text_parts.append(part.text)
+        if not image_data:
+            # No image came back: log whatever text the model sent instead.
+            print("Model se koi image nahi aayi. Response:", "".join(text_parts))
+            raise gr.Error("Maaf kijiye, image generate nahi ho saki. Kripya apna prompt badal kar koshish karein.")
+        with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
+            temp_path = tmp.name
+            tmp.write(image_data)
+        print(f"File {temp_path} par save ho gayi. Prompt: {text}")
+        return temp_path
+    finally:
+        # Best-effort removal of the uploaded copy; a cleanup failure must not
+        # replace the real result or the real error.
+        try:
+            client.files.delete(name=uploaded_file.name)
+        except Exception as exc:
+            print("Could not delete uploaded file:", exc)
 def process_image_and_prompt(composite_pil, prompt):
+    """Gradio handler: edit the uploaded image according to the prompt.
+
+    Args:
+        composite_pil: The uploaded image as a PIL image, or None when
+            nothing was uploaded.
+        prompt: The editing instruction typed by the user.
+
+    Returns:
+        A one-element list holding the edited PIL image.
+
+    Raises:
+        gr.Error: if the image or prompt is missing, or no image was produced.
+    """
+    if composite_pil is None:
+        raise gr.Error("Kripya pehle ek image upload karein!")
+    # `prompt` can be None as well as empty or blank; reject all three.
+    if not prompt or not prompt.strip():
+        raise gr.Error("Kripya prompt enter karein ki image ke saath kya karna hai.")
+    # Ensure the image is RGB before saving if it has an alpha channel.
+    if composite_pil.mode == 'RGBA':
+        composite_pil = composite_pil.convert('RGB')
+    # Reserve a temp path only; the image is written after the handle closes
+    # so the file is never opened twice at the same time.
     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
         composite_path = tmp.name
+    edited_image_path = None
+    try:
+        composite_pil.save(composite_path, "PNG")
+        # Image editing needs a model that can return images; this is the
+        # model the previous revision of this file used for the same task.
+        model = "gemini-2.0-flash-exp"
+        edited_image_path = generate(text=prompt, file_name=composite_path, model=model)
+        print("Generated image path: ", edited_image_path)
+        if not edited_image_path:
+            raise gr.Error("Image banane mein asamarth. Koshish karein dobara.")
+        with Image.open(edited_image_path) as generated:
+            # Image.open is lazy: copy() loads the pixels so the result stays
+            # valid after the temp file is removed below.
+            result_img = generated.copy()
+        return [result_img]
+    finally:
+        # Both temp files are created with delete=False; remove them here so
+        # they do not accumulate with every request.
+        for path in (composite_path, edited_image_path):
+            if path and os.path.exists(path):
+                os.remove(path)
+# Gradio Blocks interface: image upload and prompt on the left, result
+# gallery on the right, clickable examples underneath.
+with gr.Blocks(theme=gr.themes.Soft(primary_hue="sky")) as demo:
+    gr.Markdown(
     """
+    <div style='text-align: center; margin-bottom: 20px;'>
+      <h1 style='font-size: 2.5em; color: #333;'>🎨 AI Image Editor 🎨</h1>
+      <p style='font-size: 1.2em; color: #666;'>Upload an image and tell me how you want to change it.</p>
     </div>
     """
     )
+    # Examples shown in the interface; each entry is [input image, prompt].
     examples = [
+        ["assets/1.webp", 'change the text on the t-shirt to "AMEER"'],
+        ["assets/2.webp", "remove the spoon from the hand"],
+        ["assets/3.webp", 'change the text to "MAKE IT AWESOME"'],
+        ["assets/1.jpg", "apply a joker style makeup on the face"],
+        ["assets/1777043.jpg", "add cyberpunk neon lights in the background"],
+        ["assets/2807615.jpg", "add subtle red lipstick on the lips"],
     ]
+    # gr.Row takes no `gap` keyword; passing one fails when the layout is built.
+    with gr.Row():
+        with gr.Column(scale=1):
+            with gr.Group():
+                gr.Markdown("### 1. Upload Your Image")
+                image_input = gr.Image(
+                    type="pil",
+                    label="Image Input",
+                    height=400,
+                    image_mode="RGBA",
+                    show_label=False
+                )
+            with gr.Group():
+                gr.Markdown("### 2. Describe Your Edit")
+                prompt_input = gr.Textbox(
+                    lines=3,
+                    placeholder="e.g., 'remove the person in the background' or 'make the sky look like a sunset'",
+                    label="Prompt",
+                    show_label=False,
+                )
+            submit_btn = gr.Button("✨ Apply Edits", variant="primary", size="lg")
+        with gr.Column(scale=1):
+            with gr.Group():
+                gr.Markdown("### 3. See the Result")
+                output_gallery = gr.Gallery(
+                    label="Generated Output",
+                    height=500,
+                    show_label=False,
+                    preview=True
+                )
+    gr.Examples(
+        examples=examples,
+        inputs=[image_input, prompt_input],
+        outputs=output_gallery,
+        fn=process_image_and_prompt,
+        # Do not pre-compute example outputs: caching would call the remote
+        # API once per example at startup, and any failure there would stop
+        # the app from launching. Examples only fill the inputs when clicked.
+        cache_examples=False,
+        label="Or try one of these examples 👇"
+    )
     submit_btn.click(
         fn=process_image_and_prompt,
+        inputs=[image_input, prompt_input],
         outputs=output_gallery,
     )
+demo.launch(share=True, debug=True)