Hamed744 committed (verified)
Commit c0e2510 · 1 Parent(s): 7356cac

Update app.py

Files changed (1): app.py (+174 -137)
app.py CHANGED
@@ -1,144 +1,141 @@
  import json
  import os
+ import time
+ import uuid
  import tempfile
- from PIL import Image
+ from PIL import Image, ImageDraw, ImageFont
  import gradio as gr
+ import base64
+ import mimetypes
  from google import genai
  from google.genai import types
  import concurrent.futures
+ import langdetect

  def save_binary_file(file_name, data):
      with open(file_name, "wb") as f:
          f.write(data)

- def needs_translation(text):
-     # Simple check for non-English characters (Persian, Arabic, Urdu, etc.)
-     non_english_chars = set("ءآأؤإئابةتثجحخدذرزسشصضطظعغفقكلمنهوىيپچژکگی")
-     return any(char in non_english_chars for char in text)
-
- def translate_prompt(text, api_key, model="gemini-2.0-flash-exp"):
+ def translate_prompt_to_english(text, api_key, model="gemini-2.0-flash-exp"):
+     # Detect the language of the input text
      try:
-         client = genai.Client(api_key=api_key.strip())
-
-         pre_prompt = (
-             "Translate the following text to English accurately and naturally. "
-             "Keep the translation concise and clear. "
-             "Do not include any additional explanations or context in the translation."
-         )
-         full_text = pre_prompt + "\n" + text
-
-         contents = [
-             types.Content(
-                 role="user",
-                 parts=[types.Part.from_text(text=full_text)],
-             ),
-         ]
-
-         generate_content_config = types.GenerateContentConfig(
-             temperature=0.5,
-             top_p=0.9,
-             top_k=40,
-             max_output_tokens=8192,
-             response_mime_type="text/plain",
-         )
-
-         text_response = ""
+         detected_lang = langdetect.detect(text)
+         # If the language is English, return the text as is
+         if detected_lang == "en":
+             return text
+     except:
+         pass
+
+     client = genai.Client(api_key=api_key.strip())
+
+     pre_prompt = (
+         "Translate the following text to English accurately and naturally, as a native English speaker would phrase it. "
+         "Keep the translation concise and clear, avoiding unnecessary words or literal translations. "
+         "For example, if the text is 'متن را به \"امیر\" تغییر بده', translate it to 'Change the text to \"Amir\"'. "
+         "Do not include any additional explanations or context in the translation."
+     )
+     full_text = pre_prompt + "\n" + text
+
+     contents = [
+         types.Content(
+             role="user",
+             parts=[
+                 types.Part.from_text(text=full_text),
+             ],
+         ),
+     ]
+     generate_content_config = types.GenerateContentConfig(
+         temperature=0.5,
+         top_p=0.9,
+         top_k=40,
+         max_output_tokens=8192,
+         response_mime_type="text/plain",
+     )
+
+     text_response = ""
+     for chunk in client.models.generate_content_stream(
+         model=model,
+         contents=contents,
+         config=generate_content_config,
+     ):
+         if not chunk.candidates or not chunk.candidates[0].content or not chunk.candidates[0].content.parts:
+             continue
+         text_response += chunk.text + "\n"
+
+     return text_response.strip()
+
+ def generate_with_api(api_key, text, file_name, model="gemini-2.0-flash-exp"):
+     client = genai.Client(api_key=api_key.strip())
+     files = [client.files.upload(file=file_name)]
+
+     pre_prompt = (
+         "The following instruction is in English. Process it carefully. "
+         "Your task is to edit the image based on the instruction. If the instruction asks to change the text in the image, identify the existing text in the image and replace it with the new text specified in the instruction. "
+         "For example, if the instruction says 'Change the text to \"Amir\"', find the text in the image (e.g., 'HONEY') and replace it with 'Amir'. Do not use the instruction text itself as the new text. "
+         "Ensure the new text matches the style, font, and position of the original text as closely as possible. Generate an edited image with the changes applied."
+     )
+     full_text = pre_prompt + "\n" + text
+
+     contents = [
+         types.Content(
+             role="user",
+             parts=[
+                 types.Part.from_uri(
+                     file_uri=files[0].uri,
+                     mime_type=files[0].mime_type,
+                 ),
+                 types.Part.from_text(text=full_text),
+             ],
+         ),
+     ]
+     generate_content_config = types.GenerateContentConfig(
+         temperature=1,
+         top_p=0.95,
+         top_k=40,
+         max_output_tokens=8192,
+         response_modalities=["image", "text"],
+         response_mime_type="text/plain",
+     )
+
+     text_response = ""
+     image_path = None
+     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
+         temp_path = tmp.name
      for chunk in client.models.generate_content_stream(
          model=model,
          contents=contents,
          config=generate_content_config,
      ):
-         if chunk.candidates and chunk.candidates[0].content and chunk.candidates[0].content.parts:
+         if not chunk.candidates or not chunk.candidates[0].content or not chunk.candidates[0].content.parts:
+             continue
+         candidate = chunk.candidates[0].content.parts[0]
+         if candidate.inline_data:
+             save_binary_file(temp_path, candidate.inline_data.data)
+             image_path = temp_path
+             break
+         else:
              text_response += chunk.text + "\n"

-     return text_response.strip()
-
-     except Exception as e:
-         print(f"Translation error: {str(e)}")
-         return text
-
- def generate_with_api(api_key, text, file_name, model="gemini-2.0-flash-exp"):
-     try:
-         client = genai.Client(api_key=api_key.strip())
-         files = [client.files.upload(file=file_name)]
-
-         pre_prompt = (
-             "The following instruction is in English. Process it carefully. "
-             "Your task is to edit the image based on the instruction. "
-             "If the instruction asks to change text in the image, identify the existing text and replace it. "
-             "Ensure the new text matches the style, font, and position of the original text."
-         )
-         full_text = pre_prompt + "\n" + text
-
-         contents = [
-             types.Content(
-                 role="user",
-                 parts=[
-                     types.Part.from_uri(
-                         file_uri=files[0].uri,
-                         mime_type=files[0].mime_type,
-                     ),
-                     types.Part.from_text(text=full_text),
-                 ],
-             ),
-         ]
-
-         generate_content_config = types.GenerateContentConfig(
-             temperature=1,
-             top_p=0.95,
-             top_k=40,
-             max_output_tokens=8192,
-             response_modalities=["image", "text"],
-             response_mime_type="text/plain",
-         )
-
-         with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
-             temp_path = tmp.name
-         for chunk in client.models.generate_content_stream(
-             model=model,
-             contents=contents,
-             config=generate_content_config,
-         ):
-             if chunk.candidates and chunk.candidates[0].content and chunk.candidates[0].content.parts:
-                 candidate = chunk.candidates[0].content.parts[0]
-                 if candidate.inline_data:
-                     save_binary_file(temp_path, candidate.inline_data.data)
-                     return temp_path, ""
-                 elif candidate.text:
-                     return None, candidate.text
-
-         return None, "No response from API"
-
-     except Exception as e:
-         return None, f"API Error: {str(e)}"
-     finally:
-         if 'files' in locals():
-             del files
+     del files
+     return image_path, text_response

  def process_single_api(api_key, prompt, file_name, model):
      if not api_key:
          return None, "API key not provided"

      try:
-         # Check if translation is needed
-         if needs_translation(prompt):
-             processed_prompt = translate_prompt(prompt, api_key, model)
-         else:
-             processed_prompt = prompt
-
-         # Generate image with dedicated API
-         image_path, text_response = generate_with_api(api_key, processed_prompt, file_name, model)
+         translated_prompt = translate_prompt_to_english(prompt, api_key, model)
+         image_path, text_response = generate_with_api(api_key, translated_prompt, file_name, model)

          if image_path:
              result_img = Image.open(image_path)
              if result_img.mode == "RGBA":
                  result_img = result_img.convert("RGB")
              return result_img, ""
-
          return None, text_response if text_response else "No image generated"

      except Exception as e:
-         return None, f"Processing Error: {str(e)}"
+         return None, f"Error with API {api_key[-4:]}: {str(e)}"

  def process_image_and_prompt(composite_pil, prompt):
      try:
@@ -157,13 +154,13 @@ def process_image_and_prompt(composite_pil, prompt):
          result_images = []
          error_messages = []

-         # Fully parallel and independent API execution
+         # اجرای همزمان با 4 thread (هر API در یک thread جدا)
          with concurrent.futures.ThreadPoolExecutor(max_workers=4) as executor:
              futures = {
                  executor.submit(
                      process_single_api,
                      api_key, prompt, composite_path, model
-                 ): api_key[-4:] for api_key in api_keys if api_key
+                 ): api_key for api_key in api_keys
              }

              for future in concurrent.futures.as_completed(futures):
@@ -171,18 +168,17 @@ def process_image_and_prompt(composite_pil, prompt):
                  if image:
                      result_images.append(image)
                  if error:
-                     error_messages.append(f"API {futures[future]}: {error}")
+                     error_messages.append(error)

          os.unlink(composite_path)

          if not result_images:
-             error_msg = "\n".join(error_messages) if error_messages else "All APIs failed without specific errors"
-             return None, f"{error_msg}\n\nPlease check your command and try again."
+             return None, "\n".join(error_messages) + "\n\n**توجه**: اگر تصویر تولید نشد، لطفاً دستور خود را واضح‌تر بنویسید یا دوباره امتحان کنید."

          return result_images, ""

      except Exception as e:
-         return None, f"System Error: {str(e)}"
+         raise gr.Error(f"خطا در پردازش: {e}", duration=5)

  css = """
  footer { visibility: hidden; }
@@ -192,45 +188,86 @@ display: none !important;
  }
  """

- with gr.Blocks(css=css) as demo:
-     gr.HTML("""
+ with gr.Blocks(css_paths="style.css", css=css) as demo:
+     gr.HTML(
+         """
          <div class="header-container">
-             <div><img src="https://uploadkon.ir/uploads/4a3e22_25IMG-%DB%B2%DB%B0%DB%B2%DB%B5%DB%B0%DB%B3%DB%B2%DB%B2-%DB%B1%DB%B7%DB%B1%DB%B8%DB%B5%DB%B2.jpg" alt="Alfa AI logo"></div>
-             <div><h1>ویرایش جادویی تصاویر با هوش مصنوعی آلفا</h1></div>
+             <div>
+                 <img src="https://uploadkon.ir/uploads/4a3e22_25IMG-%DB%B2%DB%B0%DB%B2%DB%B5%DB%B0%DB%B3%DB%B2%DB%B2-%DB%B1%DB%B7%DB%B1%DB%B8%DB%B5%DB%B2.jpg" alt="Alfa AI logo">
+             </div>
+             <div>
+                 <h1>ویرایش جادویی تصاویر با هوش مصنوعی آلفا</h1>
+             </div>
          </div>
-     """)
+         """
+     )

-     with gr.Accordion("⚠️ راهنمای استفاده", open=False):
+     with gr.Accordion("⚠️ راهنمای استفاده", open=False, elem_classes="config-accordion"):
          gr.Markdown("""
          ### راهنمای استفاده
          - تصویر خود را آپلود کرده و دستور ویرایش را وارد کنید
-         - سیستم به طور خودکار زبان دستور شما را تشخیص می‌دهد
-         - هر تصویر نتیجه از یک API مستقل تولید می‌شود
+         - در صورت بروز خطا، پیام مربوطه نمایش داده خواهد شد
+         - فقط تصاویر با فرمت PNG آپلود کنید
+         - از آپلود تصاویر نامناسب خودداری کنید
+         """)
+
+     with gr.Accordion("📌 دستورالعمل‌های ویرایش", open=False, elem_classes="instructions-accordion"):
+         gr.Markdown("""
+         ### نمونه دستورات ویرایش
+         - متن تصویر را به \"متن جدید\" تغییر بده
+         - شیء خاصی را از تصویر حذف کن
+         - استایل خاصی به بخشی از تصویر اضافه کن
+         - تغییرات رنگی روی تصویر اعمال کن
          """)

-     with gr.Row():
-         with gr.Column():
-             image_input = gr.Image(type="pil", label="تصویر را آپلود کنید", image_mode="RGBA")
-             prompt_input = gr.Textbox(lines=2, placeholder="دستور ویرایش (هر زبانی)...", label="دستور ویرایش")
-             submit_btn = gr.Button("اعمال تغییرات")
+     with gr.Row(elem_classes="main-content"):
+         with gr.Column(elem_classes="input-column"):
+             image_input = gr.Image(
+                 type="pil",
+                 label="تصویر را آپلود کنید",
+                 image_mode="RGBA",
+                 elem_id="image-input",
+                 elem_classes="upload-box"
+             )
+             prompt_input = gr.Textbox(
+                 lines=2,
+                 placeholder="تصویر چیکار بشه؟ اینجا بنویسید...",
+                 label="دستور ویرایش",
+                 elem_classes="prompt-input"
+             )
+             submit_btn = gr.Button("اعمال تغییرات", elem_classes="generate-btn")

-         with gr.Column():
-             output_gallery = gr.Gallery(label="تصاویر ویرایش شده")
-             output_text = gr.Textbox(label="پیام سیستم")
+         with gr.Column(elem_classes="output-column"):
+             output_gallery = gr.Gallery(label="تصاویر ویرایش شده", elem_classes="output-gallery")
+             output_text = gr.Textbox(
+                 label="پیام سیستم",
+                 placeholder="در صورت بروز خطا، پیام مربوطه اینجا نمایش داده می‌شود.",
+                 elem_classes="output-text"
+             )

      submit_btn.click(
-         process_image_and_prompt,
+         fn=process_image_and_prompt,
          inputs=[image_input, prompt_input],
-         outputs=[output_gallery, output_text]
+         outputs=[output_gallery, output_text],
      )

+     gr.Markdown("## نمونه‌های آماده", elem_classes="gr-examples-header")
+
+     examples = [
+         ["data/1.webp", 'متن را به "امیر" تغییر بده', ""],
+         ["data/2.webp", "قاشق را از دست حذف کن", ""],
+         ["data/3.webp", 'متن را به "بساز" تغییر بده', ""],
+         ["data/1.jpg", "فقط روی صورت استایل جوکر اضافه کن", ""],
+         ["data/1777043.jpg", "فقط روی صورت استایل جوکر اضافه کن", ""],
+         ["data/2807615.jpg", "فقط روی لب‌ها رژ لب اضافه کن", ""],
+         ["data/76860.jpg", "فقط روی لب‌ها رژ لب اضافه کن", ""],
+         ["data/2807615.jpg", "فقط صورت را شادتر کن", ""],
+     ]
+
      gr.Examples(
-         examples=[
-             ["examples/1.jpg", "متن را به 'سلام' تغییر بده"],
-             ["examples/2.jpg", "Change the text to 'Hello'"],
-             ["examples/3.jpg", "حذف شیء قرمز رنگ از تصویر"],
-         ],
-         inputs=[image_input, prompt_input]
+         examples=examples,
+         inputs=[image_input, prompt_input],
+         elem_id="examples-grid"
      )

- demo.queue(concurrency_count=4).launch()
+ demo.queue(max_size=50).launch()
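
The substantive change in this commit is the prompt-translation path: the character-set heuristic needs_translation() is dropped in favour of langdetect, so a prompt is routed through the Gemini translation call only when it is not detected as English (or when detection fails). Below is a minimal sketch of that short-circuit, assuming langdetect is installed (pip install langdetect); the helper name should_translate is illustrative and does not exist in app.py.

import langdetect

# Illustrative sketch, not part of app.py: mirrors the detection short-circuit
# that translate_prompt_to_english() performs before calling Gemini.
def should_translate(prompt: str) -> bool:
    # langdetect returns a language code such as "en" or "fa" (Persian).
    try:
        return langdetect.detect(prompt) != "en"
    except Exception:
        # Empty or very short prompts can be undetectable; like the bare
        # except/pass in translate_prompt_to_english, fall through and let
        # the model handle translation.
        return True

if __name__ == "__main__":
    print(should_translate("Change the text to 'Hello'"))   # expected: False
    print(should_translate('متن را به "امیر" تغییر بده'))     # expected: True

The closing change from demo.queue(concurrency_count=4) to demo.queue(max_size=50) is consistent with recent Gradio releases (4.x and later), where queue() no longer accepts concurrency_count; if per-event concurrency needs to be capped, that is done with the concurrency_limit argument on event listeners instead.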