ezmary-image-edit

Running

App Files Files Community

Hamed744 committed 13 days ago

Commit

e570148

verified ·

1 Parent(s): a9acc0c

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -66

app.py CHANGED Viewed

@@ -24,13 +24,7 @@ def translate_prompt_to_english(text, api_key, model="gemini-2.0-flash-exp"):
     client = genai.Client(api_key=api_key.strip())
-    pre_prompt = (
-        "Translate the following text to English accurately and naturally, as a native English speaker would phrase it. "
-        "The text could be in Persian (Farsi), Urdu, Pashto, Arabic, Kurdish, or other languages. "
-        "Keep the translation concise and clear, avoiding unnecessary words or literal translations. "
-        "For example, if the Persian text is 'متن را به \"امیر\" تغییر بده', translate it to 'Change the text to \"Amir\"'. "
-        "Do not include any additional explanations or context in the translation."
-    )
     full_text = pre_prompt + "\n" + text
     contents = [
@@ -65,11 +59,7 @@ def generate_with_api(api_key, text, file_name, model="gemini-2.0-flash-exp"):
     client = genai.Client(api_key=api_key.strip())
     files = [client.files.upload(file=file_name)]
-    pre_prompt = (
-        "The following instruction is in English. Process it carefully. "
-        "Ensure the new text matches the style, font, and position of the original text as closely as possible. Generate an edited image with the changes applied."
-    )
-    full_text = pre_prompt + "\n" + text
     contents = [
         types.Content(
@@ -88,11 +78,9 @@ def generate_with_api(api_key, text, file_name, model="gemini-2.0-flash-exp"):
         top_p=0.95,
         top_k=40,
         max_output_tokens=8192,
-        response_modalities=["image", "text"],
-        response_mime_type="text/plain",
     )
-    text_response = ""
     image_path = None
     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
         temp_path = tmp.name
@@ -108,11 +96,9 @@ def generate_with_api(api_key, text, file_name, model="gemini-2.0-flash-exp"):
                 save_binary_file(temp_path, candidate.inline_data.data)
                 image_path = temp_path
                 break
-            else:
-                text_response += chunk.text + "\n"
     del files
-    return image_path, text_response
 def process_single_api(api_key, prompt, file_name, model):
     if not api_key:
@@ -120,14 +106,14 @@ def process_single_api(api_key, prompt, file_name, model):
     try:
         translated_prompt = translate_prompt_to_english(prompt, api_key, model)
-        image_path, text_response = generate_with_api(api_key, translated_prompt, file_name, model)
         if image_path:
             result_img = Image.open(image_path)
             if result_img.mode == "RGBA":
                 result_img = result_img.convert("RGB")
             return result_img, ""
-        return None, text_response if text_response else "No image generated"
     except Exception as e:
         return None, f"Error with API {api_key[-4:]}: {str(e)}"
@@ -149,7 +135,6 @@ def process_image_and_prompt(composite_pil, prompt):
         result_images = []
         error_messages = []
-        # اجرای همزمان با 4 thread (هر API در یک thread جدا)
         with concurrent.futures.ThreadPoolExecutor(max_workers=4) as executor:
             futures = {
                 executor.submit(
@@ -168,12 +153,12 @@ def process_image_and_prompt(composite_pil, prompt):
         os.unlink(composite_path)
         if not result_images:
-            return None, "\n".join(error_messages) + "\n\n**توجه**: اگر تصویر تولید نشد، لطفاً دستور خود را واضح‌تر بنویسید یا دوباره امتحان کنید."
         return result_images, ""
     except Exception as e:
-        raise gr.Error(f"خطا در پردازش: {e}", duration=5)
 css = """
 footer { visibility: hidden; }
@@ -183,7 +168,7 @@ display: none !important;
 }
 """
-with gr.Blocks(css_paths="style.css", css=css) as demo:
     gr.HTML(
     """
     <div class="header-container">
@@ -197,48 +182,30 @@ with gr.Blocks(css_paths="style.css", css=css) as demo:
     """
     )
-    with gr.Accordion("⚠️ راهنمای استفاده", open=False, elem_classes="config-accordion"):
         gr.Markdown("""
-        ### راهنمای استفاده
-        - تصویر خود را آپلود کرده و دستور ویرایش را وارد کنید
-        - در صورت بروز خطا، پیام مربوطه نمایش داده خواهد شد
-        - فقط تصاویر با فرمت PNG آپلود کنید
-        - از آپلود تصاویر نامناسب خودداری کنید
         """)
-    with gr.Accordion("📌 دستورالعمل‌های ویرایش", open=False, elem_classes="instructions-accordion"):
-        gr.Markdown("""
-        ### نمونه دستورات ویرایش
-        - متن تصویر را به \"متن جدید\" تغییر بده
-        - شیء خاصی را از تصویر حذف کن
-        - استایل خاصی به بخشی از تصویر اضافه کن
-        - تغییرات رنگی روی تصویر اعمال کن
-        """)
-    with gr.Row(elem_classes="main-content"):
-        with gr.Column(elem_classes="input-column"):
             image_input = gr.Image(
                 type="pil",
                 label="تصویر را آپلود کنید",
-                image_mode="RGBA",
-                elem_id="image-input",
-                elem_classes="upload-box"
             )
             prompt_input = gr.Textbox(
                 lines=2,
-                placeholder="تصویر چیکار بشه؟ اینجا بنویسید...",
-                label="دستور ویرایش",
-                elem_classes="prompt-input"
             )
-            submit_btn = gr.Button("اعمال تغییرات", elem_classes="generate-btn")
-        with gr.Column(elem_classes="output-column"):
-            output_gallery = gr.Gallery(label="تصاویر ویرایش شده", elem_classes="output-gallery")
-            output_text = gr.Textbox(
-                label="پیام سیستم",
-                placeholder="در صورت بروز خطا، پیام مربوطه اینجا نمایش داده می‌شود.",
-                elem_classes="output-text"
-            )
     submit_btn.click(
         fn=process_image_and_prompt,
@@ -246,23 +213,15 @@ with gr.Blocks(css_paths="style.css", css=css) as demo:
         outputs=[output_gallery, output_text],
     )
-    gr.Markdown("## نمونه‌های آماده", elem_classes="gr-examples-header")
     examples = [
-        ["data/1.webp", 'متن را به "امیر" تغییر بده', ""],
-        ["data/2.webp", "قاشق را از دست حذف کن", ""],
-        ["data/3.webp", 'متن را به "بساز" تغییر بده', ""],
-        ["data/1.jpg", "فقط روی صورت استایل جوکر اضافه کن", ""],
-        ["data/1777043.jpg", "فقط روی صورت استایل جوکر اضافه کن", ""],
-        ["data/2807615.jpg", "فقط روی لب‌ها رژ لب اضافه کن", ""],
-        ["data/76860.jpg", "فقط روی لب‌ها رژ لب اضافه کن", ""],
-        ["data/2807615.jpg", "فقط صورت را شادتر کن", ""],
     ]
     gr.Examples(
         examples=examples,
         inputs=[image_input, prompt_input],
-        elem_id="examples-grid"
     )
 demo.queue(max_size=50).launch()

     client = genai.Client(api_key=api_key.strip())
+    pre_prompt = "Translate this to English accurately:"
     full_text = pre_prompt + "\n" + text
     contents = [
     client = genai.Client(api_key=api_key.strip())
     files = [client.files.upload(file=file_name)]
+    full_text = "Apply this edit to the image: " + text
     contents = [
         types.Content(
         top_p=0.95,
         top_k=40,
         max_output_tokens=8192,
+        response_modalities=["image"],
     )
     image_path = None
     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
         temp_path = tmp.name
                 save_binary_file(temp_path, candidate.inline_data.data)
                 image_path = temp_path
                 break
     del files
+    return image_path, ""
 def process_single_api(api_key, prompt, file_name, model):
     if not api_key:
     try:
         translated_prompt = translate_prompt_to_english(prompt, api_key, model)
+        image_path, _ = generate_with_api(api_key, translated_prompt, file_name, model)
         if image_path:
             result_img = Image.open(image_path)
             if result_img.mode == "RGBA":
                 result_img = result_img.convert("RGB")
             return result_img, ""
+        return None, "No image generated"
     except Exception as e:
         return None, f"Error with API {api_key[-4:]}: {str(e)}"
         result_images = []
         error_messages = []
         with concurrent.futures.ThreadPoolExecutor(max_workers=4) as executor:
             futures = {
                 executor.submit(
         os.unlink(composite_path)
         if not result_images:
+            return None, "\n".join(error_messages)
         return result_images, ""
     except Exception as e:
+        raise gr.Error(f"خطا در پردازش: {e}")
 css = """
 footer { visibility: hidden; }
 }
 """
+with gr.Blocks(css=css) as demo:
     gr.HTML(
     """
     <div class="header-container">
     """
     )
+    with gr.Accordion("⚠️ راهنمای استفاده", open=False):
         gr.Markdown("""
+        - تصویر خود را آپلود کنید
+        - دستور ویرایش را وارد کنید
+        - نتیجه را دریافت نمایید
         """)
+    with gr.Row():
+        with gr.Column():
             image_input = gr.Image(
                 type="pil",
                 label="تصویر را آپلود کنید",
+                image_mode="RGBA"
             )
             prompt_input = gr.Textbox(
                 lines=2,
+                placeholder="دستور ویرایش خود را وارد کنید...",
+                label="دستور ویرایش"
             )
+            submit_btn = gr.Button("اعمال تغییرات")
+        with gr.Column():
+            output_gallery = gr.Gallery(label="نتایج")
+            output_text = gr.Textbox(label="پیام سیستم")
     submit_btn.click(
         fn=process_image_and_prompt,
         outputs=[output_gallery, output_text],
     )
     examples = [
+        ["data/1.webp", 'متن را به "امیر" تغییر بده'],
+        ["data/2.webp", "قاشق را از دست حذف کن"],
+        ["data/3.webp", 'متن را به "بساز" تغییر بده'],
     ]
     gr.Examples(
         examples=examples,
         inputs=[image_input, prompt_input],
     )
 demo.queue(max_size=50).launch()