Spaces:

Shitao
/

OmniGen

Running on Zero

App Files Files Community

Shitao committed 4 days ago

Commit

d8e8827

•

1 Parent(s): 6aff343

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -9

app.py CHANGED Viewed

@@ -1,6 +1,7 @@
 import gradio as gr
 from PIL import Image
 import os
 import spaces
@@ -12,12 +13,15 @@ pipe = OmniGenPipeline.from_pretrained(
 @spaces.GPU(duration=160)
 def generate_image(text, img1, img2, img3, height, width, guidance_scale, img_guidance_scale, inference_steps, seed, separate_cfg_infer, offload_model,
-            use_input_image_size_as_output, max_input_image_size):
     input_images = [img1, img2, img3]
     # Delete None
     input_images = [img for img in input_images if img is not None]
     if len(input_images) == 0:
         input_images = None
     output = pipe(
         prompt=text,
@@ -270,9 +274,9 @@ def get_example():
     return case
 def run_for_examples(text, img1, img2, img3, height, width, guidance_scale, img_guidance_scale, inference_steps, seed, separate_cfg_infer, offload_model,
-            use_input_image_size_as_output, max_input_image_size):
     return generate_image(text, img1, img2, img3, height, width, guidance_scale, img_guidance_scale, inference_steps, seed, separate_cfg_infer, offload_model,
-            use_input_image_size_as_output, max_input_image_size)
 description = """
 OmniGen is a unified image generation model that you can use to perform various tasks, including but not limited to text-to-image generation, subject-driven generation, Identity-Preserving Generation, and image-conditioned generation.
@@ -281,11 +285,11 @@ For example, use an image of a woman to generate a new image:
 prompt = "A woman holds a bouquet of flowers and faces the camera. The woman is \<img\>\<|image_1|\>\</img\>."
 Tips:
-- For out of memory or time cost, you can refer to [inference.md#requiremented-resources](https://github.com/VectorSpaceLab/OmniGen/blob/main/docs/inference.md#requiremented-resources) to select a appropriate setting.
-- If time cost is too long, please try to reduce the `max_input_image_size`. More details please refer to [inference.md](https://github.com/VectorSpaceLab/OmniGen/blob/main/docs/inference.md#requiremented-resources)
 - Oversaturated: If the image appears oversaturated, please reduce the `guidance_scale`.
 - Not match the prompt: If the image does not match the prompt, please try to increase the `guidance_scale`.
-- Low-quality: More detailed prompt will lead to better results.
 - Animated style: If the generated images are in an animated style, you can try adding `photo` to the prompt.
 - Edit generated image: If you generate an image with OmniGen and then want to edit it, you cannot use the same seed for the edit. For example, if you used seed=0 to generate the image, use seed=1 to edit it.
 - For image editing tasks, we recommend placing the image before the editing instruction. For example, use `<img><|image_1|></img> remove suit`, rather than `remove suit <img><|image_1|></img>`.
@@ -353,6 +357,7 @@ with gr.Blocks() as demo:
             seed_input = gr.Slider(
                 label="Seed", minimum=0, maximum=2147483647, value=42, step=1
             )
             max_input_image_size = gr.Slider(
                 label="max_input_image_size", minimum=128, maximum=2048, value=1024, step=16
@@ -362,10 +367,10 @@ with gr.Blocks() as demo:
                 label="separate_cfg_infer", info="Whether to use separate inference process for different guidance. This will reduce the memory cost.", value=True,
             )
             offload_model = gr.Checkbox(
-                label="offload_model", info="Offload model to CPU, which will significantly reduce the memory cost but slow down the generation speed. You can cancle separate_cfg_infer and set offload_model=True. If both separate_cfg_infer and offload_model be True, further reduce the memory, but slowest generation", value=False,
             )
             use_input_image_size_as_output = gr.Checkbox(
-                label="use_input_image_size_as_output", info="Automatically adjust the output image size to be same as input image size. For editing and controlnet task, it can make sure the output image has the same size with input image leading to better performance", value=False,
             )
             # generate
@@ -394,6 +399,7 @@ with gr.Blocks() as demo:
             offload_model,
             use_input_image_size_as_output,
             max_input_image_size,
         ],
         outputs=output_image,
     )
@@ -423,4 +429,4 @@ with gr.Blocks() as demo:
     gr.Markdown(article)
 # launch
-demo.launch()

 import gradio as gr
 from PIL import Image
 import os
+import random
 import spaces
 @spaces.GPU(duration=160)
 def generate_image(text, img1, img2, img3, height, width, guidance_scale, img_guidance_scale, inference_steps, seed, separate_cfg_infer, offload_model,
+            use_input_image_size_as_output, max_input_image_size, randomize_seed):
     input_images = [img1, img2, img3]
     # Delete None
     input_images = [img for img in input_images if img is not None]
     if len(input_images) == 0:
         input_images = None
+    if randomize_seed:
+        seed = random.randint(0, 10000000)
     output = pipe(
         prompt=text,
     return case
 def run_for_examples(text, img1, img2, img3, height, width, guidance_scale, img_guidance_scale, inference_steps, seed, separate_cfg_infer, offload_model,
+            use_input_image_size_as_output, max_input_image_size, randomize_seed=False):
     return generate_image(text, img1, img2, img3, height, width, guidance_scale, img_guidance_scale, inference_steps, seed, separate_cfg_infer, offload_model,
+            use_input_image_size_as_output, max_input_image_size, randomize_seed=randomize_seed)
 description = """
 OmniGen is a unified image generation model that you can use to perform various tasks, including but not limited to text-to-image generation, subject-driven generation, Identity-Preserving Generation, and image-conditioned generation.
 prompt = "A woman holds a bouquet of flowers and faces the camera. The woman is \<img\>\<|image_1|\>\</img\>."
 Tips:
+- For out-of-memory errors or long inference time, you can set `offload_model=True` or refer to [./docs/inference.md#requiremented-resources](https://github.com/VectorSpaceLab/OmniGen/blob/main/docs/inference.md#requiremented-resources) to select an appropriate setting.
+- If inference time is too long when inputting multiple images, please try to reduce the `max_input_image_size`. For more details, please refer to [./docs/inference.md#requiremented-resources](https://github.com/VectorSpaceLab/OmniGen/blob/main/docs/inference.md#requiremented-resources).
 - Oversaturated: If the image appears oversaturated, please reduce the `guidance_scale`.
 - Not match the prompt: If the image does not match the prompt, please try to increase the `guidance_scale`.
+- Low-quality: More detailed prompts will lead to better results.
 - Animated style: If the generated images are in an animated style, you can try adding `photo` to the prompt.
 - Edit generated image: If you generate an image with OmniGen and then want to edit it, you cannot use the same seed for the edit. For example, if you used seed=0 to generate the image, use seed=1 to edit it.
 - For image editing tasks, we recommend placing the image before the editing instruction. For example, use `<img><|image_1|></img> remove suit`, rather than `remove suit <img><|image_1|></img>`.
             seed_input = gr.Slider(
                 label="Seed", minimum=0, maximum=2147483647, value=42, step=1
             )
+            randomize_seed = gr.Checkbox(label="Randomize seed", value=True)
             max_input_image_size = gr.Slider(
                 label="max_input_image_size", minimum=128, maximum=2048, value=1024, step=16
                 label="separate_cfg_infer", info="Whether to use separate inference process for different guidance. This will reduce the memory cost.", value=True,
             )
             offload_model = gr.Checkbox(
+                label="offload_model", info="Offload model to CPU, which will significantly reduce the memory cost but slow down the generation speed. You can cancel separate_cfg_infer and set offload_model=True. If both separate_cfg_infer and offload_model are True, further reduce the memory, but slowest generation", value=False,
             )
             use_input_image_size_as_output = gr.Checkbox(
+                label="use_input_image_size_as_output", info="Automatically adjust the output image size to be same as input image size. For editing and controlnet task, it can make sure the output image has the same size as input image leading to better performance", value=False,
             )
             # generate
             offload_model,
             use_input_image_size_as_output,
             max_input_image_size,
+            randomize_seed,
         ],
         outputs=output_image,
     )
     gr.Markdown(article)
 # launch
+demo.launch()