"""Gradio web UI for text-to-image generation with Kandinsky 2.1.

Loads the model once at import time, builds a two-tab Blocks interface and
launches it behind a request queue.
"""
import os
import random
import time

import gradio as gr
import torch
from PIL import Image
from torch import autocast

from kandinsky2 import get_kandinsky2

# Use CUDA when present instead of assuming it.
# NOTE(review): whether Kandinsky 2.1 actually runs on CPU depends on the
# kandinsky2 package (fp16 weights) -- TODO confirm.
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

# The cache location can be overridden through the environment; the default
# is the path this script was originally written against.
_DEFAULT_CACHE_DIR = '/media/agp/d58e0f56-1cd5-45af-938c-27e43b4fc343/kandinsky/tmp'

model = get_kandinsky2(
    device.type,
    task_type='text2img',
    cache_dir=os.environ.get('KANDINSKY_CACHE_DIR', _DEFAULT_CACHE_DIR),
    model_version='2.1',
    use_flash_attention=False,
)

# Reference generation settings kept from the original script:
#     num_steps=50,
#     batch_size=4,
#     guidance_scale=7,
#     h=768,
#     w=768,
#     sampler='ddim_sampler',
#     prior_cf_scale=1,
#     prior_steps='25',


#@title Images Generation
def infer(prompt, negative, h, w, batch_size, num_steps, guidance_scale, prior_cf_scale):
    """Generate images for *prompt* with the module-level Kandinsky model.

    Args:
        prompt: Text prompt describing the desired image.
        negative: Negative prompt; passed as both the prior and the decoder
            negative prompt.
        h: Image height; coerced to ``int``.
        w: Image width; coerced to ``int``.
        batch_size: Number of images to generate; coerced to ``int``.
        num_steps: Number of sampling steps; coerced to ``int``.
        guidance_scale: Guidance scale; coerced to ``int``.
        prior_cf_scale: Prior scale; coerced to ``int``.

    Returns:
        Whatever ``model.generate_text2img`` returns; it is handed straight to
        the gallery component.
    """
    # Gradio sliders may deliver floats, so every numeric input is cast.
    images = model.generate_text2img(
        prompt,
        negative_prior_prompt=negative,
        negative_decoder_prompt=negative,
        num_steps=int(num_steps),
        batch_size=int(batch_size),
        guidance_scale=int(guidance_scale),
        h=int(h),
        w=int(w),
        sampler='p_sampler',
        prior_cf_scale=int(prior_cf_scale),
        prior_steps='30',
    )
    return images


# NOTE(review): two spots in this stylesheet look wrong but are left untouched
# because fixing them would change the rendered layout:
#   * the extra "}" right after the @keyframes block appears to be stray and
#     probably makes browsers drop the following ".gr-form" rule;
#   * "min-height: 1860x" on #generated_id has no valid unit (px intended?).
css = """
        .gradio-container {
            font-family: 'IBM Plex Sans', sans-serif;
        }
        .gr-button {
            color: white;
            border-color: black;
            background: black;
        }
        input[type='range'] {
            accent-color: black;
        }
        .dark input[type='range'] {
            accent-color: #dfdfdf;
        }
        .container {
            max-width: 930px;
            margin: auto;
            padding-top: 1.5rem;
        }
        #gallery {
            min-height: 22rem;
            margin-bottom: 15px;
            margin-left: auto;
            margin-right: auto;
            border-bottom-right-radius: .5rem !important;
            border-bottom-left-radius: .5rem !important;
        }
        #gallery>div>.h-full {
            min-height: 20rem;
        }
        .details:hover {
            text-decoration: underline;
        }
        .gr-button {
            white-space: nowrap;
        }
        .gr-button:focus {
            border-color: rgb(147 197 253 / var(--tw-border-opacity));
            outline: none;
            box-shadow: var(--tw-ring-offset-shadow), var(--tw-ring-shadow), var(--tw-shadow, 0 0 #0000);
            --tw-border-opacity: 1;
            --tw-ring-offset-shadow: var(--tw-ring-inset) 0 0 0 var(--tw-ring-offset-width) var(--tw-ring-offset-color);
            --tw-ring-shadow: var(--tw-ring-inset) 0 0 0 calc(3px var(--tw-ring-offset-width)) var(--tw-ring-color);
            --tw-ring-color: rgb(191 219 254 / var(--tw-ring-opacity));
            --tw-ring-opacity: .5;
        }
        #advanced-btn {
            font-size: .7rem !important;
            line-height: 19px;
            margin-top: 12px;
            margin-bottom: 12px;
            padding: 2px 8px;
            border-radius: 14px !important;
        }
        #advanced-options {
            display: none;
            margin-bottom: 20px;
        }
        .footer {
            margin-bottom: 45px;
            margin-top: 35px;
            text-align: center;
            border-bottom: 1px solid #e5e5e5;
        }
        .footer>p {
            font-size: .8rem;
            display: inline-block;
            padding: 0 10px;
            transform: translateY(10px);
            background: white;
        }
        .dark .footer {
            border-color: #303030;
        }
        .dark .footer>p {
            background: #0b0f19;
        }
        .acknowledgments h4{
            margin: 1.25em 0 .25em 0;
            font-weight: bold;
            font-size: 115%;
        }
        #container-advanced-btns{
            display: flex;
            flex-wrap: wrap;
            justify-content: space-between;
            align-items: center;
        }
        .animate-spin {
            animation: spin 1s linear infinite;
        }
        @keyframes spin {
            from {
                transform: rotate(0deg);
            }
            to {
                transform: rotate(360deg);
            }
        }
        }
        .gr-form{
            flex: 1 1 50%; border-top-right-radius: 0; border-bottom-right-radius: 0;
        }
        #prompt-container{
            gap: 0;
        }
        #generated_id{
            min-height: 1860x
        }
"""

block = gr.Blocks(css=css)

#SPACE_ID = os.getenv('SPACE_ID')

with block as webui:
    gr.Markdown(""" """)

    with gr.Tab("text to image"):
        with gr.Group():
            with gr.Box():
                with gr.Row():
                    text = gr.Textbox(
                        label="Enter your prompt",
                        show_label=True,
                        max_lines=2,
                    )
                    negative = gr.Textbox(
                        label="Enter your negative prompt",
                        show_label=True,
                        max_lines=2,
                    )

                with gr.Row():
                    with gr.Accordion("Advanced image settings", open=False):
                        h = gr.Slider(
                            minimum=512,
                            maximum=1280,
                            step=64,
                            label="Height. Minimum 512px, maximum 1280px",
                        )
                        w = gr.Slider(
                            minimum=512,
                            maximum=1280,
                            step=64,
                            label="Width. Minimum 512px , Maximum 1280px",
                        )
                        # Label corrected to state the real lower bound (40);
                        # it previously claimed 30.
                        num_steps = gr.Slider(
                            minimum=40,
                            maximum=150,
                            step=5,
                            label="Number of Steps: Minimum 40, maximum 150",
                        )
                        batch_size = gr.Slider(
                            minimum=1,
                            maximum=8,
                            step=1,
                            label="Number of images to generate: Minimum 1, maximum 8",
                        )
                        guidance_scale = gr.Slider(
                            minimum=1,
                            maximum=20,
                            step=1,
                            label="Guidance scale. A high guidance scale means that the model should generate images that closely match the specified style or theme, while a low guidance scale allows the model to generate more diverse and original images",
                        )
                        prior_cf_scale = gr.Slider(
                            minimum=1,
                            maximum=20,
                            step=1,
                            label="Prior config scale.Overall, the prior config scale hyperparameter allows users to control the level of adherence to specified conditions in the generated images. A high prior config scale results in images that closely match the specified conditions, while a low prior config scale generates more diverse and creative images.",
                        )
                        #prior_steps = gr.Slider(minimum=1, maximum=50, step=1, label="Prior steps. Increasing the prior steps can result in more detailed and accurate output, but it can also make the model slower and more computationally expensive.")

                with gr.Row():
                    btn = gr.Button("Generate")

        gallery = gr.Gallery(
            label="Generated images",
            show_label=False,
            elem_id="generated_id",
        ).style(columns=[2], rows=[2], object_fit="contain", height="auto")

        # ex = gr.Examples(examples=examples, fn=infer, inputs=[text, negative], outputs=gallery, cache_examples=True)
        #ex.dataset.headers = [""]

        # Pressing Enter in the prompt box and clicking the button trigger the
        # same generation call, so both share one input list.
        infer_inputs = [text, negative, h, w, batch_size, num_steps, guidance_scale, prior_cf_scale]
        text.submit(infer, inputs=infer_inputs, outputs=gallery)
        btn.click(infer, inputs=infer_inputs, outputs=gallery)

    with gr.Tab("Flip Text"):
        gr.Markdown(""" text test """)

webui.queue(max_size=15).launch()