Surn committed on
Commit 650c805 · 1 Parent(s): 061d802

Working Version with negative prompts and dynamic trigger words

utils/ai_generator.py ADDED
@@ -0,0 +1,169 @@
+# utils/ai_generator.py
+
+import os
+import time  # Used for retry delays between attempts
+import torch
+import random
+from utils.ai_generator_diffusers_flux import generate_ai_image_local
+from pathlib import Path
+from huggingface_hub import InferenceClient
+import requests
+import io
+from PIL import Image
+from tempfile import NamedTemporaryFile
+import utils.constants as constants
+
+def generate_image_from_text(text, model_name="flax-community/dalle-mini", image_width=768, image_height=512):
+    # Initialize the InferenceClient; the client object is not callable directly,
+    # and text_to_image() returns a PIL image, not an HTTP response.
+    client = InferenceClient()
+    image = client.text_to_image(text, model=model_name)
+    # Resize the image to the requested dimensions
+    return image.resize((image_width, image_height))
+
+def generate_ai_image(
+    map_option,
+    prompt_textbox_value,
+    neg_prompt_textbox_value,
+    model,
+    lora_weights=None,
+    *args,
+    **kwargs
+):
+    seed = random.randint(1, 99999)
+    if torch.cuda.is_available():
+        print("Local GPU available. Generating image locally.")
+        return generate_ai_image_local(
+            map_option,
+            prompt_textbox_value,
+            neg_prompt_textbox_value,
+            model,
+            lora_weights=lora_weights,
+            seed=seed
+        )
+    else:
+        print("No local GPU available. Sending request to Hugging Face API.")
+        return generate_ai_image_remote(
+            map_option,
+            prompt_textbox_value,
+            neg_prompt_textbox_value,
+            model
+        )
+
+def generate_ai_image_remote(map_option, prompt_textbox_value, neg_prompt_textbox_value, model, height=512, width=896, num_inference_steps=50, guidance_scale=3.5, seed=777):
+    max_retries = 3
+    retry_delay = 4  # Initial delay in seconds
+
+    try:
+        if map_option != "Prompt":
+            prompt = constants.PROMPTS[map_option]
+            # Convert the negative prompt string to a list
+            negative_prompt_str = constants.NEGATIVE_PROMPTS.get(map_option, "")
+            negative_prompt = [p.strip() for p in negative_prompt_str.split(',') if p.strip()]
+        else:
+            prompt = prompt_textbox_value
+            # Convert the negative prompt string to a list
+            negative_prompt = [p.strip() for p in neg_prompt_textbox_value.split(',') if p.strip()] if neg_prompt_textbox_value else []
+
+        print("Remotely generating image with the following parameters:")
+        print(f"Prompt: {prompt}")
+        print(f"Negative Prompt: {negative_prompt}")
+        print(f"Height: {height}")
+        print(f"Width: {width}")
+        print(f"Number of Inference Steps: {num_inference_steps}")
+        print(f"Guidance Scale: {guidance_scale}")
+        print(f"Seed: {seed}")
+
+        for attempt in range(1, max_retries + 1):
+            try:
+                if os.getenv("IS_SHARED_SPACE") == "True":
+                    client = InferenceClient(
+                        model,
+                        token=constants.HF_API_TOKEN
+                    )
+                    # text_to_image() takes keyword arguments rather than a raw
+                    # JSON payload, and returns a PIL image directly.
+                    image = client.text_to_image(
+                        prompt,
+                        negative_prompt=", ".join(negative_prompt) if negative_prompt else None,
+                        height=height,
+                        width=width,
+                        num_inference_steps=num_inference_steps,
+                        guidance_scale=guidance_scale
+                        # Optional: add 'scheduler' and 'seed' if the backend supports them
+                    )
+                    break  # Exit the retry loop on success
+                else:
+                    API_URL = f"https://api-inference.huggingface.co/models/{model}"
+                    headers = {
+                        "Authorization": f"Bearer {constants.HF_API_TOKEN}",
+                        "Content-Type": "application/json"
+                    }
+                    payload = {
+                        "inputs": prompt,
+                        "parameters": {
+                            "negative_prompt": ", ".join(negative_prompt),
+                            "guidance_scale": guidance_scale,
+                            "num_inference_steps": num_inference_steps,
+                            "width": width,
+                            "height": height,
+                            "max_sequence_length": 512,
+                            # Optional: Add 'scheduler' if needed
+                            "seed": seed
+                        }
+                    }
+
+                    print(f"Attempt {attempt}: Sending POST request to Hugging Face API...")
+                    response = requests.post(API_URL, headers=headers, json=payload, timeout=300)  # 300-second timeout
+                    if response.status_code == 200:
+                        image_bytes = response.content
+                        image = Image.open(io.BytesIO(image_bytes))
+                        break  # Exit the retry loop on success
+                    elif response.status_code == 400:
+                        # Handle 400 Bad Request specifically
+                        print(f"Bad Request (400): {response.text}")
+                        print("Check your request parameters and payload format.")
+                        return None  # Do not retry on 400 errors
+                    elif response.status_code in [429, 504]:
+                        print(f"Received status code {response.status_code}. Retrying in {retry_delay} seconds...")
+                        if attempt < max_retries:
+                            time.sleep(retry_delay)
+                            retry_delay *= 2  # Exponential backoff
+                        else:
+                            response.raise_for_status()  # Raise exception after max retries
+                    else:
+                        print(f"Received unexpected status code {response.status_code}: {response.text}")
+                        response.raise_for_status()
+            except (requests.exceptions.ReadTimeout, requests.exceptions.ConnectTimeout) as timeout_error:
+                print(f"Timeout occurred: {timeout_error}. Retrying in {retry_delay} seconds...")
+                if attempt < max_retries:
+                    time.sleep(retry_delay)
+                    retry_delay *= 2  # Exponential backoff
+                else:
+                    raise  # Re-raise the exception after max retries
+            except requests.exceptions.RequestException as req_error:
+                print(f"Request exception: {req_error}. Retrying in {retry_delay} seconds...")
+                if attempt < max_retries:
+                    time.sleep(retry_delay)
+                    retry_delay *= 2  # Exponential backoff
+                else:
+                    raise  # Re-raise the exception after max retries
+        else:
+            # The loop ran out of attempts without a successful break
+            print("Max retries exceeded. Failed to generate image.")
+            return None
+
+        with NamedTemporaryFile(delete=False, suffix=".png") as tmp:
+            image.save(tmp.name, format="PNG")
+            constants.temp_files.append(tmp.name)
+            print(f"Image saved to {tmp.name}")
+            return tmp.name
+
+    except Exception as e:
+        print(f"Error generating AI image: {e}")
+        return None
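
For reference, a minimal usage sketch of the dispatcher above (the prompt strings are illustrative; generate_ai_image() takes the local diffusers path when CUDA is available and otherwise falls back to the Inference API):

    from utils.ai_generator import generate_ai_image

    # map_option="Prompt" makes the function use the textbox values instead of
    # the canned constants.PROMPTS entries.
    path = generate_ai_image(
        map_option="Prompt",
        prompt_textbox_value="hexagon tabletop map, top-down, eight colors",
        neg_prompt_textbox_value="blurry, watermark, text",
        model="black-forest-labs/FLUX.1-dev",
    )
    if path:
        print(f"Generated PNG written to {path}")
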
utils/ai_generator_diffusers_flux.py ADDED
@@ -0,0 +1,269 @@
+# utils/ai_generator_diffusers_flux.py
+import os
+import torch
+import accelerate
+import transformers
+import safetensors
+import xformers
+from diffusers import FluxPipeline
+from diffusers.utils import load_image
+# from huggingface_hub import hf_hub_download
+from PIL import Image
+from tempfile import NamedTemporaryFile
+from src.condition import Condition
+import utils.constants as constants
+from utils.image_utils import (
+    crop_and_resize_image,
+)
+from utils.version_info import (
+    versions_html,
+    get_torch_info,
+    get_diffusers_version,
+    get_transformers_version,
+    get_xformers_version
+)
+from utils.lora_details import get_trigger_words
+from utils.color_utils import detect_color_format
+# import utils.misc as misc
+from pathlib import Path
+import warnings
+warnings.filterwarnings("ignore", message=".*Torch was not compiled with flash attention.*")
+# print(torch.__version__)       # Ensure it's 2.0 or newer
+# print(torch.cuda.is_available())  # Ensure CUDA is available
+
+def generate_image_from_text(
+    text,
+    model_name="black-forest-labs/FLUX.1-dev",
+    lora_weights=None,
+    conditioned_image=None,
+    image_width=1344,
+    image_height=848,
+    guidance_scale=3.5,
+    num_inference_steps=50,
+    seed=0,
+    additional_parameters=None
+):
+    device = "cuda" if torch.cuda.is_available() else "cpu"
+    print(f"device:{device}\nmodel_name:{model_name}\n")
+    pipe = FluxPipeline.from_pretrained(
+        model_name,
+        torch_dtype=torch.bfloat16 if device == "cuda" else torch.float32
+    ).to(device)
+    pipe.enable_model_cpu_offload()
+    # Load and apply LoRA weights
+    if lora_weights:
+        for lora_weight in lora_weights:
+            lora_configs = constants.LORA_DETAILS.get(lora_weight, [])
+            if lora_configs:
+                for config in lora_configs:
+                    weight_name = config.get("weight_name")
+                    adapter_name = config.get("adapter_name")
+                    pipe.load_lora_weights(
+                        lora_weight,
+                        weight_name=weight_name,
+                        adapter_name=adapter_name,
+                        use_auth_token=constants.HF_API_TOKEN
+                    )
+            else:
+                pipe.load_lora_weights(lora_weight, use_auth_token=constants.HF_API_TOKEN)
+    generator = torch.Generator(device=device).manual_seed(seed)
+    conditions = []
+    if conditioned_image is not None:
+        conditioned_image = crop_and_resize_image(conditioned_image, 1024, 1024)
+        condition = Condition("subject", conditioned_image)
+        conditions.append(condition)
+    generate_params = {
+        "prompt": text,
+        "height": image_height,
+        "width": image_width,
+        "guidance_scale": guidance_scale,
+        "num_inference_steps": num_inference_steps,
+        "generator": generator,
+        "conditions": conditions if conditions else None
+    }
+    if additional_parameters:
+        generate_params.update(additional_parameters)
+    generate_params = {k: v for k, v in generate_params.items() if v is not None}
+    result = pipe(**generate_params)
+    image = result.images[0]
+    return image
+
+def generate_image_lowmem(
+    text,
+    neg_prompt=None,
+    model_name="black-forest-labs/FLUX.1-dev",
+    lora_weights=None,
+    conditioned_image=None,
+    image_width=1344,
+    image_height=848,
+    guidance_scale=3.5,
+    num_inference_steps=50,
+    seed=0,
+    true_cfg_scale=1.0,
+    additional_parameters=None
+):
+    device = "cuda" if torch.cuda.is_available() else "cpu"
+    print(f"device:{device}\nmodel_name:{model_name}\n")
+    print(f"\n {get_torch_info()}\n")
+    # Disable gradient calculations
+    with torch.no_grad():
+        # Initialize the pipeline inside the context manager
+        pipe = FluxPipeline.from_pretrained(
+            model_name,
+            torch_dtype=torch.bfloat16 if device == "cuda" else torch.float32  # bfloat16 on CUDA, float32 on CPU
+        ).to(device)
+        # Optionally, don't use CPU offload if not necessary
+        pipe.enable_model_cpu_offload()
+        # alternative version that may be more efficient
+        # pipe.enable_sequential_cpu_offload()
+        flash_attention_enabled = torch.backends.cuda.flash_sdp_enabled()
+        if not flash_attention_enabled:
+            # Enable xFormers memory-efficient attention (optional)
+            pipe.enable_xformers_memory_efficient_attention()
+            print("\nEnabled xFormers memory-efficient attention.\n")
+        else:
+            pipe.attn_implementation = "flash_attention_2"
+            print("\nEnabled flash_attention_2.\n")
+        pipe.enable_vae_tiling()
+        # Load LoRA weights
+        if lora_weights:
+            for lora_weight in lora_weights:
+                lora_configs = constants.LORA_DETAILS.get(lora_weight, [])
+                if lora_configs:
+                    for config in lora_configs:
+                        # Load LoRA weights with optional weight_name and adapter_name
+                        weight_name = config.get("weight_name")
+                        adapter_name = config.get("adapter_name")
+                        if weight_name and adapter_name:
+                            pipe.load_lora_weights(
+                                lora_weight,
+                                weight_name=weight_name,
+                                adapter_name=adapter_name,
+                                use_auth_token=constants.HF_API_TOKEN
+                            )
+                        else:
+                            pipe.load_lora_weights(
+                                lora_weight,
+                                use_auth_token=constants.HF_API_TOKEN
+                            )
+
+                        # Apply 'pipe' configurations if present
+                        if 'pipe' in config:
+                            pipe_config = config['pipe']
+                            for method_name, params in pipe_config.items():
+                                method = getattr(pipe, method_name, None)
+                                if method:
+                                    print(f"Applying pipe method: {method_name} with params: {params}")
+                                    method(**params)
+                                else:
+                                    print(f"Method {method_name} not found in pipe.")
+                else:
+                    pipe.load_lora_weights(lora_weight, use_auth_token=constants.HF_API_TOKEN)
+        generator = torch.Generator(device=device).manual_seed(seed)
+        conditions = []
+        if conditioned_image is not None:
+            conditioned_image = crop_and_resize_image(conditioned_image, 1024, 1024)
+            condition = Condition("subject", conditioned_image)
+            conditions.append(condition)
+        if neg_prompt is not None:
+            true_cfg_scale = 1.1  # Enable true CFG so the negative prompt takes effect
+        generate_params = {
+            "prompt": text,
+            "negative_prompt": neg_prompt,
+            "true_cfg_scale": true_cfg_scale,
+            "height": image_height,
+            "width": image_width,
+            "guidance_scale": guidance_scale,
+            "num_inference_steps": num_inference_steps,
+            "generator": generator,
+            "conditions": conditions if conditions else None
+        }
+        if additional_parameters:
+            generate_params.update(additional_parameters)
+        generate_params = {k: v for k, v in generate_params.items() if v is not None}
+        # Generate the image
+        result = pipe(**generate_params)
+        image = result.images[0]
+        # Clean up
+        del result
+        del conditions
+        del generator
+        # Delete the pipeline and clear cache
+        del pipe
+        torch.cuda.empty_cache()
+        print(torch.cuda.memory_summary(device=None, abbreviated=False))
+    return image
+
+def generate_ai_image_local(
+    map_option,
+    prompt_textbox_value,
+    neg_prompt_textbox_value,
+    model="black-forest-labs/FLUX.1-dev",
+    lora_weights=None,
+    conditioned_image=None,
+    height=512,
+    width=896,
+    num_inference_steps=50,
+    guidance_scale=3.5,
+    seed=777
+):
+    try:
+        if map_option != "Prompt":
+            prompt = constants.PROMPTS[map_option]
+            negative_prompt = constants.NEGATIVE_PROMPTS.get(map_option, "")
+        else:
+            prompt = prompt_textbox_value
+            negative_prompt = neg_prompt_textbox_value or ""
+        # full_prompt = f"{prompt} {negative_prompt}"
+        additional_parameters = {}
+        if lora_weights:
+            for lora_weight in lora_weights:
+                lora_configs = constants.LORA_DETAILS.get(lora_weight, [])
+                for config in lora_configs:
+                    if 'parameters' in config:
+                        additional_parameters.update(config['parameters'])
+                    elif 'trigger_words' in config:
+                        trigger_words = get_trigger_words(lora_weight)
+                        prompt = f"{trigger_words} {prompt}"
+        for key, value in additional_parameters.items():
+            if key in ['height', 'width', 'num_inference_steps', 'max_sequence_length']:
+                additional_parameters[key] = int(value)
+            elif key in ['guidance_scale', 'true_cfg_scale']:
+                additional_parameters[key] = float(value)
+        height = additional_parameters.get('height', height)
+        width = additional_parameters.get('width', width)
+        num_inference_steps = additional_parameters.get('num_inference_steps', num_inference_steps)
+        guidance_scale = additional_parameters.get('guidance_scale', guidance_scale)
+        print("Generating image with the following parameters:")
+        print(f"Model: {model}")
+        print(f"LoRA Weights: {lora_weights}")
+        print(f"Prompt: {prompt}")
+        print(f"Neg Prompt: {negative_prompt}")
+        print(f"Height: {height}")
+        print(f"Width: {width}")
+        print(f"Number of Inference Steps: {num_inference_steps}")
+        print(f"Guidance Scale: {guidance_scale}")
+        print(f"Seed: {seed}")
+        print(f"Additional Parameters: {additional_parameters}")
+        image = generate_image_lowmem(
+            text=prompt,
+            model_name=model,
+            neg_prompt=negative_prompt,
+            lora_weights=lora_weights,
+            conditioned_image=conditioned_image,
+            image_width=width,
+            image_height=height,
+            guidance_scale=guidance_scale,
+            num_inference_steps=num_inference_steps,
+            seed=seed,
+            additional_parameters=additional_parameters
+        )
+        with NamedTemporaryFile(delete=False, suffix=".png") as tmp:
+            image.save(tmp.name, format="PNG")
+            constants.temp_files.append(tmp.name)
+            print(f"Image saved to {tmp.name}")
+            return tmp.name
+    except Exception as e:
+        print(f"Error generating AI image: {e}")
+        return None
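
Both LoRA loaders above treat each constants.LORA_DETAILS entry as a list of small config dicts. A hypothetical entry illustrating the keys the code reads (the repo id and values are placeholders, not part of this commit); note that generate_ai_image_local() checks 'parameters' and 'trigger_words' in an if/elif, so they belong in separate items:

    LORA_DETAILS = {
        "some-user/some-flux-lora": [                      # hypothetical repo id
            {"weight_name": "lora.safetensors",            # forwarded to pipe.load_lora_weights()
             "adapter_name": "maps"},
            {"trigger_words": "hexmap style"},             # prepended to the prompt
            {"notes": "Works best around guidance_scale 3.5"},
            {"parameters": {"num_inference_steps": 28}},   # merged into the generation kwargs
            # Each key under 'pipe' names a pipeline method called with the given kwargs
            {"pipe": {"set_adapters": {"adapter_names": ["maps"],
                                       "adapter_weights": [0.8]}}},
        ]
    }
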
utils/constants.py CHANGED
@@ -15,6 +15,8 @@ os.environ['XFORMERS_FORCE_DISABLE_TRITON']= '1'
 os.environ["HF_TOKEN"] = ""
 HF_API_TOKEN = os.getenv("HF_TOKEN")
 default_lut_example_img = "./LUT/daisy.jpg"
+os.environ["HF_TOKEN"] = ""
+HF_API_TOKEN = os.getenv("HF_TOKEN")
 
 PROMPTS = {
     "Map1": "eight_color (tabletop_map built from small hexagon pieces) as ((empty black on all sides), barren alien_world_map), with light_blue_is_rivers and brown_is_mountains and red_is_volcano and [white_is_snow at the top and bottom of map] as (four_color background: light_blue, green, tan, brown), horizontal_gradient is (brown to tan to green to light_blue to blue) and vertical_gradient is (white to blue to (green, tan and red) to blue to white), (middle is dark, no_reflections, no_shadows), ((partial hexes on edges and sides are black))",
utils/lora_details.py ADDED
@@ -0,0 +1,59 @@
+# utils/lora_details.py
+
+import gradio as gr
+from utils.constants import LORA_DETAILS
+
+def upd_prompt_notes(model_textbox_value):
+    """
+    Updates the prompt_notes_label with the notes from LORA_DETAILS.
+
+    Args:
+        model_textbox_value (str): The name of the LoRA model.
+
+    Returns:
+        gr.update: Updated Gradio label component with the notes.
+    """
+    notes = ""
+    if model_textbox_value in LORA_DETAILS:
+        lora_detail_list = LORA_DETAILS[model_textbox_value]
+        for item in lora_detail_list:
+            if 'notes' in item:
+                notes = item['notes']
+                break
+    else:
+        notes = "Enter Prompt description of your image"
+    return gr.update(value=notes)
+
+def get_trigger_words(model_textbox_value):
+    """
+    Retrieves the trigger words from constants.LORA_DETAILS for the specified model.
+
+    Args:
+        model_textbox_value (str): The name of the LoRA model.
+
+    Returns:
+        str: The trigger words associated with the model, or an empty string if not found.
+    """
+    trigger_words = ""
+    if model_textbox_value in LORA_DETAILS:
+        lora_detail_list = LORA_DETAILS[model_textbox_value]
+        for item in lora_detail_list:
+            if 'trigger_words' in item:
+                trigger_words = item['trigger_words']
+                break
+    else:
+        trigger_words = ""
+    return trigger_words
+
+def upd_trigger_words(model_textbox_value):
+    """
+    Updates the trigger_words_label with the trigger words from LORA_DETAILS.
+
+    Args:
+        model_textbox_value (str): The name of the LoRA model.
+
+    Returns:
+        gr.update: Updated Gradio label component with the trigger words.
+    """
+    trigger_words = get_trigger_words(model_textbox_value)
+    return gr.update(value=trigger_words)
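
A sketch of how these helpers would typically be wired into a Gradio UI (the component names below are assumptions for illustration, not part of this commit):

    import gradio as gr
    from utils.lora_details import upd_prompt_notes, upd_trigger_words

    with gr.Blocks() as demo:
        model_textbox = gr.Textbox(label="LoRA model")          # assumed component name
        trigger_words_label = gr.Label(label="Trigger words")   # assumed component name
        prompt_notes_label = gr.Label(label="Prompt notes")     # assumed component name
        # Refresh both labels whenever the model name changes
        model_textbox.change(upd_trigger_words, inputs=model_textbox, outputs=trigger_words_label)
        model_textbox.change(upd_prompt_notes, inputs=model_textbox, outputs=prompt_notes_label)

    demo.launch()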