Spaces:

lulavc
/

Z-Image-Turbo

Running on Zero

App Files Files

lulavc committed 2 days ago

Commit

c0d50a9

verified ·

1 Parent(s): d65f758

Upload app.py with huggingface_hub

Browse files

Files changed (1) hide show

app.py +50 -13

app.py CHANGED Viewed

@@ -715,19 +715,61 @@ def generate_prompt_with_glm(image_description: str, user_request: str, style: s
     if not image_description or image_description.startswith("Please") or image_description.startswith("Error") or image_description.startswith("GLM API") or image_description.startswith("Could not"):
         return "Please analyze the image first."
-    if not user_request or not user_request.strip():
-        return "Please describe what changes you want."
     client = get_deepseek_client()
     if not client:
         return "DeepSeek API key not configured. Please add DEEPSEEK_API_KEY to space secrets."
-    style_hint = f" Apply style: {style}." if style and style != "None" else ""
     desc = image_description[:MAX_DESCRIPTION_LENGTH] if len(image_description) > MAX_DESCRIPTION_LENGTH else image_description
-    system_prompt = """You are an image prompt generator. Output ONLY the final prompt - nothing else.
-TASK: Combine the image description with the requested changes into ONE image prompt.
 GLOBAL RULE: Your output text CANNOT exceed 4000 TOKENS. This is a strict limit. Output ONLY the prompt text itself.
@@ -739,13 +781,8 @@ ABSOLUTELY FORBIDDEN - NEVER OUTPUT THESE:
 - Word counting or token counting
 - ANY text that is not the actual image prompt
-WRONG (reasoning leaked):
-"Add textures and mood: The velvet of dresses has a rich..."
-"Here is the transformed prompt: A beautiful sunset..."
-"The key elements to include are: lighting, colors..."
-CORRECT (pure prompt only):
-"A majestic ballroom scene rendered in vibrant anime style, elegant dancers in flowing silk gowns with rich velvet textures, crystal chandeliers casting warm golden light, polished marble floor with soft reflections, romantic atmosphere with floating rose petals"
 OUTPUT THE IMAGE PROMPT NOW - NOTHING ELSE:"""
@@ -755,7 +792,7 @@ OUTPUT THE IMAGE PROMPT NOW - NOTHING ELSE:"""
             max_tokens=4000,
             messages=[
                 {"role": "system", "content": system_prompt},
-                {"role": "user", "content": f"ORIGINAL IMAGE: {desc}\n\nREQUESTED CHANGES: {user_request}{style_hint}"}
             ],
         )

     if not image_description or image_description.startswith("Please") or image_description.startswith("Error") or image_description.startswith("GLM API") or image_description.startswith("Could not"):
         return "Please analyze the image first."
+    has_style = style and style != "None"
+    has_request = user_request and user_request.strip()
+    # Allow style-only generation (no user request needed if style is selected)
+    if not has_request and not has_style:
+        return "Please describe what changes you want or select a style."
     client = get_deepseek_client()
     if not client:
         return "DeepSeek API key not configured. Please add DEEPSEEK_API_KEY to space secrets."
     desc = image_description[:MAX_DESCRIPTION_LENGTH] if len(image_description) > MAX_DESCRIPTION_LENGTH else image_description
+    # Get the full style details from STYLE_SUFFIXES
+    style_details = STYLE_SUFFIXES.get(style, "").lstrip(", ").strip() if has_style else ""
+    # Build the user message based on what's provided
+    if has_style and has_request:
+        # Both style and custom request
+        user_content = f"""ORIGINAL IMAGE DESCRIPTION:
+{desc}
+STYLE TO APPLY: {style}
+STYLE DETAILS (use these painting techniques): {style_details}
+ADDITIONAL CHANGES REQUESTED: {user_request}
+Generate a prompt that transforms the image into this painting style while incorporating the requested changes."""
+    elif has_style:
+        # Style only - no custom request
+        user_content = f"""ORIGINAL IMAGE DESCRIPTION:
+{desc}
+STYLE TO APPLY: {style}
+STYLE DETAILS (use these painting techniques): {style_details}
+Generate a prompt that transforms this image into a {style}. Describe the scene as it would appear painted in this style, incorporating all the painting techniques and visual characteristics listed above."""
+    else:
+        # Custom request only - no style
+        user_content = f"""ORIGINAL IMAGE DESCRIPTION:
+{desc}
+REQUESTED CHANGES: {user_request}
+Generate a prompt that describes the transformed image."""
+    system_prompt = """You are an image prompt generator specialized in painting style transformations. Output ONLY the final prompt - nothing else.
+TASK: Generate a detailed image prompt that describes how the original image would look after transformation.
+When a PAINTING STYLE is specified (Van Gogh, Picasso, etc.):
+- You MUST incorporate ALL the painting technique details provided
+- Describe the scene AS A PAINTING with visible brushstrokes, paint textures, canvas texture
+- Include the specific color palette, brushwork style, and artistic characteristics of that painter
+- The output should clearly be a PAINTING, not a photo
 GLOBAL RULE: Your output text CANNOT exceed 4000 TOKENS. This is a strict limit. Output ONLY the prompt text itself.
 - Word counting or token counting
 - ANY text that is not the actual image prompt
+CORRECT OUTPUT EXAMPLE (Van Gogh style):
+"A post-impressionist oil painting of a ballroom scene in the style of Vincent van Gogh, elegant dancers rendered with thick impasto brushstrokes, swirling dynamic patterns in the ceiling and walls, vibrant cadmium yellows and cobalt blues in the chandeliers creating luminous glowing halos, visible canvas texture beneath bold expressive paint layers, the figures painted with short choppy directional marks, emotional intensity through saturated complementary colors"
 OUTPUT THE IMAGE PROMPT NOW - NOTHING ELSE:"""
             max_tokens=4000,
             messages=[
                 {"role": "system", "content": system_prompt},
+                {"role": "user", "content": user_content}
             ],
         )