
Z Image
Create High-Quality Images from Text Instantly
Text Description
{
"aspect_ratio": "3:4 (portrait)",
"scene_description": "A high-contrast, internet-forward cosplay-style portrait shot inside a worn, industrial concrete room, featuring a single primary subject in a sleek, matte-black, body-hugging outfit and a vivid neon-green bob wig, posed in a dominant, over-the-shoulder stance while looking down toward the camera; the image’s core vibe is gritty urban editorial meets anime/cyber cosplay, with the subject’s saturated green hair and the tight black fabric popping aggressively against a distressed gray-and-black wall and a raw concrete ceiling with exposed piping, creating a stark foreground-to-background depth where the subject fills most of the frame while the environment reads as texture-heavy, decayed architecture.",
"prompt": {
"scene_and_composition": {
"visual_hook": "Low-angle, over-the-shoulder pose that emphasizes the curve of the hips and the tight, matte-black fabric wrapping the body, contrasted by the shockingly saturated neon-green hair; the composition uses a strong ‘looking down at the viewer’ dominance cue and an exaggerated perspective that enlarges the lower torso/hip area closest to the lens.",
"camera_angle": "Extreme low-angle (near floor level) looking up, slightly off to the subject’s rear three-quarter side; perspective distortion from a wide lens makes the near hip/upper thigh appear larger, while the head and ceiling converge upward toward the top-left corner.",
"framing_and_depth": "Full-body/three-quarter body framing leaning toward a lower-torso emphasis; subject occupies most of the mid-to-foreground with minimal breathing room; moderate depth of field—subject remains sharp while background texture is readable but less attention-grabbing, aided by contrast and tonal separation rather than heavy blur.",
"medium_physics": "Crisp digital capture with mild shadow noise in darker wall areas; strong micro-contrast and texture retention on concrete; minimal motion blur (hair tips appear slightly wind-swept but not blurred); no obvious film grain, but a gritty ‘raw’ clarity consistent with phone/DSLR direct flash or hard key lighting."
},
"subject_content": {
"overall_pose": "Standing in a turned, rear three-quarter stance with torso twisted so the shoulders and face angle back toward the camera, creating an over-the-shoulder look-down posture.",
"limb_articulation": {
"left_arm": "Bent and drawn close to the torso, hand placed on/near the waist/hip line, fingers splayed with dark manicure visible.",
"right_arm": "Relaxed along the side with the long sleeve falling in soft folds; arm remains mostly behind the torso line from this angle.",
"left_leg": "Weight-bearing leg closer to camera, hip pushed outward to accentuate curvature; thigh and hip occupy the near foreground due to perspective.",
"right_leg": "Slightly back and offset, supporting the twist; leg line recedes into midground, partially obscured by the drape of the black garment."
},
"pose_dynamics": "Center of gravity sits into the hip with a deliberate, posed tension; the torso twist creates a strong S-curve, shoulders rotated toward camera while hips remain angled away; overall body language reads controlled, confident, and performative.",
"makeup_look": "Editorial-clean complexion with a smooth, slightly luminous skin finish; defined eyeliner/upper lash emphasis and a muted lip tone that keeps focus on the neon wig and the graphic black outfit. Note: makeup style is for reference only and must be merged with the input_photo’s facial features.",
"emotional_vibe": "Cool, self-possessed, slightly intimidating confidence—an ‘I’m above you’ gaze reinforced by the steep low-angle perspective and minimal smile.",
"main_object_apparel": "A matte-black, long-sleeve, high-neck, bodycon garment with clean seams and subtle stretch sheen; fabric hugs the torso and arms with visible tension lines and fold compression at the waist/hip where the hand presses; the silhouette reads sleek and tactical/editorial, functioning as the main graphic mass against the distressed setting. Logic note: if this outfit is crucial to the image’s internet-impact and overall vibe, prioritize it; if less relevant, adapt to the input_photo; if the input_photo lacks full-body info, strictly use this apparel description to complete the scene.",
"hair_and_styling": "Short, neon-green bob wig with choppy, outward-flipped ends and exaggerated, anime-like volume; strands lift slightly as if caught by airflow. Note: hair styling is reference and should auto-adapt to the input_photo when necessary.",
"interaction_with_environment": "Subject occupies the room corner area with the head and shoulders visually framed against the ceiling plane; no direct contact with walls, but the pose uses the tight space and converging concrete lines to amplify dominance and verticality."
},
"environment": {
"visual_depth_stack": {
"foreground_left_to_right": [
"1) Near-lens black fabric edge/drape forming a soft, dark shape at the bottom-left",
"2) The subject’s near hip/upper thigh area occupying the lower-right foreground, catching warmer highlights"
],
"middle_ground_left_to_right": [
"1) Subject torso and bent arm creating a large matte-black mass center-left",
"2) Subject head and neon-green hair centered upper-left, silhouetted against ceiling/wall",
"3) Distressed wall surface with peeling paint and mottled stains behind the subject, center-right"
],
"background_left_to_right": [
"1) Raw concrete ceiling plane with formwork marks and grime, upper-left",
"2) A single exposed white/gray pipe running along the ceiling, upper-left to upper-center",
"3) Corner seam where two concrete walls meet, upper-mid",
"4) Heavily weathered blackened wall with scraped patches and lighter underlayers, right side",
"5) Lower wall band with rough, flaking plaster/paint and brick-like texture hints, lower-left to lower-mid"
]
},
"lighting_atmosphere": {
"key_light": "Hard, directional light from camera-right/front-right, producing crisp highlights on the neon-green hair and strong sculpting across the black garment; the light reads as cool-to-neutral white with high intensity, similar to a direct flash or small hard source.",
"fill_ambient": "Weak ambient fill from the room, leaving deep shadows on the left side of the outfit and in wall recesses; shadow regions retain some detail but skew toward cool gray/greenish neutrality due to concrete bounce.",
"interaction": "Specular glints on hair fibers create sharp, bright edges; the matte-black fabric shows subtle stretch sheen and crease shadowing at the waist/hip; the wall’s peeling paint and concrete pores are accentuated by raking light, increasing perceived grit and tactile roughness."
}
},
"realism_rules": {
"aesthetic_style_definition": [
"Gritty industrial editorial cosplay",
"High-contrast ‘internet photo’ look with bold color pop (neon hair vs black outfit)",
"Wide-angle perspective distortion for dynamic dominance",
"Raw location texture: distressed concrete, peeling paint, exposed utilitarian elements"
],
"image_defect_tolerance": [
"Allow mild shadow noise and uneven wall staining",
"Allow slight over-sharpening/clarity and harsh highlight roll-off consistent with hard key light/flash",
"Allow minor lens distortion (wide-angle stretching near frame edges)",
"Avoid overly perfect skin smoothing; keep realistic pores/texture cues"
]
}
}
}







