Spaces:
Running on Zero
Running on Zero
File size: 1,373 Bytes
f88cfbb fb42b12 f88cfbb fb42b12 f88cfbb fb42b12 f88cfbb fb42b12 f88cfbb fb42b12 f88cfbb fb42b12 f88cfbb fb42b12 f88cfbb fb42b12 f88cfbb | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 | import torch
from diffusers import FluxImg2ImgPipeline
from PIL import Image
import sys
import spaces
# Tested with FLUX.1-schnell
@spaces.GPU
def process_image(image, mask_image, prompt="a person", model_id="black-forest-labs/FLUX.1-schnell", strength=0.75, seed=0, num_inference_steps=4):
print("Starting process_image")
if image is None:
print("Empty input image returned.")
return None
# Ensure the image is in RGB mode (this handles formats like WebP and JFIF)
if image.mode != "RGB":
image = image.convert("RGB")
# If needed, add use_auth_token="YOUR_TOKEN" in from_pretrained below.
pipe = FluxImg2ImgPipeline.from_pretrained(
model_id,
torch_dtype=torch.bfloat16
).to("cuda")
generator = torch.Generator("cuda").manual_seed(seed)
print(prompt)
output = pipe(
prompt=prompt,
image=image,
generator=generator,
strength=strength,
guidance_scale=0,
num_inference_steps=num_inference_steps,
max_sequence_length=256
)
# TODO: Add mask support if needed
return output.images[0]
if __name__ == "__main__":
# Usage: python flux1_img2img.py input-image input-mask output
image = Image.open(sys.argv[1])
mask = Image.open(sys.argv[2])
output = process_image(image, mask)
output.save(sys.argv[3])
|