# flux_kontext_helpers.py (ADUC: the Painter specialist - with callback support)
# Copyright (C) August 4, 2025 Carlos Rodrigues dos Santos

import torch
from PIL import Image, ImageOps
import gc
from diffusers import FluxKontextPipeline
import huggingface_hub
import os
import threading
import yaml
import logging
from hardware_manager import hardware_manager
logger = logging.getLogger(__name__)
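
# This module exposes a process-wide `flux_kontext_singleton` that rotates
# image generation across one FluxWorker per allocated GPU. Each worker keeps
# the FLUX.1-Kontext pipeline resident in CPU RAM, is moved to its GPU on
# demand, and is offloaded back to the CPU by a background cleanup thread on
# the next call.
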
class FluxWorker:
    """A single instance of the FluxKontext pipeline bound to one device."""

    def __init__(self, device_id='cuda:0'):
        self.cpu_device = torch.device('cpu')
        self.device = torch.device(device_id if torch.cuda.is_available() else 'cpu')
        self.pipe = None
        self._load_pipe_to_cpu()
    def _load_pipe_to_cpu(self):
        if self.pipe is None:
            logger.info(f"FLUX Worker ({self.device}): Loading model onto the CPU...")
            self.pipe = FluxKontextPipeline.from_pretrained(
                "black-forest-labs/FLUX.1-Kontext-dev", torch_dtype=torch.bfloat16
            ).to(self.cpu_device)
            logger.info(f"FLUX Worker ({self.device}): Model ready on the CPU.")
    def to_gpu(self):
        if self.device.type == 'cpu':
            return
        logger.info(f"FLUX Worker: Moving model to GPU {self.device}...")
        self.pipe.to(self.device)

    def to_cpu(self):
        if self.device.type == 'cpu':
            return
        logger.info(f"FLUX Worker: Offloading model from GPU {self.device}...")
        self.pipe.to(self.cpu_device)
        gc.collect()
        if torch.cuda.is_available():
            torch.cuda.empty_cache()
    def _create_composite_reference(self, images: list[Image.Image], target_width: int, target_height: int) -> Image.Image | None:
        """Builds a single RGB reference: one image is letterbox-fit to the
        target size; several images are resized to a common height and
        concatenated side by side."""
        if not images:
            return None
        valid_images = [img.convert("RGB") for img in images if img is not None]
        if not valid_images:
            return None
        if len(valid_images) == 1:
            if valid_images[0].size != (target_width, target_height):
                return ImageOps.fit(valid_images[0], (target_width, target_height), Image.Resampling.LANCZOS)
            return valid_images[0]
        base_height = valid_images[0].height
        resized_for_concat = []
        for img in valid_images:
            if img.height != base_height:
                aspect_ratio = img.width / img.height
                new_width = int(base_height * aspect_ratio)
                resized_for_concat.append(img.resize((new_width, base_height), Image.Resampling.LANCZOS))
            else:
                resized_for_concat.append(img)
        total_width = sum(img.width for img in resized_for_concat)
        concatenated = Image.new('RGB', (total_width, base_height))
        x_offset = 0
        for img in resized_for_concat:
            concatenated.paste(img, (x_offset, 0))
            x_offset += img.width
        # final_reference = ImageOps.fit(concatenated, (target_width, target_height), Image.Resampling.LANCZOS)
        return concatenated

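    # torch.inference_mode() disables autograd tracking for the entire call,
    # so no gradient buffers are kept alive during sampling.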
    @torch.inference_mode()
    def generate_image_internal(self, reference_images: list[Image.Image], prompt: str, target_width: int, target_height: int, seed: int, callback: callable = None):
        composite_reference = self._create_composite_reference(reference_images, target_width, target_height)
        num_steps = 12  # fixed, pre-tuned step count
        logger.info(f"\n===== [FLUX PIPELINE CALL on {self.device}] =====\n"
                    f"  - Prompt: '{prompt}'\n"
                    f"  - Resolution: {target_width}x{target_height}, Seed: {seed}, Steps: {num_steps}\n"
                    f"  - Images in composite: {len(reference_images)}\n"
                    f"==========================================")
        generated_image = self.pipe(
            image=composite_reference,
            prompt=prompt,
            guidance_scale=2.5,
            width=target_width,
            height=target_height,
            num_inference_steps=num_steps,
            generator=torch.Generator(device="cpu").manual_seed(seed),
            callback_on_step_end=callback,
            callback_on_step_end_tensor_inputs=["latents"] if callback else None
        ).images[0]
        return generated_image

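# A minimal sketch of a progress callback, following the diffusers
# `callback_on_step_end` contract: it receives the pipeline, the step index,
# the timestep, and a dict with the tensors requested via
# `callback_on_step_end_tensor_inputs`, and must return that dict. The
# function name below is illustrative, not part of this module:
#
# def log_progress(pipe, step, timestep, callback_kwargs):
#     logger.info(f"FLUX step {step}, latents: {callback_kwargs['latents'].shape}")
#     return callback_kwargs
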
class FluxPoolManager:
    """Rotates generation across FluxWorker instances, one per allocated GPU."""

    def __init__(self, device_ids):
        logger.info(f"FLUX POOL MANAGER: Creating workers for devices: {device_ids}")
        self.workers = [FluxWorker(device_id) for device_id in device_ids]
        self.current_worker_index = 0
        self.lock = threading.Lock()
        self.last_cleanup_thread = None

    def _cleanup_worker_thread(self, worker):
        logger.info(f"FLUX CLEANUP THREAD: Starting cleanup of {worker.device} in the background...")
        worker.to_cpu()
    def generate_image(self, reference_images, prompt, width, height, seed=42, callback=None):
        worker_to_use = None
        try:
            with self.lock:
                # Wait for any still-running offload before touching the pool.
                if self.last_cleanup_thread and self.last_cleanup_thread.is_alive():
                    self.last_cleanup_thread.join()
                worker_to_use = self.workers[self.current_worker_index]
                # Offload the previously used worker in the background while
                # the current one is brought onto its GPU.
                previous_worker_index = (self.current_worker_index - 1 + len(self.workers)) % len(self.workers)
                worker_to_cleanup = self.workers[previous_worker_index]
                cleanup_thread = threading.Thread(target=self._cleanup_worker_thread, args=(worker_to_cleanup,))
                cleanup_thread.start()
                self.last_cleanup_thread = cleanup_thread
                worker_to_use.to_gpu()
                self.current_worker_index = (self.current_worker_index + 1) % len(self.workers)
                logger.info(f"FLUX POOL MANAGER: Generating image on {worker_to_use.device}...")
                return worker_to_use.generate_image_internal(
                    reference_images=reference_images,
                    prompt=prompt,
                    target_width=width,
                    target_height=height,
                    seed=seed,
                    callback=callback
                )
        except Exception as e:
            logger.error(f"FLUX POOL MANAGER: Error during generation: {e}", exc_info=True)
            raise
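
# Note: everything below runs at import time, so merely importing this module
# reads config.yaml, allocates GPUs, and loads the pipeline weights to CPU
# once per allocated device.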
# --- Dynamic singleton instantiation ---
logger.info("Reading config.yaml to initialize the FluxKontext Pool Manager...")
with open("config.yaml", 'r') as f:
    config = yaml.safe_load(f)

hf_token = os.getenv('HF_TOKEN')
if hf_token:
    huggingface_hub.login(token=hf_token)

flux_gpus_required = config['specialists']['flux']['gpus_required']
flux_device_ids = hardware_manager.allocate_gpus('Flux', flux_gpus_required)
flux_kontext_singleton = FluxPoolManager(device_ids=flux_device_ids)
logger.info("Image specialist (Flux) ready.")