maxcushion / handler.py
colt12's picture
Update handler.py
5545537 verified
raw
history blame
1.33 kB
import torch
from diffusers import StableDiffusionXLPipeline, DDIMScheduler # Import your desired scheduler
import base64
from io import BytesIO
import os
class InferenceHandler:
def __init__(self):
self.device = "cuda" if torch.cuda.is_available() else "cpu"
model_name = "./" # Use the current directory
self.pipe = StableDiffusionXLPipeline.from_pretrained(
model_name,
torch_dtype=torch.float16,
use_safetensors=True,
use_auth_token=os.getenv("HUGGINGFACE_TOKEN")
).to(self.device)
# Set the scheduler programmatically
self.pipe.scheduler = DDIMScheduler.from_config(self.pipe.scheduler.config)
def __call__(self, inputs):
prompt = inputs.get("prompt", "")
if not prompt:
raise ValueError("A prompt must be provided")
negative_prompt = inputs.get("negative_prompt", "")
image = self.pipe(
prompt=prompt,
negative_prompt=negative_prompt,
num_inference_steps=30,
guidance_scale=7.5
).images[0]
buffered = BytesIO()
image.save(buffered, format="PNG")
image_base64 = base64.b64encode(buffered.getvalue()).decode("utf-8")
return {"image_base64": image_base64}
handler = InferenceHandler()