1212from diffusers .pipelines .stable_diffusion import StableDiffusionPipelineOutput
1313from diffusers .pipelines .stable_diffusion .safety_checker import StableDiffusionSafetyChecker
1414from diffusers .schedulers import DDIMScheduler , LMSDiscreteScheduler , PNDMScheduler
15- from diffusers .utils import deprecate , is_accelerate_available , logging
15+ from diffusers .utils import PIL_INTERPOLATION , deprecate , is_accelerate_available , logging
1616from transformers import CLIPFeatureExtractor , CLIPTextModel , CLIPTokenizer
1717
1818
@@ -358,7 +358,7 @@ def get_weighted_text_embeddings(
358358def preprocess_image (image ):
359359 w , h = image .size
360360 w , h = map (lambda x : x - x % 32 , (w , h )) # resize to integer multiple of 32
361- image = image .resize ((w , h ), resample = PIL . Image . LANCZOS )
361+ image = image .resize ((w , h ), resample = PIL_INTERPOLATION [ "lanczos" ] )
362362 image = np .array (image ).astype (np .float32 ) / 255.0
363363 image = image [None ].transpose (0 , 3 , 1 , 2 )
364364 image = torch .from_numpy (image )
@@ -369,7 +369,7 @@ def preprocess_mask(mask):
369369 mask = mask .convert ("L" )
370370 w , h = mask .size
371371 w , h = map (lambda x : x - x % 32 , (w , h )) # resize to integer multiple of 32
372- mask = mask .resize ((w // 8 , h // 8 ), resample = PIL . Image . NEAREST )
372+ mask = mask .resize ((w // 8 , h // 8 ), resample = PIL_INTERPOLATION [ "nearest" ] )
373373 mask = np .array (mask ).astype (np .float32 ) / 255.0
374374 mask = np .tile (mask , (4 , 1 , 1 ))
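375375 mask = mask [None ].transpose (0 , 1 , 2 , 3 ) # axes (0, 1, 2, 3) are already in this order, so this transpose is an identity permutation (no-op); only the [None] indexing adds a leading axis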
0 commit comments