@@ -156,6 +156,12 @@ def load_checkpoint_with_lora(w: ComfyWorkflow, checkpoint: CheckpointInput, mod
156
156
return model , Clip (clip , arch ), vae
157
157
158
158
159
def vae_encode(w: ComfyWorkflow, vae: Output, image: Output, tiled: bool):
    """Encode `image` with `vae` through the workflow, optionally tiled.

    Calls `w.vae_encode_tiled(vae, image)` when `tiled` is truthy and
    `w.vae_encode(vae, image)` otherwise, returning that call's result.
    """
    # Only the selected method is looked up on `w`, so the other encoder
    # attribute is never touched.
    encode = w.vae_encode_tiled if tiled else w.vae_encode
    return encode(vae, image)
163
+
164
+
159
165
def vae_decode (w : ComfyWorkflow , vae : Output , latent : Output , tiled : bool ):
160
166
if tiled :
161
167
return w .vae_decode_tiled (vae , latent )
@@ -678,7 +684,7 @@ def scale_refine_and_decode(
678
684
decoded = vae_decode (w , vae , latent , tiled_vae )
679
685
upscale = w .upscale_image (upscale_model , decoded )
680
686
upscale = w .scale_image (upscale , extent .desired )
681
- latent = w . vae_encode (vae , upscale )
687
+ latent = vae_encode (w , vae , upscale , tiled_vae )
682
688
params = _sampler_params (sampling , strength = 0.4 )
683
689
684
690
positive , negative = encode_text_prompt (w , cond , clip , regions )
@@ -874,7 +880,7 @@ def inpaint(
874
880
)
875
881
inpaint_model = model
876
882
else :
877
- latent = w . vae_encode (vae , in_image )
883
+ latent = vae_encode (w , vae , in_image , checkpoint . tiled_vae )
878
884
latent = w .set_latent_noise_mask (latent , initial_mask )
879
885
inpaint_model = model
880
886
@@ -899,7 +905,7 @@ def inpaint(
899
905
upscale = ensure_minimum_extent (w , upscale , initial_bounds .extent , 32 )
900
906
upscale = w .upscale_image (upscale_model , upscale )
901
907
upscale = w .scale_image (upscale , upscale_extent .desired )
902
- latent = w . vae_encode (vae , upscale )
908
+ latent = vae_encode (w , vae , upscale , checkpoint . tiled_vae )
903
909
latent = w .set_latent_noise_mask (latent , upscale_mask )
904
910
905
911
cond_upscale = cond .copy ()
@@ -956,7 +962,7 @@ def refine(
956
962
model = apply_regional_ip_adapter (w , model , cond .regions , extent .initial , models )
957
963
in_image = w .load_image (image )
958
964
in_image = scale_to_initial (extent , w , in_image , models )
959
- latent = w . vae_encode (vae , in_image )
965
+ latent = vae_encode (w , vae , in_image , checkpoint . tiled_vae )
960
966
latent = w .batch_latent (latent , misc .batch_count )
961
967
positive , negative = encode_text_prompt (w , cond , clip , regions )
962
968
model , positive , negative = apply_control (
@@ -1010,7 +1016,7 @@ def refine_region(
1010
1016
inpaint_patch = w .load_fooocus_inpaint (** models .fooocus_inpaint )
1011
1017
inpaint_model = w .apply_fooocus_inpaint (model , inpaint_patch , latent_inpaint )
1012
1018
else :
1013
- latent = w . vae_encode (vae , in_image )
1019
+ latent = vae_encode (w , vae , in_image , checkpoint . tiled_vae )
1014
1020
latent = w .set_latent_noise_mask (latent , initial_mask )
1015
1021
inpaint_model = model
1016
1022
@@ -1179,7 +1185,7 @@ def tiled_region(region: Region, index: int, tile_bounds: Bounds):
1179
1185
w , tile_model , positive , negative , control , no_reshape , vae , models
1180
1186
)
1181
1187
1182
- latent = w . vae_encode (vae , tile_image )
1188
+ latent = vae_encode (w , vae , tile_image , checkpoint . tiled_vae )
1183
1189
latent = w .set_latent_noise_mask (latent , tile_mask )
1184
1190
sampler = w .sampler_custom_advanced (
1185
1191
tile_model , positive , negative , latent , models .arch , ** _sampler_params (sampling )
0 commit comments