Try to free memory for both cond+uncond before inference.

This commit is contained in:
comfyanonymous
2023-11-27 14:55:40 -05:00
parent be71bb5e13
commit 13fdee6abf
2 changed files with 3 additions and 3 deletions

View File

@@ -166,8 +166,8 @@ class BaseModel(torch.nn.Module):
def memory_required(self, input_shape):
if comfy.model_management.xformers_enabled() or comfy.model_management.pytorch_attention_flash_attention():
#TODO: this needs to be tweaked
area = max(input_shape[0], 3) * input_shape[2] * input_shape[3]
return (area * comfy.model_management.dtype_size(self.get_dtype()) / 60) * (1024 * 1024)
area = input_shape[0] * input_shape[2] * input_shape[3]
return (area * comfy.model_management.dtype_size(self.get_dtype()) / 50) * (1024 * 1024)
else:
#TODO: this formula might be too aggressive since I tweaked the sub-quad and split algorithms to use less memory.
area = input_shape[0] * input_shape[2] * input_shape[3]