image-ip-composer

Running on Zero

App Files Files Community

linoyts HF Staff commited on Apr 1

Commit

4375f4e

verified ·

1 Parent(s): ca154e9

Update IP_Composer/perform_swap.py

Browse files

Files changed (1) hide show

IP_Composer/perform_swap.py +14 -41

IP_Composer/perform_swap.py CHANGED Viewed

@@ -1,64 +1,37 @@
 import torch
 import numpy as np
-from typing import List, Dict, Optional
-from PIL.Image import Image as PILImage
-from IP_Adapter import IPAdapterXL
-def compute_dataset_embeds_svd(
-    all_embeds: np.ndarray,
-    rank: int
-) -> np.ndarray:
     # Perform SVD on the combined matrix
-    _, _, v = np.linalg.svd(all_embeds, full_matrices=False)
     # Select the top `rank` singular vectors to construct the projection matrix
-    v = v[:rank]
-    projection_matrix = v.T @ v
     return projection_matrix
-def get_projected_embedding(
-    embed: np.ndarray,
-    projection_matrix: np.ndarray
-) -> np.ndarray:
-    return embed @ projection_matrix
-def get_embedding_composition(
-    embed: np.ndarray,
-    projections_data: List[Dict[str, np.ndarray]]
-) -> np.ndarray:
     combined_embeds = embed.copy()
     for proj_data in projections_data:
-        combined_embeds -= get_projected_embedding(embed, proj_data["projection_matrix"])
-        combined_embeds += get_projected_embedding(proj_data["embed"], proj_data["projection_matrix"])
     return combined_embeds
-def get_modified_images_embeds_composition(
-    embed: np.ndarray,
-    projections_data: List[Dict[str, np.ndarray]],
-    ip_model: IPAdapterXL,
-    prompt: Optional[str] = None,
-    scale: float = 1.0,
-    num_samples: int = 3,
-    seed: int = 420
-) -> List[PILImage]:
     final_embeds = get_embedding_composition(embed, projections_data)
     clip_embeds = torch.from_numpy(final_embeds)
-    images: List[PILImage] = ip_model.generate(
-    clip_image_embeds=clip_embeds,
-    prompt=prompt,
-    num_samples=num_samples,
-    num_inference_steps=50,
-    seed=seed,
-    guidance_scale=7.5,
-    scale=scale
-    )
     return images

 import torch
 import numpy as np
+def compute_dataset_embeds_svd(all_embeds, rank):
     # Perform SVD on the combined matrix
+    u, s, vh = np.linalg.svd(all_embeds, full_matrices=False)
     # Select the top `rank` singular vectors to construct the projection matrix
+    vh = vh[:rank]  # Top `rank` right singular vectors
+    projection_matrix = vh.T @ vh  # Shape: (feature_dim, feature_dim)
     return projection_matrix
+def get_embedding_composition(embed, projections_data):
+    # Initialize the combined embedding with the input embed
     combined_embeds = embed.copy()
     for proj_data in projections_data:
+        # Add the combined projection to the result
+        combined_embeds -= embed @ proj_data["projection_matrix"]
+        combined_embeds += proj_data["embed"] @ proj_data["projection_matrix"]
     return combined_embeds
+def get_modified_images_embeds_composition(embed, projections_data, ip_model, prompt=None, scale=1.0, num_samples=3, seed=420, num_inference_steps=50):
     final_embeds = get_embedding_composition(embed, projections_data)
     clip_embeds = torch.from_numpy(final_embeds)
+    images = ip_model.generate(clip_image_embeds=clip_embeds, prompt=prompt, num_samples=num_samples, num_inference_steps=num_inference_steps, seed=seed, guidance_scale=7.5, scale=scale)
     return images