add some transform
Browse files
- app.py +11 -0
- images/ColorWheel001 BW.jpg +0 -0
- images/ColorWheel001.jpg +0 -0
- images/ColorWheel002 BW.jpg +0 -0
- images/ColorWheel002.jpg +0 -0
app.py
CHANGED
@@ -45,6 +45,7 @@ def image_to_embedding(input_im):
|
|
45 |
image = inp.tile(1, 1, 1, 1).to(device=device, dtype=dtype)
|
46 |
image_embeddings = pipe.image_encoder(image).image_embeds
|
47 |
image_embeddings = image_embeddings[0]
|
|
|
48 |
image_embeddings_np = image_embeddings.cpu().detach().numpy()
|
49 |
return image_embeddings_np
|
50 |
|
@@ -57,6 +58,7 @@ def prompt_to_embedding(prompt):
|
|
57 |
# image = inputs.pixel_values
|
58 |
with torch.no_grad():
|
59 |
prompt_embededdings = model.get_text_features(prompt_tokens.to(device))
|
|
|
60 |
prompt_embededdings = prompt_embededdings[0].cpu().detach().numpy()
|
61 |
return prompt_embededdings
|
62 |
|
@@ -155,7 +157,10 @@ def update_average_embeddings(embedding_base64s_state, embedding_powers):
|
|
155 |
# embeddings_b64 = embedding_to_base64(embeddings)
|
156 |
# return gr.Text.update(embeddings_b64)
|
157 |
return gr.Text.update('')
|
|
|
|
|
158 |
final_embedding = final_embedding / num_embeddings
|
|
|
159 |
embeddings_b64 = embedding_to_base64(final_embedding)
|
160 |
return embeddings_b64
|
161 |
|
@@ -255,6 +260,12 @@ tabbed_examples = {
|
|
255 |
"540554": "540554.jpeg",
|
256 |
"Prompt 4": "two trains are coming down the tracks, a steam engine and a modern train.",
|
257 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
258 |
"Portraits": {
|
259 |
"Snoop": "Snoop Dogg.jpg",
|
260 |
"Snoop Prompt": "Snoop Dogg",
|
|
|
45 |
image = inp.tile(1, 1, 1, 1).to(device=device, dtype=dtype)
|
46 |
image_embeddings = pipe.image_encoder(image).image_embeds
|
47 |
image_embeddings = image_embeddings[0]
|
48 |
+
# image_embeddings /= image_embeddings.norm(dim=-1, keepdim=True)
|
49 |
image_embeddings_np = image_embeddings.cpu().detach().numpy()
|
50 |
return image_embeddings_np
|
51 |
|
|
|
58 |
# image = inputs.pixel_values
|
59 |
with torch.no_grad():
|
60 |
prompt_embededdings = model.get_text_features(prompt_tokens.to(device))
|
61 |
+
# prompt_embededdings /= prompt_embededdings.norm(dim=-1, keepdim=True)
|
62 |
prompt_embededdings = prompt_embededdings[0].cpu().detach().numpy()
|
63 |
return prompt_embededdings
|
64 |
|
|
|
157 |
# embeddings_b64 = embedding_to_base64(embeddings)
|
158 |
# return gr.Text.update(embeddings_b64)
|
159 |
return gr.Text.update('')
|
160 |
+
|
161 |
+
# TODO toggle this to support average or sum
|
162 |
final_embedding = final_embedding / num_embeddings
|
163 |
+
|
164 |
embeddings_b64 = embedding_to_base64(final_embedding)
|
165 |
return embeddings_b64
|
166 |
|
|
|
260 |
"540554": "540554.jpeg",
|
261 |
"Prompt 4": "two trains are coming down the tracks, a steam engine and a modern train.",
|
262 |
},
|
263 |
+
"Transforms": {
|
264 |
+
"ColorWheel001": "ColorWheel001.jpg",
|
265 |
+
"ColorWheel001 BW": "ColorWheel001 BW.jpg",
|
266 |
+
"ColorWheel002": "ColorWheel002.jpg",
|
267 |
+
"ColorWheel002 BW": "ColorWheel002 BW.jpg",
|
268 |
+
},
|
269 |
"Portraits": {
|
270 |
"Snoop": "Snoop Dogg.jpg",
|
271 |
"Snoop Prompt": "Snoop Dogg",
|
images/ColorWheel001 BW.jpg
ADDED
images/ColorWheel001.jpg
ADDED
images/ColorWheel002 BW.jpg
ADDED
images/ColorWheel002.jpg
ADDED