add some basic read me
Browse files
app.py
CHANGED
@@ -225,6 +225,15 @@ examples = [
|
|
225 |
|
226 |
|
227 |
with gr.Blocks() as demo:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
228 |
with gr.Row():
|
229 |
for i in range(max_tabs):
|
230 |
with gr.Tab(f"Input {i+1}"):
|
@@ -246,7 +255,8 @@ with gr.Blocks() as demo:
|
|
246 |
with gr.Row():
|
247 |
with gr.Accordion(f"Avergage embeddings in base 64", open=False):
|
248 |
average_embedding_base64 = gr.Textbox(show_label=False)
|
249 |
-
|
|
|
250 |
with gr.Row():
|
251 |
with gr.Column(scale=1, min_width=200):
|
252 |
scale = gr.Slider(0, 25, value=3, step=1, label="Guidance scale")
|
@@ -256,8 +266,6 @@ with gr.Blocks() as demo:
|
|
256 |
steps = gr.Slider(5, 50, value=25, step=5, label="Steps")
|
257 |
with gr.Column(scale=1, min_width=200):
|
258 |
seed = gr.Number(None, label="Seed", precision=0)
|
259 |
-
with gr.Row():
|
260 |
-
submit = gr.Button("Submit")
|
261 |
with gr.Row():
|
262 |
output = gr.Gallery(label="Generated variations")
|
263 |
|
@@ -277,6 +285,26 @@ with gr.Blocks() as demo:
|
|
277 |
submit.click(main, inputs= [average_embedding_base64, scale, n_samples, steps, seed], outputs=output)
|
278 |
output.style(grid=2)
|
279 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
280 |
|
281 |
|
282 |
if __name__ == "__main__":
|
|
|
225 |
|
226 |
|
227 |
with gr.Blocks() as demo:
|
228 |
+
with gr.Row():
|
229 |
+
gr.Markdown(
|
230 |
+
"""# Soho-Clip
|
231 |
+
|
232 |
+
A tool for exploring CLIP embedding spaces.
|
233 |
+
My interest is in using CLIP for image/video understanding (see [CLIP_visual-spatial-reasoning](https://github.com/Sohojoe/CLIP_visual-spatial-reasoning)).
|
234 |
+
|
235 |
+
Try it out by uploading a few images and/or adding text prompts, then generate images from the average of their embeddings.
|
236 |
+
""")
|
237 |
with gr.Row():
|
238 |
for i in range(max_tabs):
|
239 |
with gr.Tab(f"Input {i+1}"):
|
|
|
255 |
with gr.Row():
|
256 |
with gr.Accordion(f"Avergage embeddings in base 64", open=False):
|
257 |
average_embedding_base64 = gr.Textbox(show_label=False)
|
258 |
+
with gr.Row():
|
259 |
+
submit = gr.Button("Generate images")
|
260 |
with gr.Row():
|
261 |
with gr.Column(scale=1, min_width=200):
|
262 |
scale = gr.Slider(0, 25, value=3, step=1, label="Guidance scale")
|
|
|
266 |
steps = gr.Slider(5, 50, value=25, step=5, label="Steps")
|
267 |
with gr.Column(scale=1, min_width=200):
|
268 |
seed = gr.Number(None, label="Seed", precision=0)
|
|
|
|
|
269 |
with gr.Row():
|
270 |
output = gr.Gallery(label="Generated variations")
|
271 |
|
|
|
285 |
submit.click(main, inputs= [average_embedding_base64, scale, n_samples, steps, seed], outputs=output)
|
286 |
output.style(grid=2)
|
287 |
|
288 |
+
with gr.Row():
|
289 |
+
gr.Markdown(
|
290 |
+
"""### Initial Features
|
291 |
+
|
292 |
+
- Combine up to 10 images and/or text inputs to create an average embedding space.
|
293 |
+
- View embedding spaces as graph
|
294 |
+
- Generate a new image based on the average embedding space
|
295 |
+
|
296 |
+
### Known limitations
|
297 |
+
|
298 |
+
- Text input is a little off (requires fine tuning and I'm having issues with that at the moment)
|
299 |
+
- It can only generate a single image at a time
|
300 |
+
- Not easy to use the sample images
|
301 |
+
|
302 |
+
### Acknowledgements
|
303 |
+
|
304 |
+
- This work builds heavily on Justin Pinkney's Experiments in Image Variation (see https://www.justinpinkney.com/image-variation-experiments). Please credit them if you use this work.
|
305 |
+
|
306 |
+
""")
|
307 |
+
|
308 |
|
309 |
|
310 |
if __name__ == "__main__":
|