Josh Cox committed
Commit 158667b
1 Parent(s): 78e3b34
.python-version ADDED
@@ -0,0 +1 @@
+ artist
__pycache__/artist_lib.cpython-311.pyc ADDED
Binary file (11.1 kB).
 
app.py CHANGED
@@ -1,7 +1,161 @@
- def greet(name):
-     return "Hello " + name + "!!"
- iface = gr.Interface(fn=greet, inputs="text", outputs="text")
- iface.launch()
+ import argparse
+ import binascii
+ import glob
+ import os
+ import os.path
+ import numpy as np
+ import matplotlib.pyplot as plt
+ import random
+ import sys
+ import tempfile
+ import time
+ import torch
+ from PIL import Image
+ from diffusers import StableDiffusionPipeline
+
 import gradio as gr

+ import artist_lib
+
+ from dotenv import load_dotenv
+ load_dotenv()
+ SERVER_NAME = os.getenv("SERVER_NAME")
+
+ drawdemo = gr.Interface(
+     fn=artist_lib.draw,
+     inputs=[
+         gr.Text(label="Drawing description text", value="hindu mandala neon orange and blue"),
+         gr.Dropdown(label='Model', choices=["stable-diffusion-2", "stable-diffusion-2-1", "stable-diffusion-v1-5"], value="stable-diffusion-v1-5"),
+         gr.Checkbox(label="Force-New"),
+     ],
+     outputs="image",
+     examples=[
+         ['van gogh dogs playing poker', "stable-diffusion-v1-5", False],
+         ['picasso the scream', "stable-diffusion-v1-5", False],
+         ['dali american gothic', "stable-diffusion-v1-5", False],
+         ['matisse mona lisa', "stable-diffusion-v1-5", False],
+         ['maxfield parrish angel in lake', "stable-diffusion-v1-5", False],
+         ['peter max dogs playing poker', "stable-diffusion-v1-5", False],
+         ['hindu mandala copper and patina green', "stable-diffusion-v1-5", False],
+         ['hindu mandala fruit salad', "stable-diffusion-v1-5", False],
+         ['hindu mandala neon green black and purple', "stable-diffusion-v1-5", False],
+         ['astronaut riding a horse on mars', "stable-diffusion-v1-5", False]
+     ],
+ )
+
+ AudioDemo = gr.Interface(
+     fn=artist_lib.generate_tone,
+     inputs=[
+         gr.Dropdown(artist_lib.notes, type="index"),
+         gr.Slider(4, 6, step=1),
+         gr.Textbox(value="1", label="Duration in seconds")
+     ],
+     outputs="audio"
+ )
+
+ imageClassifierDemo = gr.Interface(
+     fn=artist_lib.imageClassifier,
+     inputs="image",
+     outputs="text"
+ )
+
+ audioGeneratorDemo = gr.Interface(
+     fn=artist_lib.audioGenerator,
+     inputs="text",
+     outputs="audio",
+     examples=[
+         ['balsamic beats'],
+         ['dance the night away']
+     ]
+ )
+
+ nameMyPetDemo = gr.Interface(
+     fn=artist_lib.nameMyPet,
+     inputs=[
+         gr.Text(label="What type of animal is your pet?", value="green cat")
+     ],
+     outputs="text",
+     examples=[
+         ['dog'],
+         ['pink dolphin'],
+         ['elevated elephant'],
+         ['green monkey'],
+         ['bionic beaver'],
+         ['felonious fish'],
+         ['delinquent dog'],
+         ['dragging donkey'],
+         ['stinky skunk'],
+         ['pink unicorn'],
+         ['naughty narwhal'],
+         ['blue cat']
+     ],
+ )
+
+ blog_writer_demo = gr.Interface(
+     fn=artist_lib.write_blog,
+     inputs=[
+         gr.Text(label="Blog description text", value="machine learning can be used to track chickens"),
+         gr.Dropdown(label='Model', choices=["gpt-neo-1.3B", "gpt-neo-2.7B"], value="gpt-neo-1.3B"),
+         gr.Number(label='Minimum word count', value=50, precision=0),
+         gr.Number(label='Maximum word count', value=50, precision=0),
+         gr.Checkbox(label="Force-New"),
+     ],
+     outputs="text",
+     examples=[
+         ['machine learning can be used to track chickens', "gpt-neo-1.3B", 50, 50, False],
+         ['music and machine learning', "gpt-neo-2.7B", 50, 50, False]
+     ],
+ )
+
+ generateAudioDemo = gr.Interface(
+     fn=artist_lib.generate_spectrogram_audio_and_loop,
+     title="Audio Diffusion",
+     description="Generate audio using Hugging Face diffusers. \
+ The models without 'latent' or 'ddim' give better results but take about \
+ 20 minutes without a GPU. For a GPU, you can run this app on \
+ [colab](https://colab.research.google.com/github/teticio/audio-diffusion/blob/master/notebooks/gradio_app.ipynb).",
+     inputs=[
+         gr.Dropdown(label="Model",
+                     choices=[
+                         "teticio/audio-diffusion-256",
+                         "teticio/audio-diffusion-breaks-256",
+                         "teticio/audio-diffusion-instrumental-hiphop-256",
+                         "teticio/audio-diffusion-ddim-256",
+                         "teticio/latent-audio-diffusion-256",
+                         "teticio/latent-audio-diffusion-ddim-256"
+                     ],
+                     value="teticio/latent-audio-diffusion-ddim-256")
+     ],
+     outputs=[
+         gr.Image(label="Mel spectrogram", image_mode="L"),
+         gr.Audio(label="Audio"),
+         gr.Audio(label="Loop"),
+     ],
+     allow_flagging="never")
+
+ with gr.Blocks() as gallerydemo:
+     with gr.Column(variant="panel"):
+         with gr.Row(variant="compact"):
+             text = gr.Textbox(
+                 label="Enter your prompt",
+                 show_label=False,
+                 max_lines=1,
+                 placeholder="Enter your prompt"
+             )
+             btn = gr.Button("Generate image")
+
+         gallery = gr.Gallery(
+             label="Generated images", show_label=False, elem_id="gallery"
+         )
+
+     btn.click(artist_lib.fake_gan, None, gallery)
+
+ # artist = gr.TabbedInterface([drawdemo, blog_writer_demo, gallerydemo], ["Draw", "Bloggr", "Gallery"])
+ # artist = gr.TabbedInterface([drawdemo, blog_writer_demo, imageClassifierDemo, generateAudioDemo, audioGeneratorDemo, AudioDemo, nameMyPetDemo], ["Draw", "Bloggr", "imageClassifier", "generateAudio", "audioGenerator", "AudioDemo", "nameMyPet"])
+ artist = gr.TabbedInterface([drawdemo, imageClassifierDemo, generateAudioDemo, nameMyPetDemo, blog_writer_demo], ["Draw", "imageClassifier", "generateAudio", "nameMyPet", "Bloggr"])

+ artist.queue(
+     max_size=4
+ )
+ artist.launch()
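
Aside: app.py reads SERVER_NAME via python-dotenv but never passes it anywhere; a plausible intent is Gradio's server_name launch parameter. A minimal sketch of that assumed wiring, not part of the commit:

# Hypothetical: bind to the env-configured host if one is set.
if SERVER_NAME:
    artist.launch(server_name=SERVER_NAME)
else:
    artist.launch()
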
artist_lib.py ADDED
@@ -0,0 +1,179 @@
+ import argparse
+ import binascii
+ import glob
+ import openai
+ import os
+ import os.path
+ import numpy as np
+ import matplotlib.pyplot as plt
+ import random
+ import sys
+ import tempfile
+ import time
+ import torch
+ import gradio as gr  # needed for gr.Error in draw() and write_blog()
+ from PIL import Image
+ from IPython.display import Audio
+ from diffusers import StableDiffusionPipeline
+ from diffusers import DiffusionPipeline
+ from transformers import pipeline
+ from transformers import ViTFeatureExtractor, ViTForImageClassification
+ from audiodiffusion import AudioDiffusion
+ import requests
+
+ notes = ["C", "C#", "D", "D#", "E", "F", "F#", "G", "G#", "A", "A#", "B"]
+
+ def fake_gan():
+     # Stand-in "GAN" for the gallery demo: returns stock photos with test labels.
+     images = [
+         (random.choice(
+             [
+                 "https://images.unsplash.com/photo-1507003211169-0a1dd7228f2d?ixlib=rb-1.2.1&ixid=MnwxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8&auto=format&fit=crop&w=387&q=80",
+                 "https://images.unsplash.com/photo-1554151228-14d9def656e4?ixlib=rb-1.2.1&ixid=MnwxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8&auto=format&fit=crop&w=386&q=80",
+                 "https://images.unsplash.com/photo-1542909168-82c3e7fdca5c?ixlib=rb-1.2.1&ixid=MnwxMjA3fDB8MHxzZWFyY2h8MXx8aHVtYW4lMjBmYWNlfGVufDB8fDB8fA%3D%3D&w=1000&q=80",
+                 "https://images.unsplash.com/photo-1546456073-92b9f0a8d413?ixlib=rb-1.2.1&ixid=MnwxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8&auto=format&fit=crop&w=387&q=80",
+                 "https://images.unsplash.com/photo-1601412436009-d964bd02edbc?ixlib=rb-1.2.1&ixid=MnwxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8&auto=format&fit=crop&w=464&q=80",
+             ]
+         ), f"label {i}" if i != 0 else "label" * 50)
+         for i in range(3)
+     ]
+     return images
+
+ def imageClassifier(inputImage):
+     image = inputImage
+
+     feature_extractor = ViTFeatureExtractor.from_pretrained('google/vit-base-patch16-224')
+     model = ViTForImageClassification.from_pretrained('google/vit-base-patch16-224')
+
+     inputs = feature_extractor(images=image, return_tensors="pt")
+     outputs = model(**inputs)
+     logits = outputs.logits
+     # model predicts one of the 1000 ImageNet classes
+     predicted_class_idx = logits.argmax(-1).item()
+     # return a single string: the Interface has one "text" output, so a
+     # tuple would be misread as two return values
+     return "Predicted class: " + model.config.id2label[predicted_class_idx]
+
+ def audioGenerator(inputText):
+     # inputText is currently unused; the pipeline generates unconditionally
+     device = "cuda" if torch.cuda.is_available() else "cpu"
+     pipe = DiffusionPipeline.from_pretrained("teticio/audio-diffusion-256").to(device)
+     output = pipe()
+     print("sample rate is ", pipe.mel.get_sample_rate())
+     # Gradio's audio output expects (sample_rate, numpy array), not an
+     # IPython.display.Audio widget
+     sr = int(pipe.mel.get_sample_rate())
+     return sr, output.audios[0]
+
+ def generate_spectrogram_audio_and_loop(model_id):
+     audio_diffusion = AudioDiffusion(model_id=model_id)
+     image, (sample_rate, audio) = audio_diffusion.generate_spectrogram_and_audio()
+     loop = AudioDiffusion.loop_it(audio, sample_rate)
+     if loop is None:
+         loop = audio
+     return image, (sample_rate, audio), (sample_rate, loop)
+
+ def generate_tone(note, octave, duration):
+     sr = 48000
+     # Equal temperament: each semitone is a factor of 2**(1/12) from A4 = 440 Hz.
+     a4_freq, tones_from_a4 = 440, 12 * (octave - 4) + (note - 9)
+     frequency = a4_freq * 2 ** (tones_from_a4 / 12)
+     duration = int(duration)  # arrives as a string from the Textbox input
+     audio = np.linspace(0, duration, duration * sr)
+     audio = (20000 * np.sin(audio * (2 * np.pi * frequency))).astype(np.int16)
+     return sr, audio
+
+ def draw(inp, this_model, force_new):
+     drawing = inp
+     if this_model == "stable-diffusion-2":
+         this_model_addr = "stabilityai/stable-diffusion-2"
+         images_dir = 'images2/'
+     elif this_model == "stable-diffusion-2-1":
+         this_model_addr = "stabilityai/stable-diffusion-2-1"
+         images_dir = 'images2-1/'
+     elif this_model == "stable-diffusion-v1-5":
+         this_model_addr = "runwayml/stable-diffusion-v1-5"
+         images_dir = 'images/'
+     else:
+         raise gr.Error("Unknown Model!")
+     mkdir_if_not_exist(images_dir)
+     drawing_filename = images_dir + drawing.replace(' ', '_') + '.png'
+     if os.path.exists(drawing_filename):
+         if force_new:
+             # archive the cached image under a timestamped name and regenerate
+             new_drawing_filename = images_dir + drawing.replace(' ', '_') + '.' + str(time.time()) + '.png'
+             os.replace(drawing_filename, new_drawing_filename)
+         else:
+             print("found drawing ", drawing_filename)
+             return Image.open(drawing_filename)
+     print("generating drawing '", drawing, "'", drawing_filename)
+     pipe = StableDiffusionPipeline.from_pretrained(this_model_addr, torch_dtype=torch.float16)
+     pipe.enable_attention_slicing()
+     pipe = pipe.to("cuda")  # float16 weights require a CUDA device here
+     image = pipe(drawing).images[0]
+     image.save(drawing_filename)
+     return image
+
+ def write_blog(inp, this_model, min_length, max_length, force_new):
+     blog_post_name = inp
+     if this_model == "gpt-neo-1.3B":
+         this_model_addr = "EleutherAI/gpt-neo-1.3B"
+         text_dir = 'text1.3/'
+     elif this_model == "gpt-neo-2.7B":
+         this_model_addr = "EleutherAI/gpt-neo-2.7B"
+         text_dir = 'text2.7/'
+     else:
+         raise gr.Error("Unknown Model!")
+     mkdir_if_not_exist(text_dir)
+     target_filename = text_dir + blog_post_name.replace(' ', '_') + '.txt'
+     if os.path.exists(target_filename):
+         if force_new:
+             new_target_filename = text_dir + blog_post_name.replace(' ', '_') + '.' + str(time.time()) + '.txt'
+             os.replace(target_filename, new_target_filename)
+         else:
+             print("found blog post ", target_filename)
+             with open(target_filename, 'r') as file:
+                 return file.read()
+     print("generating blog '", blog_post_name, "'", target_filename)
+     device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
+     generator = pipeline('text-generation', model=this_model_addr, device=device, torch_dtype=torch.float16)
+     # note: TextGenerationPipeline has no enable_attention_slicing(); that is a diffusers API
+     res = generator(blog_post_name, min_length=min_length, max_length=max_length, do_sample=True, temperature=0.7)
+     blog_post_text = res[0]['generated_text']
+     with open(target_filename, 'w') as file:
+         file.write(blog_post_text)
+     return blog_post_text
+
+ def nameMyPet(inp):
+     animal = inp
+     # openai>=1.0 (as pinned in requirements.txt) replaced the module-level
+     # Completion API with a client object
+     client = openai.OpenAI()
+     response = client.completions.create(
+         model="text-davinci-003",
+         prompt=generate_prompt(animal),
+         temperature=0.6,
+     )
+     return response.choices[0].text
+
+ def mkdir_if_not_exist(path):
+     if os.path.exists(path):
+         return 0
+     else:
+         os.mkdir(path)
+
+ def generate_prompt(animal):
+     return """Suggest three names for an animal that is a superhero.
+
+ Animal: Cat
+ Names: Captain Sharpclaw, Agent Fluffball, The Incredible Feline
+ Animal: Dog
+ Names: Ruff the Protector, Wonder Canine, Sir Barks-a-Lot
+ Animal: {}
+ Names:""".format(
+         animal.capitalize()
+     )
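
Most of artist_lib.py needs model downloads, but generate_tone is pure NumPy, so a smoke test is cheap (assuming the module's heavy imports resolve; index 9 of notes is "A", so this synthesizes one second of A4 = 440 Hz):

import artist_lib

# note=9 ("A"), octave=4 -> 440 Hz at a 48 kHz sample rate
sr, audio = artist_lib.generate_tone(note=9, octave=4, duration=1)
assert sr == 48000 and audio.shape == (48000,)
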
images/van_gogh_dogs_playing_poker.png ADDED
requirements.txt ADDED
@@ -0,0 +1,13 @@
+ accelerate==0.27.2
+ audiodiffusion==1.5.6
+ diffusers==0.26.3
+ gradio==4.19.1
+ ipython==8.21.0
+ matplotlib==3.8.3
+ numpy==1.26.4
+ openai==1.12.0
+ Pillow==10.2.0
+ python-dotenv==1.0.1
+ Requests==2.31.0
+ torch==2.2.1
+ transformers==4.38.1
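
These pins install on CPU-only machines, but draw() loads float16 weights and calls pipe.to("cuda"), so the Space effectively assumes a GPU. A pre-flight check along these lines (a sketch, not part of the commit) surfaces that early:

import torch

# draw() and write_blog() both expect CUDA for reasonable performance.
print("CUDA available:", torch.cuda.is_available())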