# Hugging Face Space file (page chrome from scrape): author "nostalgebraist",
# last commit "typo" (53273e5).
import time
import uuid
from datetime import datetime, timezone

import numpy as np
import streamlit as st
from PIL import Image
# One-time per-session initialization: tag this browser session with a
# unique id for log correlation and start its generation counter at zero.
if 'session_id' not in st.session_state:
    st.session_state.session_id = str(uuid.uuid4())
    st.session_state.n_gen = 0
# --- constants ---

# Hugging Face repo holding the model tarball, and the local dir it unpacks to.
HF_REPO_NAME_DIFFUSION = 'nostalgebraist/nostalgebraist-autoresponder-diffusion'
model_path_diffusion = 'nostalgebraist-autoresponder-diffusion'

# Timestep respacing strings for the base (sres1) and upsampling (sres2)
# models; the commented values are the heavier settings used elsewhere.
timestep_respacing_sres1 = '20'  # '90,60,60,20,20'
timestep_respacing_sres2 = '20'  # '250'

# Default keyword arguments for pipeline.sample(); handler() copies and
# overrides these per request.
DIFFUSION_DEFAULTS = {
    'batch_size': 1,
    'n_samples': 1,
    'clf_free_guidance': True,
    'clf_free_guidance_sres': False,
    'guidance_scale': 1,
    'guidance_scale_sres': 0,
    'yield_intermediates': True,
}
@st.experimental_singleton
def setup():
    """Install the improved-diffusion fork, fetch the model weights, and
    build the two-stage (base + super-res) sampling pipeline.

    Cached with st.experimental_singleton so the heavy setup runs once per
    process and the pipeline object is shared across reruns/sessions.
    """
    import os, subprocess, sys

    # Clone and install the diffusion code on first run only.
    if not os.path.exists('improved_diffusion'):
        os.system("git clone https://github.com/nostalgebraist/improved-diffusion.git")
        os.system("cd improved-diffusion && git fetch origin nbar-space && git checkout nbar-space && pip install -e .")
        os.system("pip install tokenizers x-transformers==0.22.0 axial-positional-embedding")
        os.system("pip install einops==0.3.2")
    sys.path.append("improved-diffusion")

    import improved_diffusion.pipeline
    from transformer_utils.util.tfm_utils import get_local_path_from_huggingface_cdn

    # Download and unpack the model tarball from the HF CDN on first run only.
    if not os.path.exists(model_path_diffusion):
        tar_name = 'model.tar'
        tar_path = get_local_path_from_huggingface_cdn(
            HF_REPO_NAME_DIFFUSION, tar_name
        )
        subprocess.run(f"tar -xf {tar_path} && rm {tar_path}", shell=True)

    # Checkpoint/config pairs for the base (sres1) and super-res (sres2) stages.
    ckpt_sres1 = os.path.join(model_path_diffusion, "sres1.pt")
    cfg_sres1 = os.path.join(model_path_diffusion, "config_sres1.json")
    ckpt_sres2 = os.path.join(model_path_diffusion, "sres2.pt")
    cfg_sres2 = os.path.join(model_path_diffusion, "config_sres2.json")

    base_model = improved_diffusion.pipeline.SamplingModel.from_config(
        checkpoint_path=ckpt_sres1,
        config_path=cfg_sres1,
        timestep_respacing=timestep_respacing_sres1
    )
    sres_model = improved_diffusion.pipeline.SamplingModel.from_config(
        checkpoint_path=ckpt_sres2,
        config_path=cfg_sres2,
        timestep_respacing=timestep_respacing_sres2
    )
    return improved_diffusion.pipeline.SamplingPipeline(base_model, sres_model)
def now_str():
    """Return the current UTC time as 'YYYY-MM-DD HH-MM-SS' (filename-safe; no colons).

    Uses a timezone-aware datetime instead of the deprecated, naive
    datetime.utcnow(); the formatted output is identical.
    """
    return datetime.now(timezone.utc).strftime('%Y-%m-%d %H-%M-%S')
def log(msg, st_state):
    """Print a timestamped log line tagged with the session id and generation count.

    `st_state` is the Streamlit session state for the current session; either
    field may be absent before initialization, in which case None is printed.
    """
    session_id = st_state.session_id if 'session_id' in st_state else None
    # FIX: read n_gen from the st_state parameter; previously this read the
    # global st.session_state, defeating the point of passing st_state in.
    n_gen = st_state.n_gen if 'n_gen' in st_state else None
    print(f"{now_str()} {session_id} ({n_gen}th gen):\n\t{msg}\n")
def handler(text, ts1, ts2, gs1, st_state):
    """Configure the pipeline and yield intermediate frames for one generation.

    text: prompt text (truncated to 380 chars to match the UI limit).
    ts1/ts2: step counts for the base / upsampling models.
    gs1: guidance scale for the base model.
    st_state: Streamlit session state, passed through to log().
    Returns the generator from pipeline.sample() (yield_intermediates=True).
    """
    pipeline = setup()

    data = {'text': text[:380], 'guidance_scale': gs1}
    args = dict(DIFFUSION_DEFAULTS)  # copy so the module-level defaults aren't mutated
    args.update(data)

    # BUG FIX: ts1 was previously logged with ts2's value ({'ts1': ts2, ...}).
    log_data = {'ts1': ts1, 'ts2': ts2}
    log_data.update(args)
    log(repr(log_data), st_state)

    pipeline.base_model.set_timestep_respacing(str(ts1))
    pipeline.super_res_model.set_timestep_respacing(str(ts2))

    return pipeline.sample(**args)
FRESH = True

st.title('nostalgebraist-autoresponder image generation demo')

st.write("#### For a **much faster experience**, try the [Colab notebook](https://colab.research.google.com/drive/17BOTYmLv4fdurr8y5dcaGKy8JVY_A62a?usp=sharing) instead!")
st.write("A demo of the image models used in the tumblr bot [nostalgebraist-autoresponder](https://nostalgebraist-autoresponder.tumblr.com/).\n\nBy [nostalgebraist](https://nostalgebraist.tumblr.com/)")
st.write('##### What is this thing? How does it work?')
st.write("See [this post](https://nostalgebraist.tumblr.com/post/672300992964050944/franks-image-generation-model-explained) for an explanation.")

st.header('Prompt')

# Pre-fill the prompt box with a canned example when the button is pressed.
button_dril = st.button('Fill @dril tweet example text')
if FRESH and button_dril:
    st.session_state.fill_value = 'wint\nFollowing\n@dril\nthe wise man bowed his head solemnly and\nspoke: "theres actually zero difference\nbetween good & bad things. you imbecile.\nyou fucking moron'

# Persist the fill value across reruns; default to empty on first visit.
if 'fill_value' in st.session_state:
    fill_value = st.session_state.fill_value
else:
    fill_value = ""
    st.session_state.fill_value = fill_value

text = st.text_area('Enter your text here (or leave blank for a textless image)', max_chars=380, height=230,
                    value=fill_value)

st.header('Settings')

# Typo fix in the user-facing text below: "unles" -> "unless".
st.write("The bot uses 250 base steps and 250 upsampling steps, with custom spacing (not available here) for the base part.\n\nSince this demo doesn't have a GPU, you'll probably want to use fewer than 250 steps unless you have a lot of patience.")

help_ts1 = "How long to run the base model. Larger values make the image more realistic / better. Smaller values are faster."
help_ts2 = "How long to run the upsampling model. Larger values sometimes make the big image crisper and more detailed. Smaller values are faster."
help_gs1 = "Guidance scale. Larger values make the image more likely to contain the text you wrote. If this is zero, the first part will be faster."

ts1 = st.slider('Steps (base)', min_value=5, max_value=500, value=50, step=5, help=help_ts1)
ts2 = st.slider('Steps (upsampling)', min_value=5, max_value=500, value=50, step=5, help=help_ts2)
gs1 = st.select_slider('Guidance scale (base)', [0.5*i for i in range(9)], value=1.0, help=help_gs1)

button_go = st.button('Generate')
button_stop = st.button('Stop')

# Typo fix in the user-facing text below: "100 signal" -> "100% signal".
st.write("During generation, the two images show different ways of looking at the same process.\n- The left image starts with 100% noise and gradually turns into 100% signal.\n- The right image shows the model's current 'guess' about what the left image will look like when all the noise has been removed.")

# Placeholders that the generation loop fills in as frames arrive.
generating_marker = st.empty()
low_res = st.empty()
high_res = st.empty()
if button_go:
    st.session_state.n_gen = st.session_state.n_gen + 1

    # Announce the run and echo the prompt while frames stream in.
    with generating_marker.container():
        st.write('**Generating...**')
        st.write('**Prompt:**')
        st.write(repr(text))

    # Per-stage frame counters and inter-frame timings, keyed by stage.
    frame_counts = {'low': 0, 'high': 0}
    frame_times = {'low': [], 'high': []}
    last_tick = time.time()

    for s, xs in handler(text, ts1, ts2, gs1, st.session_state):
        s = Image.fromarray(s[0])
        xs = Image.fromarray(xs[0])

        tick = time.time()
        delta, last_tick = tick - last_tick, tick

        # Frames 256 px wide come from the upsampling stage; others from the base stage.
        key = 'high' if s.size[0] == 256 else 'low'
        frame_counts[key] += 1
        frame_times[key].append(delta)
        if key == 'high':
            target, total, prefix = high_res, ts2, "Part 2 of 2 (upsampling)"
        else:
            target, total, prefix = low_res, ts1, "Part 1 of 2 (base model)"
        count = frame_counts[key]
        rate = sum(frame_times[key]) / len(frame_times[key])

        with target.container():
            st.image([s, xs])
            st.write(f'{prefix} | {count:02d} / {total} frames | {rate:.2f} seconds/frame')

        if button_stop:
            log('gen stopped', st.session_state)
            break

    with generating_marker.container():
        log('gen complete', st.session_state)
        st.write('')