# Story Book Generator — Streamlit app
# (Source: Hugging Face Space upload by KK44, commit dbde418, "Update app.py")
import streamlit as st
import json
import torch
from diffusers import DiffusionPipeline
from openai import OpenAI
from PIL import Image,ImageDraw,ImageFont
from dotenv import load_dotenv
# Page header for the Streamlit UI.
st.title("Story Book Generator")
# SDXL base checkpoint plus a kids-book style LoRA layered on top of it.
model_name = "stabilityai/stable-diffusion-xl-base-1.0"
lora_path = "StorybookRedmondV2-KidsBook-KidsRedmAF.safetensors"
# Load OPENAI_API_KEY (and any other secrets) from a local .env file
# BEFORE constructing the client, which reads the key from the environment.
load_dotenv()
client = OpenAI()
def wrap_text(text, font, max_width):
    """Greedily word-wrap *text* so each rendered line fits in *max_width* px.

    Width is measured with ``font.getmask(...).getbbox()[2]`` (pixel width of
    the rendered line).  Returns a list of stripped line strings; empty input
    yields an empty list.
    """
    lines = []
    words = text.split()
    while words:
        line = ""
        # Keep appending words while the candidate line still fits.
        while words and font.getmask(line + words[0]).getbbox()[2] <= max_width:
            line += (words.pop(0) + ' ')
        if not line:
            # Bug fix: a single word wider than max_width previously left
            # `words` untouched and appended "" forever (infinite loop).
            # Emit the oversized word on its own line instead.
            line = words.pop(0)
        lines.append(line.strip())
    return lines
def text_on_image(image, text, font_path=None, position='top', font_size=50,
                  bg_color=(0, 0, 0, 128), line_spacing=20, padding_top=20,
                  padding_bottom=20, padding_sides=0):
    """Draw word-wrapped, centered text over *image* on a background band.

    Args:
        image: PIL image to draw on (mutated in place and also returned).
        text: caption text; wrapped to the image width via ``wrap_text``.
        font_path: optional TrueType font file; falls back to PIL's default.
        position: 'top' places the band at the top, anything else at the bottom.
        bg_color: RGBA fill of the band behind the text.
        line_spacing / padding_*: layout spacing in pixels.

    Returns:
        The same image object with the caption drawn on it.
    """
    draw = ImageDraw.Draw(image)
    font = None
    if font_path:
        try:
            font = ImageFont.truetype(font_path, font_size)
        except IOError:
            print("Default font will be used as specified font was not found.")
    if font is None:
        # Bug fix: the original left `font` unbound (NameError) when
        # font_path was None — no exception fired, so the except-branch
        # fallback never ran.  Always fall back to the default font here.
        font = ImageFont.load_default()
    max_width = image.width - 2 * padding_sides
    wrapped_text = wrap_text(text, font, max_width)
    # Per-line rendered heights; bbox[3] is the bottom of the rendered mask.
    text_heights = [font.getmask(line).getbbox()[3] for line in wrapped_text]
    text_block_height = sum(text_heights) + line_spacing * (len(wrapped_text) - 1)
    # y is the top of the first text line for either placement.
    y = padding_top if position == 'top' else image.height - text_block_height - padding_bottom
    bg_rectangle_top = y - padding_top
    bg_rectangle_bottom = y + text_block_height + padding_bottom
    bg_rectangle_left = padding_sides
    bg_rectangle_right = image.width - padding_sides
    if position == "top":
        draw.rectangle([(bg_rectangle_left, bg_rectangle_top),
                        (bg_rectangle_right, bg_rectangle_bottom)],
                       fill=bg_color)
    else:
        # Bottom band extends to the very bottom edge of the image.
        draw.rectangle([(bg_rectangle_left, image.height - text_block_height - padding_top - padding_bottom),
                        (bg_rectangle_right, image.height)], fill=bg_color)
    # Draw each line horizontally centered; y was not changed above, so no
    # reset is needed (the original recomputed the identical value here).
    for line in wrapped_text:
        line_width = font.getmask(line).getbbox()[2]
        x = (image.width - line_width) / 2
        draw.text((x, y), line, fill=(255, 255, 255), font=font)
        y += font.getmask(line).getbbox()[3] + line_spacing
    return image
@st.cache_resource()
def load_image_model(model_name, model_path_refiner=None, lora_path=None,
                     torch_dtype=torch.float16, variant='fp16', use_safetensors=True):
    """Load the SDXL base pipeline (optionally with LoRA weights) plus an
    optional refiner pipeline.

    Cached by Streamlit so the heavyweight models are loaded once per process.

    Returns:
        (base, refiner) — refiner is None when no refiner path is given.
    """
    base = DiffusionPipeline.from_pretrained(
        model_name,
        torch_dtype=torch_dtype,
        variant=variant,
        use_safetensors=use_safetensors,
    )
    if lora_path:
        base.load_lora_weights(lora_path)
    refiner = None
    if model_path_refiner:
        # The refiner shares the base model's second text encoder and VAE.
        refiner = DiffusionPipeline.from_pretrained(
            model_path_refiner,
            text_encoder_2=base.text_encoder_2,
            vae=base.vae,
            use_safetensors=use_safetensors,
            variant=variant,
        )
    return base, refiner
def generate_image(base, prompt, refiner=None, num_inference_steps=20, guidance_scale=15,
                   high_noise_frac=0.8, output_type='latent', verbose=False, temperature=0.7):
    """Run the base pipeline for *prompt*, optionally finishing with a refiner.

    Without a refiner the base pipeline produces the final image directly.
    With one, the base stops at *high_noise_frac* of the denoising schedule and
    hands its latents to the refiner for the remaining steps.

    Returns:
        A single generated image.
    """
    if not refiner:
        # Single-stage path: base pipeline produces the finished image.
        return base(prompt=prompt, num_inference_steps=num_inference_steps,
                    guidance_scale=guidance_scale).images[0]
    # Two-stage path: base emits latents up to the hand-off fraction…
    latents = base(prompt=prompt, num_inference_steps=num_inference_steps,
                   denoising_end=high_noise_frac, output_type=output_type,
                   verbose=verbose, guidance_scale=guidance_scale,
                   temperature=temperature).images
    # …and the refiner completes the remaining denoising steps.
    return refiner(prompt=prompt, num_inference_steps=num_inference_steps,
                   denoising_end=high_noise_frac, image=latents,
                   verbose=verbose).images[0]
def generate_description(client, prompt, text_area_placeholder=None,
                         model='gpt-3.5-turbo', temperature=0.7,
                         max_tokens=3000, top_p=1, frequency_penalty=0,
                         presence_penalty=0, stream=True, html=False):
    """Stream a chat completion for *prompt* and return the full text.

    As chunks arrive, the accumulated text is mirrored into
    *text_area_placeholder* (a Streamlit placeholder) — as markdown when
    *html* is True, otherwise as a text area whose height is grown to fit
    the text so far ("auto scroll").

    NOTE(review): the chunk loop assumes a streaming response; calling with
    stream=False would iterate a non-stream object — confirm callers always
    stream (the app does).

    Returns:
        The complete generated text as one string.
    """
    response = client.chat.completions.create(
        model=model,
        messages=[{'role': 'user', 'content': prompt}],
        temperature=temperature,
        max_tokens=max_tokens,
        top_p=top_p,
        frequency_penalty=frequency_penalty,
        presence_penalty=presence_penalty,
        stream=stream,
    )
    complete_response = []
    for chunk in response:
        # Some chunks (role markers, final chunk) carry no content.
        if chunk.choices[0].delta.content:
            complete_response.append(chunk.choices[0].delta.content)
            result_string = ''.join(complete_response)
            # Auto scroll: estimate rendered height so the text area keeps
            # growing with the text instead of showing an inner scrollbar.
            avg_chars_per_line = 80
            height_per_line = 20
            lines = result_string.count('\n') + 1 + len(result_string) // avg_chars_per_line
            total_height = lines * height_per_line
            if text_area_placeholder:
                if html:
                    text_area_placeholder.markdown(result_string, unsafe_allow_html=True)
                else:
                    text_area_placeholder.text_area("Generated Text",
                                                    value=result_string,
                                                    height=total_height)
    # Bug fix: the original joined `complete_response` twice in a row;
    # one final join is enough.
    result_string = ''.join(complete_response)
    words = len(result_string.split())
    st.text(f"Total Words Generated: {words}")
    return result_string
# --- Streamlit app body ---
user_input = st.text_input("Enter your prompt",
                           value='A princess that saved the village from dragon')
# No refiner is used in this app (second argument None).
base, refiner = load_image_model(model_name, None, lora_path)

# Trigger phrase that activates the kids-book LoRA style.
lora_trigger = 'Kids Book'
# Bug fix: the original concatenated prompt and trigger with no separator
# ("...dragonKids Book"); separate them so the trigger stays a distinct phrase.
prompt_user = user_input + ', ' + lora_trigger

# Instruction template asking the model for strict JSON: five page lines plus
# five standalone image descriptions (the image model has no cross-page memory).
prompt_input = """
write a 5 page story for children with a character.
- Each page will have a single line.
- For each page give a description that will be used to generate an image for that page. Don't use names in the description of the image.
- Describe the appearance of the character in each image description, as the AI does not have a memory.
- Don't use words like the same character because the ai model does not have any memory.
- Use white skin color for the character and mention it in each image description.
- follow the output format as follows:
{
"page1":"page 1 line",
"page2":"page 2 line",
"page3":"page 3 line",
"page4":"page 4 line",
"page5":"page 5 line",
"page1_image_description":"page1 image description",
"page2_image_description":"page2 image description",
"page3_image_description":"page3 image description",
"page4_image_description":"page4 image description",
"page5_image_description":"page5 image description",
}
Here are the details:
"""
prompt = prompt_input + prompt_user

# (Removed dead code: an unused hard-coded page-1 sentence and an unused
# Image.open('img.jpeg') that crashed at import time when the file was absent.)

if st.button("Generate Story"):
    with st.spinner("Generating Story Book..."):
        story = generate_description(client, prompt)
        # NOTE(review): assumes the model returned strict JSON exactly as
        # instructed; any surrounding prose will raise json.JSONDecodeError.
        story_json = json.loads(story)
        for i in range(1, 6):
            page_key = f'page{i}'
            st.text(f"Page {i}")
            st.write(story_json[page_key])
            st.write(story_json[page_key + '_image_description'])
            page_prompt = story_json[page_key + '_image_description']
            page_text = story_json[page_key]
            generated_img = generate_image(base, page_prompt)
            # Bug fix: the keyword was misspelled `font_page`, which raised
            # TypeError on every run; the parameter is `font_path`.
            image = text_on_image(generated_img, page_text,
                                  font_path="one_trick_pony_tt.ttf",
                                  position='top')
            # `channels` only applies to ndarray input; PIL images render as-is.
            st.image(image, channels='BGR', use_column_width=True)