|
|
|
|
|
|
|
import os |
|
from PIL import Image, ImageDraw, ImageFont |
|
import nltk |
|
from nltk.corpus import brown |
|
import random |
|
|
|
IMAGES_PER_FONT = 50 |
|
|
|
|
|
nltk.download('brown') |
|
|
|
|
|
font_dirs = ['/System/Library/Fonts/', '/System/Library/Fonts/Supplemental/'] |
|
output_dir = './font_images' |
|
os.makedirs(output_dir, exist_ok=True) |
|
|
|
all_brown_words = sorted(set(brown.words(categories='news'))) |
|
|
|
|
|
FONT_ALLOWLIST = ["Arial", "Avenir", "Courier", "Helvetica", "Georgia", "Tahoma", "Times New Roman", "Verdana"] |
|
|
|
def wrap_text(text, line_length=10): |
|
"""Wraps the provided text every 'line_length' words.""" |
|
words = text.split() |
|
return "\n".join([" ".join(words[i:i+line_length]) for i in range(0, len(words), line_length)]) |
|
|
|
def random_prose_text(words, num_words=200): |
|
"""Returns a random selection of 'num_words' words from the provided list of words.""" |
|
random_words = " ".join(random.sample(words, num_words)) |
|
return wrap_text(random_words) |
|
|
|
def random_code_text(base_code, num_lines=15): |
|
"""Returns a random selection of 'num_lines' lines from the provided code.""" |
|
lines = base_code.split("\n") |
|
return "\n".join(random.sample(lines, min(num_lines, len(lines)))) |
|
|
|
for font_dir in font_dirs: |
|
for font_file in os.listdir(font_dir): |
|
if font_file.endswith('.ttf') or font_file.endswith('.ttc'): |
|
font_path = os.path.join(font_dir, font_file) |
|
font_name = font_file.split('.')[0] |
|
if font_name not in FONT_ALLOWLIST: |
|
continue |
|
|
|
print(font_path, font_name) |
|
|
|
if font_file.endswith('.ttc'): |
|
|
|
font = ImageFont.truetype(font_path, random.choice(range(32, 128)), index=0) |
|
else: |
|
|
|
font_size = random.choice(range(32, 128)) |
|
font = ImageFont.truetype(font_path, font_size) |
|
|
|
|
|
j = 0 |
|
for i in range(IMAGES_PER_FONT): |
|
prose_sample = random_prose_text(all_brown_words) |
|
|
|
for text in [prose_sample]: |
|
img = Image.new('RGB', (800, 400), color="white") |
|
draw = ImageDraw.Draw(img) |
|
|
|
|
|
offset_x = random.randint(-20, 10) |
|
offset_y = random.randint(-20, 10) |
|
draw.text((offset_x, offset_y), text, fill="black", font=font) |
|
|
|
j += 1 |
|
output_file = os.path.join(output_dir, f"{font_name}_{j}.png") |
|
img.save(output_file) |
|
|