* feat: add meme-generation skill * Reduce meme skill prompt cost with tighter selection rules * feat(skill): overhaul meme-generation into real image generator Move from skills/creative/ to optional-skills/creative/ (niche skill, not needed by default). Replace prompt-only meme concept brainstormer with actual meme image generation: - Python script using Pillow to overlay text on template images - 10 curated templates with hand-tuned text positioning - Dynamic access to ~100 popular imgflip templates via public API - Custom image mode (--image): use AI-generated or any image as base - Two text modes: overlay (white+outline on image) or bars (black bars) - Vision verification workflow: use vision_analyze to QA the result - Auto-scaling font with pixel-accurate word wrapping - Template search via --search - No API keys required Original skill concept by adanaleycio (PR #1771), overhauled with image generation and custom image support. --------- Co-authored-by: adanaleycio <atillababa767@gmail.com>
472 lines
16 KiB
Python
472 lines
16 KiB
Python
#!/usr/bin/env python3
|
|
"""Generate a meme image by overlaying text on a template.
|
|
|
|
Usage:
|
|
python generate_meme.py <template_id_or_name> <output_path> <text1> [text2] [text3] [text4]
|
|
|
|
Example:
|
|
python generate_meme.py drake /tmp/meme.png "Writing tests" "Shipping to prod and hoping"
|
|
python generate_meme.py "Disaster Girl" /tmp/meme.png "Top text" "Bottom text"
|
|
python generate_meme.py --list # show curated templates
|
|
python generate_meme.py --search "distracted" # search all imgflip templates
|
|
|
|
Templates with custom text positioning are in templates.json (10 curated).
|
|
Any of the ~100 popular imgflip templates can also be used by name or ID —
|
|
unknown templates get smart default text positioning based on their box_count.
|
|
"""
|
|
|
|
import json
|
|
import os
|
|
import sys
|
|
import textwrap
|
|
from io import BytesIO
|
|
from pathlib import Path
|
|
|
|
try:
|
|
import requests as _requests
|
|
except ImportError:
|
|
_requests = None
|
|
|
|
from PIL import Image, ImageDraw, ImageFont
|
|
|
|
SCRIPT_DIR = Path(__file__).parent
|
|
TEMPLATES_FILE = SCRIPT_DIR / "templates.json"
|
|
CACHE_DIR = SCRIPT_DIR / ".cache"
|
|
IMGFLIP_API = "https://api.imgflip.com/get_memes"
|
|
IMGFLIP_CACHE_FILE = CACHE_DIR / "imgflip_memes.json"
|
|
IMGFLIP_CACHE_MAX_AGE = 86400 # 24 hours
|
|
|
|
|
|
def _fetch_url(url: str, timeout: int = 15) -> bytes:
|
|
"""Fetch URL content, using requests if available, else urllib."""
|
|
if _requests is not None:
|
|
resp = _requests.get(url, timeout=timeout)
|
|
resp.raise_for_status()
|
|
return resp.content
|
|
import urllib.request
|
|
return urllib.request.urlopen(url, timeout=timeout).read()
|
|
|
|
|
|
def load_curated_templates() -> dict:
|
|
"""Load templates with hand-tuned text field positions."""
|
|
with open(TEMPLATES_FILE) as f:
|
|
return json.load(f)
|
|
|
|
|
|
def _default_fields(box_count: int) -> list:
|
|
"""Generate sensible default text field positions for unknown templates."""
|
|
if box_count <= 0:
|
|
box_count = 2
|
|
if box_count == 1:
|
|
return [{"name": "text", "x_pct": 0.5, "y_pct": 0.5, "w_pct": 0.90, "align": "center"}]
|
|
if box_count == 2:
|
|
return [
|
|
{"name": "top", "x_pct": 0.5, "y_pct": 0.08, "w_pct": 0.95, "align": "center"},
|
|
{"name": "bottom", "x_pct": 0.5, "y_pct": 0.92, "w_pct": 0.95, "align": "center"},
|
|
]
|
|
# 3+: evenly space vertically
|
|
fields = []
|
|
for i in range(box_count):
|
|
y = 0.08 + (0.84 * i / (box_count - 1)) if box_count > 1 else 0.5
|
|
fields.append({
|
|
"name": f"text{i+1}",
|
|
"x_pct": 0.5,
|
|
"y_pct": round(y, 2),
|
|
"w_pct": 0.90,
|
|
"align": "center",
|
|
})
|
|
return fields
|
|
|
|
|
|
def fetch_imgflip_templates() -> list:
|
|
"""Fetch popular meme templates from imgflip API. Cached for 24h."""
|
|
import time
|
|
|
|
CACHE_DIR.mkdir(exist_ok=True)
|
|
# Check cache
|
|
if IMGFLIP_CACHE_FILE.exists():
|
|
age = time.time() - IMGFLIP_CACHE_FILE.stat().st_mtime
|
|
if age < IMGFLIP_CACHE_MAX_AGE:
|
|
with open(IMGFLIP_CACHE_FILE) as f:
|
|
return json.load(f)
|
|
|
|
try:
|
|
data = json.loads(_fetch_url(IMGFLIP_API))
|
|
memes = data.get("data", {}).get("memes", [])
|
|
with open(IMGFLIP_CACHE_FILE, "w") as f:
|
|
json.dump(memes, f)
|
|
return memes
|
|
except Exception as e:
|
|
# If fetch fails and we have stale cache, use it
|
|
if IMGFLIP_CACHE_FILE.exists():
|
|
with open(IMGFLIP_CACHE_FILE) as f:
|
|
return json.load(f)
|
|
print(f"Warning: could not fetch imgflip templates: {e}", file=sys.stderr)
|
|
return []
|
|
|
|
|
|
def _slugify(name: str) -> str:
|
|
"""Convert a template name to a slug for matching."""
|
|
return name.lower().replace(" ", "-").replace("'", "").replace("\"", "")
|
|
|
|
|
|
def resolve_template(identifier: str) -> dict:
|
|
"""Resolve a template by curated ID, imgflip name, or imgflip ID.
|
|
|
|
Returns dict with: name, url, fields, source.
|
|
"""
|
|
curated = load_curated_templates()
|
|
|
|
# 1. Exact curated ID match
|
|
if identifier in curated:
|
|
tmpl = curated[identifier]
|
|
return {**tmpl, "source": "curated"}
|
|
|
|
# 2. Slugified curated match
|
|
slug = _slugify(identifier)
|
|
for tid, tmpl in curated.items():
|
|
if _slugify(tmpl["name"]) == slug or tid == slug:
|
|
return {**tmpl, "source": "curated"}
|
|
|
|
# 3. Search imgflip templates
|
|
imgflip_memes = fetch_imgflip_templates()
|
|
slug_lower = slug.lower()
|
|
id_lower = identifier.strip()
|
|
|
|
for meme in imgflip_memes:
|
|
meme_slug = _slugify(meme["name"])
|
|
# Check curated first for this imgflip template (custom positioning)
|
|
for tid, ctmpl in curated.items():
|
|
if _slugify(ctmpl["name"]) == meme_slug:
|
|
if meme_slug == slug_lower or meme["id"] == id_lower:
|
|
return {**ctmpl, "source": "curated"}
|
|
|
|
if meme_slug == slug_lower or meme["id"] == id_lower or slug_lower in meme_slug:
|
|
return {
|
|
"name": meme["name"],
|
|
"url": meme["url"],
|
|
"fields": _default_fields(meme.get("box_count", 2)),
|
|
"source": "imgflip",
|
|
}
|
|
|
|
return None
|
|
|
|
|
|
def get_template_image(url: str) -> Image.Image:
|
|
"""Download a template image, caching it locally."""
|
|
CACHE_DIR.mkdir(exist_ok=True)
|
|
# Use URL hash as cache key
|
|
cache_name = url.split("/")[-1]
|
|
cache_path = CACHE_DIR / cache_name
|
|
|
|
# Always cache as PNG to avoid JPEG/RGBA conflicts
|
|
cache_path = cache_path.with_suffix(".png")
|
|
|
|
if cache_path.exists():
|
|
return Image.open(cache_path).convert("RGBA")
|
|
|
|
data = _fetch_url(url)
|
|
img = Image.open(BytesIO(data)).convert("RGBA")
|
|
img.save(cache_path, "PNG")
|
|
return img
|
|
|
|
|
|
def find_font(size: int) -> ImageFont.FreeTypeFont:
|
|
"""Find a bold font for meme text. Tries Impact, then falls back."""
|
|
candidates = [
|
|
"/usr/share/fonts/truetype/msttcorefonts/Impact.ttf",
|
|
"/usr/share/fonts/truetype/liberation/LiberationSans-Bold.ttf",
|
|
"/usr/share/fonts/liberation-sans/LiberationSans-Bold.ttf",
|
|
"/usr/share/fonts/truetype/dejavu/DejaVuSans-Bold.ttf",
|
|
"/usr/share/fonts/dejavu-sans/DejaVuSans-Bold.ttf",
|
|
"/System/Library/Fonts/Helvetica.ttc",
|
|
"/System/Library/Fonts/SFCompact.ttf",
|
|
]
|
|
for path in candidates:
|
|
if os.path.exists(path):
|
|
try:
|
|
return ImageFont.truetype(path, size)
|
|
except (OSError, IOError):
|
|
continue
|
|
# Last resort: Pillow default
|
|
try:
|
|
return ImageFont.truetype("DejaVuSans-Bold", size)
|
|
except (OSError, IOError):
|
|
return ImageFont.load_default()
|
|
|
|
|
|
def _wrap_text(text: str, font: ImageFont.FreeTypeFont, max_width: int) -> str:
|
|
"""Word-wrap text to fit within max_width pixels. Never breaks mid-word."""
|
|
words = text.split()
|
|
if not words:
|
|
return text
|
|
lines = []
|
|
current_line = words[0]
|
|
for word in words[1:]:
|
|
test_line = current_line + " " + word
|
|
if font.getlength(test_line) <= max_width:
|
|
current_line = test_line
|
|
else:
|
|
lines.append(current_line)
|
|
current_line = word
|
|
lines.append(current_line)
|
|
return "\n".join(lines)
|
|
|
|
|
|
def draw_outlined_text(
|
|
draw: ImageDraw.ImageDraw,
|
|
text: str,
|
|
x: int,
|
|
y: int,
|
|
font_size: int,
|
|
max_width: int,
|
|
align: str = "center",
|
|
):
|
|
"""Draw white text with black outline, auto-scaled to fit max_width."""
|
|
# Auto-scale: reduce font size until text fits reasonably
|
|
size = font_size
|
|
while size > 12:
|
|
font = find_font(size)
|
|
wrapped = _wrap_text(text, font, max_width)
|
|
bbox = draw.multiline_textbbox((0, 0), wrapped, font=font, align=align)
|
|
text_w = bbox[2] - bbox[0]
|
|
line_count = wrapped.count("\n") + 1
|
|
# Accept if width fits and not too many lines
|
|
if text_w <= max_width * 1.05 and line_count <= 4:
|
|
break
|
|
size -= 2
|
|
else:
|
|
font = find_font(size)
|
|
wrapped = _wrap_text(text, font, max_width)
|
|
|
|
# Measure total text block
|
|
bbox = draw.multiline_textbbox((0, 0), wrapped, font=font, align=align)
|
|
text_w = bbox[2] - bbox[0]
|
|
text_h = bbox[3] - bbox[1]
|
|
|
|
# Center horizontally at x, vertically at y
|
|
tx = x - text_w // 2
|
|
ty = y - text_h // 2
|
|
|
|
# Draw outline (black border)
|
|
outline_range = max(2, font.size // 18)
|
|
for dx in range(-outline_range, outline_range + 1):
|
|
for dy in range(-outline_range, outline_range + 1):
|
|
if dx == 0 and dy == 0:
|
|
continue
|
|
draw.multiline_text(
|
|
(tx + dx, ty + dy), wrapped, font=font, fill="black", align=align
|
|
)
|
|
# Draw main text (white)
|
|
draw.multiline_text((tx, ty), wrapped, font=font, fill="white", align=align)
|
|
|
|
|
|
def _overlay_on_image(img: Image.Image, texts: list, fields: list) -> Image.Image:
|
|
"""Overlay meme text directly on an image using field positions."""
|
|
draw = ImageDraw.Draw(img)
|
|
w, h = img.size
|
|
base_font_size = max(16, min(w, h) // 12)
|
|
|
|
for i, field in enumerate(fields):
|
|
if i >= len(texts):
|
|
break
|
|
text = texts[i].strip()
|
|
if not text:
|
|
continue
|
|
fx = int(field["x_pct"] * w)
|
|
fy = int(field["y_pct"] * h)
|
|
fw = int(field["w_pct"] * w)
|
|
draw_outlined_text(draw, text, fx, fy, base_font_size, fw, field.get("align", "center"))
|
|
return img
|
|
|
|
|
|
def _add_bars(img: Image.Image, texts: list) -> Image.Image:
|
|
"""Add black bars with white text above/below the image.
|
|
|
|
Distributes texts across bars: first text on top bar, last text on
|
|
bottom bar, any middle texts overlaid on the image center.
|
|
"""
|
|
w, h = img.size
|
|
bar_font_size = max(20, w // 16)
|
|
font = find_font(bar_font_size)
|
|
padding = bar_font_size // 2
|
|
|
|
top_text = texts[0].strip() if texts else ""
|
|
bottom_text = texts[-1].strip() if len(texts) > 1 else ""
|
|
middle_texts = [t.strip() for t in texts[1:-1]] if len(texts) > 2 else []
|
|
|
|
def _measure_bar(text: str) -> int:
|
|
if not text:
|
|
return 0
|
|
wrapped = _wrap_text(text, font, int(w * 0.92))
|
|
bbox = ImageDraw.Draw(Image.new("RGB", (1, 1))).multiline_textbbox(
|
|
(0, 0), wrapped, font=font, align="center"
|
|
)
|
|
return (bbox[3] - bbox[1]) + padding * 2
|
|
|
|
top_h = _measure_bar(top_text)
|
|
bottom_h = _measure_bar(bottom_text)
|
|
new_h = h + top_h + bottom_h
|
|
|
|
canvas = Image.new("RGB", (w, new_h), (0, 0, 0))
|
|
canvas.paste(img.convert("RGB"), (0, top_h))
|
|
draw = ImageDraw.Draw(canvas)
|
|
|
|
if top_text:
|
|
wrapped = _wrap_text(top_text, font, int(w * 0.92))
|
|
bbox = draw.multiline_textbbox((0, 0), wrapped, font=font, align="center")
|
|
tw = bbox[2] - bbox[0]
|
|
th = bbox[3] - bbox[1]
|
|
tx = (w - tw) // 2
|
|
ty = (top_h - th) // 2
|
|
draw.multiline_text((tx, ty), wrapped, font=font, fill="white", align="center")
|
|
|
|
if bottom_text:
|
|
wrapped = _wrap_text(bottom_text, font, int(w * 0.92))
|
|
bbox = draw.multiline_textbbox((0, 0), wrapped, font=font, align="center")
|
|
tw = bbox[2] - bbox[0]
|
|
th = bbox[3] - bbox[1]
|
|
tx = (w - tw) // 2
|
|
ty = top_h + h + (bottom_h - th) // 2
|
|
draw.multiline_text((tx, ty), wrapped, font=font, fill="white", align="center")
|
|
|
|
# Overlay any middle texts centered on the image
|
|
if middle_texts:
|
|
mid_fields = _default_fields(len(middle_texts))
|
|
# Shift y positions to account for top bar offset
|
|
for field in mid_fields:
|
|
field["y_pct"] = (top_h + field["y_pct"] * h) / new_h
|
|
field["w_pct"] = 0.90
|
|
_overlay_on_image(canvas, middle_texts, mid_fields)
|
|
|
|
return canvas
|
|
|
|
|
|
def generate_meme(template_id: str, texts: list[str], output_path: str) -> str:
|
|
"""Generate a meme from a template and save it. Returns the path."""
|
|
tmpl = resolve_template(template_id)
|
|
|
|
if tmpl is None:
|
|
print(f"Unknown template: {template_id}", file=sys.stderr)
|
|
print("Use --list to see curated templates or --search to find imgflip templates.", file=sys.stderr)
|
|
sys.exit(1)
|
|
|
|
fields = tmpl["fields"]
|
|
print(f"Using template: {tmpl['name']} ({tmpl['source']}, {len(fields)} fields)", file=sys.stderr)
|
|
|
|
img = get_template_image(tmpl["url"])
|
|
img = _overlay_on_image(img, texts, fields)
|
|
|
|
output = Path(output_path)
|
|
if output.suffix.lower() in (".jpg", ".jpeg"):
|
|
img = img.convert("RGB")
|
|
img.save(str(output), quality=95)
|
|
return str(output)
|
|
|
|
|
|
def generate_from_image(
|
|
image_path: str, texts: list[str], output_path: str, use_bars: bool = False
|
|
) -> str:
|
|
"""Generate a meme from a custom image (e.g. AI-generated). Returns the path."""
|
|
img = Image.open(image_path).convert("RGBA")
|
|
print(f"Custom image: {img.size[0]}x{img.size[1]}, {len(texts)} text(s), mode={'bars' if use_bars else 'overlay'}", file=sys.stderr)
|
|
|
|
if use_bars:
|
|
result = _add_bars(img, texts)
|
|
else:
|
|
fields = _default_fields(len(texts))
|
|
result = _overlay_on_image(img, texts, fields)
|
|
|
|
output = Path(output_path)
|
|
if output.suffix.lower() in (".jpg", ".jpeg"):
|
|
result = result.convert("RGB")
|
|
result.save(str(output), quality=95)
|
|
return str(output)
|
|
|
|
|
|
def list_templates():
|
|
"""Print curated templates with custom positioning."""
|
|
templates = load_curated_templates()
|
|
print(f"{'ID':<25} {'Name':<30} {'Fields':<8} Best for")
|
|
print("-" * 90)
|
|
for tid, tmpl in sorted(templates.items()):
|
|
fields = len(tmpl["fields"])
|
|
print(f"{tid:<25} {tmpl['name']:<30} {fields:<8} {tmpl['best_for']}")
|
|
print(f"\n{len(templates)} curated templates with custom text positioning.")
|
|
print("Use --search to find any of the ~100 popular imgflip templates.")
|
|
|
|
|
|
def search_templates(query: str):
|
|
"""Search imgflip templates by name."""
|
|
imgflip_memes = fetch_imgflip_templates()
|
|
curated = load_curated_templates()
|
|
curated_slugs = {_slugify(t["name"]) for t in curated.values()}
|
|
query_lower = query.lower()
|
|
|
|
matches = []
|
|
for meme in imgflip_memes:
|
|
if query_lower in meme["name"].lower():
|
|
slug = _slugify(meme["name"])
|
|
has_custom = "curated" if slug in curated_slugs else "default"
|
|
matches.append((meme["name"], meme["id"], meme.get("box_count", 2), has_custom))
|
|
|
|
if not matches:
|
|
print(f"No templates found matching '{query}'")
|
|
return
|
|
|
|
print(f"{'Name':<40} {'ID':<12} {'Fields':<8} Positioning")
|
|
print("-" * 75)
|
|
for name, mid, boxes, positioning in matches:
|
|
print(f"{name:<40} {mid:<12} {boxes:<8} {positioning}")
|
|
print(f"\n{len(matches)} template(s) found. Use the name or ID as the first argument.")
|
|
|
|
|
|
if __name__ == "__main__":
|
|
if len(sys.argv) < 2:
|
|
print("Usage: generate_meme.py <template_id_or_name> <output_path> <text1> [text2] ...")
|
|
print(" generate_meme.py --image <path> [--bars] <output_path> <text1> [text2] ...")
|
|
print(" generate_meme.py --list # curated templates")
|
|
print(" generate_meme.py --search <query> # search all imgflip templates")
|
|
sys.exit(1)
|
|
|
|
if sys.argv[1] == "--list":
|
|
list_templates()
|
|
sys.exit(0)
|
|
|
|
if sys.argv[1] == "--search":
|
|
if len(sys.argv) < 3:
|
|
print("Usage: generate_meme.py --search <query>")
|
|
sys.exit(1)
|
|
search_templates(sys.argv[2])
|
|
sys.exit(0)
|
|
|
|
if sys.argv[1] == "--image":
|
|
# Custom image mode: --image <path> [--bars] <output> <text1> ...
|
|
args = sys.argv[2:]
|
|
if len(args) < 3:
|
|
print("Usage: generate_meme.py --image <image_path> [--bars] <output_path> <text1> ...")
|
|
sys.exit(1)
|
|
image_path = args.pop(0)
|
|
use_bars = False
|
|
if args and args[0] == "--bars":
|
|
use_bars = True
|
|
args.pop(0)
|
|
if len(args) < 2:
|
|
print("Need at least: output_path and one text argument")
|
|
sys.exit(1)
|
|
output_path = args.pop(0)
|
|
result = generate_from_image(image_path, args, output_path, use_bars=use_bars)
|
|
print(f"Meme saved to: {result}")
|
|
sys.exit(0)
|
|
|
|
if len(sys.argv) < 4:
|
|
print("Need at least: template_id_or_name, output_path, and one text argument")
|
|
sys.exit(1)
|
|
|
|
template_id = sys.argv[1]
|
|
output_path = sys.argv[2]
|
|
texts = sys.argv[3:]
|
|
|
|
result = generate_meme(template_id, texts, output_path)
|
|
print(f"Meme saved to: {result}")
|