Changes

2026-04-16 15:46:56 +01:00
parent 8c8d9a6d47
commit a755e12ea3
2 changed files with 20 additions and 35 deletions
--- a/gen_face_ai.py
+++ b/gen_face_ai.py
@@ -1,17 +1,13 @@
 #!/usr/bin/env python3
 """
-gen_face_ai.py  –  Generate assets/face_wire.png using Gemini image generation
-────────────────────────────────────────────────────────────────────────────────
-Uses the Gemini / Google Gen AI SDK with a native image-generation model
-(gemini-2.5-flash-image or similar) to produce a wireframe face PNG ready for
-display.py to load.
+gen_face_ai.py  –  Generate assets/face_wire.png via Gemini image generation
+──────────────────────────────────────────────────────────────────────────────
+Run once to produce the face PNG that display.py loads at startup.

    pip install google-genai pillow
    python3 gen_face_ai.py

-Or set the key in the environment:
-    export GEMINI_API_KEY=YOUR_KEY
-    python3 gen_face_ai.py
+Pass --list-models to print the models your key can reach that support generateContent.
 """

 import os
@@ -19,16 +15,15 @@ import sys
 import io
 import argparse

-# ── Paste your Gemini API key here ────────────────────────────────────────────
+# ── API key ───────────────────────────────────────────────────────────────────
 API_KEY = 'AQ.Ab8RN6LuGwkGiKPa61jsLAEYEpJp1Yl2EkZuBWTbN9AMKxgTSw'
 # ─────────────────────────────────────────────────────────────────────────────

-# ── CLI ───────────────────────────────────────────────────────────────────────
 ap = argparse.ArgumentParser()
-ap.add_argument('--key',  default='', help='Override the hardcoded API key')
-ap.add_argument('--out',  default='assets/face_wire.png')
+ap.add_argument('--key',   default='', help='Override the hardcoded API key')
+ap.add_argument('--out',   default='assets/face_wire.png')
 ap.add_argument('--model', default='gemini-2.5-flash-image',
-                help='Gemini image model to use (default: gemini-2.5-flash-image)')
+                help='Gemini image model to use')
 ap.add_argument('--list-models', action='store_true',
                help='Print models that support generateContent then exit')
 args = ap.parse_args()
@@ -37,7 +32,6 @@ api_key = args.key or API_KEY or os.environ.get('GEMINI_API_KEY', '')
 if not api_key:
    sys.exit('ERROR: paste your key into API_KEY at the top of this file')

-# ── Install check ─────────────────────────────────────────────────────────────
 try:
    from google import genai
    from google.genai import types
@@ -49,7 +43,6 @@ try:
 except ImportError:
    sys.exit('Run:  pip install pillow   then try again.')

-# ── Connect ───────────────────────────────────────────────────────────────────
 print('Connecting to Google GenAI …')
 client = genai.Client(api_key=api_key)

@@ -61,7 +54,6 @@ if args.list_models:
            print(f'  {m.name}')
    sys.exit(0)

-# ── Prompt ────────────────────────────────────────────────────────────────────
 PROMPT = (
    "3D wireframe polygon mesh of a human head and face, viewed from slightly "
    "below, front-facing, neutral expression, pure black background, thin "
@@ -70,17 +62,15 @@ PROMPT = (
    "style, high contrast monochrome"
 )

-# ── Generate ──────────────────────────────────────────────────────────────────
 print(f'Generating with {args.model} …')
 response = client.models.generate_content(
-    model   = args.model,
-    contents= PROMPT,
-    config  = types.GenerateContentConfig(
+    model    = args.model,
+    contents = PROMPT,
+    config   = types.GenerateContentConfig(
        response_modalities = ['IMAGE', 'TEXT'],
    ),
 )

-# ── Extract image bytes ───────────────────────────────────────────────────────
 img_bytes = None
 for part in response.candidates[0].content.parts:
    if part.inline_data and part.inline_data.mime_type.startswith('image/'):
@@ -88,17 +78,12 @@ for part in response.candidates[0].content.parts:
        break

 if img_bytes is None:
-    # Print any text the model returned to help debug
    for part in response.candidates[0].content.parts:
        if hasattr(part, 'text') and part.text:
-            print('Model text response:', part.text[:400])
+            print('Model said:', part.text[:400])
    sys.exit('No image in response – try a different --model')

-# ── Save as PNG ───────────────────────────────────────────────────────────────
-os.makedirs(os.path.dirname(args.out) if os.path.dirname(args.out) else '.',
-            exist_ok=True)
-
-# Convert whatever format came back to a proper PNG
+os.makedirs(os.path.dirname(args.out) if os.path.dirname(args.out) else '.', exist_ok=True)
 img = Image.open(io.BytesIO(img_bytes))
 img.save(args.out, 'PNG')