diff --git a/prompts/quality-evaluator.md b/prompts/quality-evaluator.md
index 418adc9ce7..a8ec117642 100644
--- a/prompts/quality-evaluator.md
+++ b/prompts/quality-evaluator.md
@@ -97,7 +97,7 @@ You evaluate implementations that passed all auto-reject checks. Focus purely on
 
   "visual_quality": {
     "total": 23,
-    "vq01_text_legibility": {"score": 5, "max": 8, "note": "Readable but relying on defaults (font sizes not explicitly set)"},
+    "vq01_text_legibility": {"score": 6, "max": 8, "note": "Title slightly oversized for content — fontsize=18pt squeezes against the right edge; reduce to ~14pt"},
     "vq02_no_overlap": {"score": 6, "max": 6, "note": "No overlap"},
     "vq03_element_visibility": {"score": 5, "max": 6, "note": "Visible but markers could be better adapted"},
     "vq04_color_accessibility": {"score": 2, "max": 2, "note": "CVD-safe contrast beyond palette choice"},
@@ -150,7 +150,7 @@ You evaluate implementations that passed all auto-reject checks. Focus purely on
   ],
 
   "weaknesses": [
-    "Relying on default font sizes instead of explicit settings",
+    "Title at fontsize=18pt squeezes against the right edge — reduce to ~14pt for the long mandated anyplot title format",
     "No design refinement beyond library defaults",
     "No data storytelling - visual emphasis or hierarchy would improve the plot"
   ],