{"type":"link","version":"1.0","title":"LLM judges require full trajectory context to trigger at all, then achieve only F1 0.17–0.40 at 90x baseline cost","author_name":"AI Archs","author_url":"https://ai-arch.pages.dev","provider_name":"AI Archs","provider_url":"https://ai-arch.pages.dev","url":"https://ai-arch.pages.dev/n/llm-judge-context-floor-for-intervention-detection","thumbnail_url":"https://ai-arch.pages.dev/android-chrome-512x512.png","thumbnail_width":512,"thumbnail_height":512}