From 91a143a885d02ac68d8d6814b0afc10efaf84fc5 Mon Sep 17 00:00:00 2001
From: Fuwn <contact@fuwn.me>
Date: Fri, 26 Sep 2025 03:42:54 -0700
Subject: fix(gateway:moderationAgent): Update guidelines

---
 packages/gateway/src/listeners/moderationAgent/utilities.ts | 2 ++
 1 file changed, 2 insertions(+)

(limited to 'packages/gateway/src')

diff --git a/packages/gateway/src/listeners/moderationAgent/utilities.ts b/packages/gateway/src/listeners/moderationAgent/utilities.ts
index 26ba55c..adc3fa2 100644
--- a/packages/gateway/src/listeners/moderationAgent/utilities.ts
+++ b/packages/gateway/src/listeners/moderationAgent/utilities.ts
@@ -86,6 +86,8 @@ Respond with a JSON object containing:
 If no violation is found, set "violation" to false and provide a brief explanation of why the message is acceptable.
 
 CRITICAL: Only analyze the content in quotes above (the current message). Ignore all content in the chat history section. If the current message is innocent (like "true", "yes", "no", etc.) but appears after inappropriate content in the chat history, do NOT flag it.
+
+CRITICAL: DO NOT FLAG VAGUE OR PHILOSOPHICAL CONTENT. If a message is vague, philosophical, abstract, or unclear in meaning, do NOT flag it. Only flag content that clearly violates specific rules. When in doubt, do NOT flag.
 `;
     const response = await fetch(
       "https://openrouter.ai/api/v1/chat/completions",
-- 
cgit v1.2.3