feat: channel-level conversation analysis with compact formatting

Switch from per-user message batching to per-channel conversation analysis. The LLM now sees the full interleaved conversation with relative timestamps, reply chains, and consecutive message collapsing instead of isolated flat text per user.

Key changes:
- Fix gpt-5-nano temperature incompatibility (conditional temp param)
- Add mention-triggered scan: users @mention bot to analyze recent chat
- Refactor debounce buffer from (channel_id, user_id) to channel_id
- Replace per-message analyze_message() with analyze_conversation() returning per-user findings from a single LLM call
- Add CONVERSATION_TOOL schema with coherence, topic, and game fields
- Compact message format: relative timestamps, reply arrows (→), consecutive same-user message collapsing
- Separate mention scan tasks from debounce tasks
- Remove _store_context/_get_context (conversation block IS the context)
- Escalation timeout config: [30, 60, 120, 240] minutes

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-24 23:13:07 -05:00
parent 943c67cc87
commit 90b70cad69
5 changed files with 793 additions and 227 deletions
@@ -153,6 +153,19 @@ class ChatCog(commands.Cog):
            if not content:
                content = "(just pinged me)" if not is_proactive else message.content

+            # If a mention scan is running, await it so we can include findings
+            scan_summary = ""
+            if self.bot.user in message.mentions:
+                sentiment_cog = self.bot.get_cog("SentimentCog")
+                if sentiment_cog:
+                    task = sentiment_cog._mention_scan_tasks.get(message.channel.id)
+                    if task and not task.done():
+                        try:
+                            await asyncio.wait_for(asyncio.shield(task), timeout=45)
+                        except (asyncio.TimeoutError, asyncio.CancelledError):
+                            pass
+                    scan_summary = sentiment_cog._mention_scan_results.pop(message.id, "")
+
            # Add drama score context only when noteworthy
            drama_score = self.bot.drama_tracker.get_drama_score(message.author.id)
            user_data = self.bot.drama_tracker.get_user(message.author.id)
@@ -169,6 +182,10 @@ class ChatCog(commands.Cog):
            if user_notes:
                extra_context += f"[Notes about {message.author.display_name}: {user_notes}]\n"

+            # Include mention scan findings if available
+            if scan_summary:
+                extra_context += f"[You just scanned recent chat. Results: {scan_summary}]\n"
+
            recent_user_msgs = []
            try:
                async for msg in message.channel.history(limit=50, before=message):
@@ -239,8 +256,7 @@ class ChatCog(commands.Cog):
        # warnings/mutes appear before the chat reply
        sentiment_cog = self.bot.get_cog("SentimentCog")
        if sentiment_cog:
-            key = (message.channel.id, message.author.id)
-            task = sentiment_cog._debounce_tasks.get(key)
+            task = sentiment_cog._debounce_tasks.get(message.channel.id)
            if task and not task.done():
                try:
                    await asyncio.wait_for(asyncio.shield(task), timeout=15)
@@ -1,8 +1,8 @@
 import asyncio
 import logging
-from collections import deque
 from datetime import datetime, timedelta, timezone

+
 import discord
 from discord.ext import commands, tasks

@@ -15,17 +15,21 @@ STATE_FLUSH_INTERVAL = 300  # 5 minutes
 class SentimentCog(commands.Cog):
    def __init__(self, bot: commands.Bot):
        self.bot = bot
-        # Per-channel message history for context: {channel_id: deque of (author, content)}
-        self._channel_history: dict[int, deque] = {}
        # Track which user IDs have unsaved in-memory changes
        self._dirty_users: set[int] = set()
        # Per-user redirect cooldown: {user_id: last_redirect_datetime}
        self._redirect_cooldowns: dict[int, datetime] = {}
-        # Debounce buffer: keyed by (channel_id, user_id), stores list of messages
-        self._message_buffer: dict[tuple[int, int], list[discord.Message]] = {}
-        # Pending debounce timer tasks
-        self._debounce_tasks: dict[tuple[int, int], asyncio.Task] = {}
-        # Per-channel poll cooldown: {channel_id: last_poll_datetime}
+        # Debounce buffer: keyed by channel_id, stores list of messages from ALL users
+        self._message_buffer: dict[int, list[discord.Message]] = {}
+        # Pending debounce timer tasks (per-channel)
+        self._debounce_tasks: dict[int, asyncio.Task] = {}
+        # Mention scan tasks (separate from debounce)
+        self._mention_scan_tasks: dict[int, asyncio.Task] = {}
+        # Mention scan state
+        self._mention_scan_cooldowns: dict[int, datetime] = {}  # {channel_id: last_scan_time}
+        self._mention_scan_results: dict[int, str] = {}  # {trigger_message_id: findings_summary}
+        self._analyzed_message_ids: set[int] = set()  # Discord message IDs already analyzed
+        self._max_analyzed_ids = 500


    async def cog_load(self):
@@ -37,8 +41,11 @@ class SentimentCog(commands.Cog):
        for task in self._debounce_tasks.values():
            task.cancel()
        self._debounce_tasks.clear()
-        for key in list(self._message_buffer):
-            await self._process_buffered(key)
+        for task in self._mention_scan_tasks.values():
+            task.cancel()
+        self._mention_scan_tasks.clear()
+        for channel_id in list(self._message_buffer):
+            await self._process_buffered(channel_id)
        # Final flush on shutdown
        await self._flush_dirty_states()

@@ -80,202 +87,174 @@ class SentimentCog(commands.Cog):
        if self.bot.drama_tracker.is_immune(message.author.id):
            return

-        # Skip sentiment analysis for messages directed at the bot
-        # (mentions, replies to bot) — users interacting with the bot
-        # in roast/chat modes shouldn't have those messages scored as toxic
+        # Messages directed at the bot (mentions, replies) shouldn't be scored
+        # for toxicity — but @mentions can trigger a scan of recent chat
        directed_at_bot = self.bot.user in message.mentions
        if not directed_at_bot and message.reference and message.reference.message_id:
            ref = message.reference.cached_message
            if ref and ref.author.id == self.bot.user.id:
                directed_at_bot = True
        if directed_at_bot:
+            # @mention (not just reply-to-bot) triggers a mention scan
+            if self.bot.user in message.mentions:
+                mention_config = config.get("mention_scan", {})
+                if mention_config.get("enabled", True):
+                    await self._maybe_start_mention_scan(message, mention_config)
            return

-        # Store message in channel history for context
-        self._store_context(message)
-
        # Skip if empty
        if not message.content or not message.content.strip():
            return

-        # Buffer the message and start/reset debounce timer
-        key = (message.channel.id, message.author.id)
-        if key not in self._message_buffer:
-            self._message_buffer[key] = []
-        self._message_buffer[key].append(message)
+        # Buffer the message and start/reset debounce timer (per-channel)
+        channel_id = message.channel.id
+        if channel_id not in self._message_buffer:
+            self._message_buffer[channel_id] = []
+        self._message_buffer[channel_id].append(message)

-        # Cancel existing debounce timer for this user+channel
-        existing_task = self._debounce_tasks.get(key)
+        # Cancel existing debounce timer for this channel
+        existing_task = self._debounce_tasks.get(channel_id)
        if existing_task and not existing_task.done():
            existing_task.cancel()

-        # Skip debounce when bot is @mentioned so warnings fire before chat replies
-        if self.bot.user in message.mentions:
-            batch_window = 0
-        else:
-            batch_window = config.get("sentiment", {}).get("batch_window_seconds", 3)
+        batch_window = config.get("sentiment", {}).get("batch_window_seconds", 3)

-        self._debounce_tasks[key] = asyncio.create_task(
-            self._debounce_then_process(key, batch_window)
+        self._debounce_tasks[channel_id] = asyncio.create_task(
+            self._debounce_then_process(channel_id, batch_window)
        )

-    async def _debounce_then_process(self, key: tuple[int, int], delay: float):
+    async def _debounce_then_process(self, channel_id: int, delay: float):
        """Sleep for the debounce window, then process the buffered messages."""
        try:
            await asyncio.sleep(delay)
-            await self._process_buffered(key)
+            await self._process_buffered(channel_id)
        except asyncio.CancelledError:
            pass  # Timer was reset by a new message — expected

-    async def _process_buffered(self, key: tuple[int, int]):
-        """Combine buffered messages and run the analysis pipeline once."""
-        messages = self._message_buffer.pop(key, [])
-        self._debounce_tasks.pop(key, None)
+    async def _process_buffered(self, channel_id: int):
+        """Collect buffered messages, build conversation block, and run analysis."""
+        messages = self._message_buffer.pop(channel_id, [])
+        self._debounce_tasks.pop(channel_id, None)

        if not messages:
            return

-        # Use the last message as the reference for channel, author, guild, etc.
-        message = messages[-1]
-        combined_content = "\n".join(m.content for m in messages if m.content and m.content.strip())
-
-        if not combined_content.strip():
-            return
-
-        batch_count = len(messages)
-        if batch_count > 1:
-            logger.info(
-                "Batched %d messages from %s in #%s",
-                batch_count, message.author.display_name,
-                getattr(message.channel, 'name', 'unknown'),
-            )
+        # Use the last message as reference for channel/guild
+        ref_message = messages[-1]
+        channel = ref_message.channel

        config = self.bot.config
-        monitoring = config.get("monitoring", {})
        sentiment_config = config.get("sentiment", {})
-
-        # Build channel context for game detection
        game_channels = config.get("game_channels", {})
-        channel_context = self._build_channel_context(message, game_channels)

-        # Analyze the combined message (triage with lightweight model)
-        context = self._get_context(message)
-        user_notes = self.bot.drama_tracker.get_user_notes(message.author.id)
-        result = await self.bot.llm.analyze_message(
-            combined_content, context, user_notes=user_notes,
+        # Fetch some history before the buffered messages for leading context
+        context_count = sentiment_config.get("context_messages", 8)
+        oldest_buffered = messages[0]
+        history_messages: list[discord.Message] = []
+        try:
+            async for msg in channel.history(limit=context_count + 5, before=oldest_buffered):
+                if msg.author.bot:
+                    continue
+                if not msg.content or not msg.content.strip():
+                    continue
+                history_messages.append(msg)
+                if len(history_messages) >= context_count:
+                    break
+        except discord.HTTPException:
+            pass
+
+        history_messages.reverse()  # chronological order
+
+        # Combine: history (context) + buffered (new messages to analyze)
+        all_messages = history_messages + messages
+
+        # Build msg_id_to_author lookup for reply resolution
+        msg_id_to_author: dict[int, str] = {
+            m.id: m.author.display_name for m in all_messages
+        }
+
+        # Convert to conversation tuples: (username, content, timestamp, reply_to_username)
+        conversation: list[tuple[str, str, datetime, str | None]] = []
+        for msg in all_messages:
+            reply_to = None
+            if msg.reference and msg.reference.message_id:
+                reply_to = msg_id_to_author.get(msg.reference.message_id)
+                if not reply_to:
+                    ref = msg.reference.cached_message
+                    if ref:
+                        reply_to = ref.author.display_name
+            conversation.append((
+                msg.author.display_name,
+                msg.content,
+                msg.created_at,
+                reply_to,
+            ))
+
+        if not conversation:
+            return
+
+        # Build user notes map (only for users in the buffer, not history-only)
+        user_notes_map: dict[str, str] = {}
+        for msg in messages:
+            name = msg.author.display_name
+            if name not in user_notes_map:
+                notes = self.bot.drama_tracker.get_user_notes(msg.author.id)
+                if notes:
+                    user_notes_map[name] = notes
+
+        channel_context = self._build_channel_context(ref_message, game_channels)
+
+        logger.info(
+            "Channel analysis: %d new messages (+%d context) in #%s",
+            len(messages), len(history_messages),
+            getattr(channel, 'name', 'unknown'),
+        )
+
+        # TRIAGE: Lightweight model — conversation-level analysis
+        result = await self.bot.llm.analyze_conversation(
+            conversation,
            channel_context=channel_context,
+            user_notes_map=user_notes_map,
        )

        if result is None:
            return

-        # Escalation: re-analyze with heavy model if triage flags something
+        # ESCALATION: Re-analyze with heavy model if any finding warrants it
        escalation_threshold = sentiment_config.get("escalation_threshold", 0.25)
-        needs_escalation = (
-            result["toxicity_score"] >= escalation_threshold
-            or result.get("off_topic", False)
-            or result.get("coherence_score", 1.0) < 0.6
+        needs_escalation = any(
+            f["toxicity_score"] >= escalation_threshold
+            or f.get("off_topic", False)
+            or f.get("coherence_score", 1.0) < 0.6
+            for f in result.get("user_findings", [])
        )
        if needs_escalation:
-            triage_score = result["toxicity_score"]
-            heavy_result = await self.bot.llm_heavy.analyze_message(
-                combined_content, context, user_notes=user_notes,
+            heavy_result = await self.bot.llm_heavy.analyze_conversation(
+                conversation,
                channel_context=channel_context,
+                user_notes_map=user_notes_map,
            )
            if heavy_result is not None:
                logger.info(
-                    "Escalated to heavy model (triage_score=%.2f) for %s",
-                    triage_score, message.author.display_name,
+                    "Escalated to heavy model for #%s",
+                    getattr(channel, 'name', 'unknown'),
                )
                result = heavy_result

-        score = result["toxicity_score"]
-        categories = result["categories"]
-        reasoning = result["reasoning"]
+        # Build username -> (user_id, ref_msg, [messages]) for buffered users only
+        user_lookup: dict[str, tuple[int, discord.Message, list[discord.Message]]] = {}
+        for msg in messages:
+            name = msg.author.display_name
+            if name not in user_lookup:
+                user_lookup[name] = (msg.author.id, msg, [])
+            user_lookup[name][2].append(msg)

-        # Track the result
-        self.bot.drama_tracker.add_entry(
-            message.author.id, score, categories, reasoning
-        )
+        # Mark all buffered messages as analyzed (for mention scan dedup)
+        for m in messages:
+            self._mark_analyzed(m.id)

-        drama_score = self.bot.drama_tracker.get_drama_score(message.author.id)
-
-        logger.info(
-            "User %s (%d) | msg_score=%.2f | drama_score=%.2f | categories=%s | %s",
-            message.author.display_name,
-            message.author.id,
-            score,
-            drama_score,
-            categories,
-            reasoning,
-        )
-
-        # Topic drift detection
-        off_topic = result.get("off_topic", False)
-        topic_category = result.get("topic_category", "general_chat")
-        topic_reasoning = result.get("topic_reasoning", "")
-
-        # Save message + analysis to DB (awaited — need message_id for action links)
-        db_message_id = await self.bot.db.save_message_and_analysis(
-            guild_id=message.guild.id,
-            channel_id=message.channel.id,
-            user_id=message.author.id,
-            username=message.author.display_name,
-            content=combined_content,
-            message_ts=message.created_at.replace(tzinfo=timezone.utc),
-            toxicity_score=score,
-            drama_score=drama_score,
-            categories=categories,
-            reasoning=reasoning,
-            off_topic=off_topic,
-            topic_category=topic_category,
-            topic_reasoning=topic_reasoning,
-            coherence_score=result.get("coherence_score"),
-            coherence_flag=result.get("coherence_flag"),
-        )
-
-        if off_topic:
-            await self._handle_topic_drift(message, topic_category, topic_reasoning, db_message_id)
-
-        # Game channel redirect detection
-        detected_game = result.get("detected_game")
-        if detected_game and game_channels and not monitoring.get("dry_run", False):
-            await self._handle_channel_redirect(message, detected_game, game_channels, db_message_id)
-
-        # Coherence / intoxication detection
-        coherence_score = result.get("coherence_score", 0.85)
-        coherence_flag = result.get("coherence_flag", "normal")
-        coherence_config = config.get("coherence", {})
-        if coherence_config.get("enabled", True):
-            degradation = self.bot.drama_tracker.update_coherence(
-                user_id=message.author.id,
-                score=coherence_score,
-                flag=coherence_flag,
-                drop_threshold=coherence_config.get("drop_threshold", 0.3),
-                absolute_floor=coherence_config.get("absolute_floor", 0.5),
-                cooldown_minutes=coherence_config.get("cooldown_minutes", 30),
-            )
-            if degradation and not config.get("monitoring", {}).get("dry_run", False):
-                await self._handle_coherence_alert(message, degradation, coherence_config, db_message_id)
-
-        # Capture LLM note updates about this user
-        note_update = result.get("note_update")
-        if note_update:
-            self.bot.drama_tracker.update_user_notes(message.author.id, note_update)
-            self._dirty_users.add(message.author.id)
-
-        # Mark dirty for coherence baseline drift even without actions
-        self._dirty_users.add(message.author.id)
-
-        # Always log analysis to #bcs-log if it exists
-        await self._log_analysis(message, score, drama_score, categories, reasoning, off_topic, topic_category)
-
-        # Dry-run mode: skip warnings/mutes
+        # Resolve thresholds once
        dry_run = config.get("monitoring", {}).get("dry_run", False)
-        if dry_run:
-            return
-
-        # Check thresholds — use relaxed thresholds if the active mode says so
        mode_config = self.bot.get_mode_config()
        moderation_level = mode_config.get("moderation", "full")
        if moderation_level == "relaxed" and "relaxed_thresholds" in mode_config:
@@ -289,18 +268,365 @@ class SentimentCog(commands.Cog):
            base_mute_threshold = sentiment_config.get("mute_threshold", 0.75)
            spike_warn = sentiment_config.get("spike_warning_threshold", 0.5)
            spike_mute = sentiment_config.get("spike_mute_threshold", 0.8)
-        mute_threshold = self.bot.drama_tracker.get_mute_threshold(
-            message.author.id, base_mute_threshold
+        coherence_config = config.get("coherence", {})
+
+        # Process per-user findings
+        for finding in result.get("user_findings", []):
+            username = finding["username"]
+            lookup = user_lookup.get(username)
+            if not lookup:
+                # LLM returned a finding for a history-only user or unknown name; skip
+                continue
+
+            user_id, user_ref_msg, user_msgs = lookup
+            score = finding["toxicity_score"]
+            categories = finding["categories"]
+            reasoning = finding["reasoning"]
+            off_topic = finding.get("off_topic", False)
+            topic_category = finding.get("topic_category", "general_chat")
+            topic_reasoning = finding.get("topic_reasoning", "")
+            coherence_score = finding.get("coherence_score", 0.85)
+            coherence_flag = finding.get("coherence_flag", "normal")
+            note_update = finding.get("note_update")
+            detected_game = finding.get("detected_game")
+
+            # Track the result in DramaTracker
+            self.bot.drama_tracker.add_entry(user_id, score, categories, reasoning)
+            drama_score = self.bot.drama_tracker.get_drama_score(user_id)
+
+            logger.info(
+                "User %s (%d) | msg_score=%.2f | drama_score=%.2f | categories=%s | %s",
+                username, user_id, score, drama_score, categories, reasoning,
+            )
+
+            # Save message + analysis to DB
+            combined_content = "\n".join(
+                m.content for m in user_msgs if m.content and m.content.strip()
+            )
+            db_message_id = await self.bot.db.save_message_and_analysis(
+                guild_id=user_ref_msg.guild.id,
+                channel_id=user_ref_msg.channel.id,
+                user_id=user_id,
+                username=username,
+                content=combined_content[:4000],
+                message_ts=user_ref_msg.created_at.replace(tzinfo=timezone.utc),
+                toxicity_score=score,
+                drama_score=drama_score,
+                categories=categories,
+                reasoning=reasoning,
+                off_topic=off_topic,
+                topic_category=topic_category,
+                topic_reasoning=topic_reasoning,
+                coherence_score=coherence_score,
+                coherence_flag=coherence_flag,
+            )
+
+            # Topic drift handling
+            if off_topic:
+                await self._handle_topic_drift(user_ref_msg, topic_category, topic_reasoning, db_message_id)
+
+            # Game channel redirect detection
+            if detected_game and game_channels and not dry_run:
+                await self._handle_channel_redirect(user_ref_msg, detected_game, game_channels, db_message_id)
+
+            # Coherence / intoxication detection
+            if coherence_config.get("enabled", True):
+                degradation = self.bot.drama_tracker.update_coherence(
+                    user_id=user_id,
+                    score=coherence_score,
+                    flag=coherence_flag,
+                    drop_threshold=coherence_config.get("drop_threshold", 0.3),
+                    absolute_floor=coherence_config.get("absolute_floor", 0.5),
+                    cooldown_minutes=coherence_config.get("cooldown_minutes", 30),
+                )
+                if degradation and not dry_run:
+                    await self._handle_coherence_alert(user_ref_msg, degradation, coherence_config, db_message_id)
+
+            # Capture LLM note updates about this user
+            if note_update:
+                self.bot.drama_tracker.update_user_notes(user_id, note_update)
+                self._dirty_users.add(user_id)
+
+            # Mark dirty for coherence baseline drift even without actions
+            self._dirty_users.add(user_id)
+
+            # Always log analysis to #bcs-log if it exists
+            await self._log_analysis(user_ref_msg, score, drama_score, categories, reasoning, off_topic, topic_category)
+
+            # Moderation actions (skip in dry-run mode)
+            if not dry_run:
+                mute_threshold = self.bot.drama_tracker.get_mute_threshold(
+                    user_id, base_mute_threshold
+                )
+                # Mute: rolling average OR single message spike
+                if drama_score >= mute_threshold or score >= spike_mute:
+                    effective_score = max(drama_score, score)
+                    await self._mute_user(user_ref_msg, effective_score, categories, db_message_id)
+                # Warn: rolling average OR single message spike
+                elif drama_score >= warning_threshold or score >= spike_warn:
+                    effective_score = max(drama_score, score)
+                    await self._warn_user(user_ref_msg, effective_score, db_message_id)
+
+    # -- Mention scan methods --
+
+    def _mark_analyzed(self, discord_message_id: int):
+        """Track a Discord message ID as already analyzed."""
+        self._analyzed_message_ids.add(discord_message_id)
+        if len(self._analyzed_message_ids) > self._max_analyzed_ids:
+            sorted_ids = sorted(self._analyzed_message_ids)
+            self._analyzed_message_ids = set(sorted_ids[len(sorted_ids) // 2:])
+
+    async def _maybe_start_mention_scan(
+        self, trigger_message: discord.Message, mention_config: dict
+    ):
+        """Check cooldown and kick off a mention-triggered scan of recent messages."""
+        channel_id = trigger_message.channel.id
+        cooldown_seconds = mention_config.get("cooldown_seconds", 60)
+
+        now = datetime.now(timezone.utc)
+        last_scan = self._mention_scan_cooldowns.get(channel_id)
+        if last_scan and (now - last_scan).total_seconds() < cooldown_seconds:
+            logger.info(
+                "Mention scan cooldown active for #%s, skipping.",
+                getattr(trigger_message.channel, "name", "unknown"),
+            )
+            return
+
+        self._mention_scan_cooldowns[channel_id] = now
+
+        # Extract the user's concern (strip the bot ping from the message)
+        mention_text = trigger_message.content
+        for fmt in (f"<@{self.bot.user.id}>", f"<@!{self.bot.user.id}>"):
+            mention_text = mention_text.replace(fmt, "")
+        mention_text = mention_text.strip() or "(user pinged bot without specific concern)"
+
+        # Store as a mention scan task (separate from debounce)
+        existing_task = self._mention_scan_tasks.get(channel_id)
+        if existing_task and not existing_task.done():
+            existing_task.cancel()
+
+        self._mention_scan_tasks[channel_id] = asyncio.create_task(
+            self._run_mention_scan(trigger_message, mention_text, mention_config)
        )

-        # Mute: rolling average OR single message spike
-        if drama_score >= mute_threshold or score >= spike_mute:
-            effective_score = max(drama_score, score)
-            await self._mute_user(message, effective_score, categories, db_message_id)
-        # Warn: rolling average OR single message spike
-        elif drama_score >= warning_threshold or score >= spike_warn:
-            effective_score = max(drama_score, score)
-            await self._warn_user(message, effective_score, db_message_id)
+    async def _run_mention_scan(
+        self,
+        trigger_message: discord.Message,
+        mention_text: str,
+        mention_config: dict,
+    ):
+        """Scan recent channel messages with ONE conversation-level LLM call."""
+        channel = trigger_message.channel
+        scan_count = mention_config.get("scan_messages", 30)
+
+        config = self.bot.config
+        sentiment_config = config.get("sentiment", {})
+        game_channels = config.get("game_channels", {})
+
+        # Fetch recent messages (before the trigger, skip bots/empty)
+        raw_messages: list[discord.Message] = []
+        try:
+            async for msg in channel.history(limit=scan_count + 10, before=trigger_message):
+                if msg.author.bot:
+                    continue
+                if not msg.content or not msg.content.strip():
+                    continue
+                raw_messages.append(msg)
+                if len(raw_messages) >= scan_count:
+                    break
+        except discord.HTTPException:
+            logger.warning("Failed to fetch history for mention scan in #%s",
+                           getattr(channel, "name", "unknown"))
+            return
+
+        raw_messages.reverse()  # chronological order
+
+        if not raw_messages:
+            self._mention_scan_results[trigger_message.id] = "No recent messages found to analyze."
+            return
+
+        logger.info(
+            "Mention scan triggered by %s in #%s: %d messages (single LLM call). Focus: %s",
+            trigger_message.author.display_name,
+            getattr(channel, "name", "unknown"),
+            len(raw_messages),
+            mention_text[:80],
+        )
+
+        # Build a lookup of message IDs to authors for resolving replies
+        msg_id_to_author: dict[int, str] = {
+            m.id: m.author.display_name for m in raw_messages
+        }
+
+        # Convert to conversation tuples: (username, content, timestamp, reply_to)
+        conversation: list[tuple[str, str, datetime, str | None]] = []
+        for msg in raw_messages:
+            reply_to = None
+            if msg.reference and msg.reference.message_id:
+                # Try our local lookup first
+                reply_to = msg_id_to_author.get(msg.reference.message_id)
+                if not reply_to:
+                    # Try the cached message
+                    ref = msg.reference.cached_message
+                    if ref:
+                        reply_to = ref.author.display_name
+            conversation.append((
+                msg.author.display_name,
+                msg.content,
+                msg.created_at,
+                reply_to,
+            ))
+
+        # Build user notes map
+        user_notes_map: dict[str, str] = {}
+        for msg in raw_messages:
+            name = msg.author.display_name
+            if name not in user_notes_map:
+                notes = self.bot.drama_tracker.get_user_notes(msg.author.id)
+                if notes:
+                    user_notes_map[name] = notes
+
+        channel_context = self._build_channel_context(raw_messages[0], game_channels)
+        mention_context = (
+            f"A user flagged this conversation and said: \"{mention_text}\"\n"
+            f"Pay special attention to whether this concern is valid."
+        )
+
+        # Single LLM call
+        result = await self.bot.llm.analyze_conversation(
+            conversation,
+            mention_context=mention_context,
+            channel_context=channel_context,
+            user_notes_map=user_notes_map,
+        )
+
+        if result is None:
+            logger.warning("Conversation analysis failed for mention scan.")
+            self._mention_scan_results[trigger_message.id] = "Analysis failed."
+            return
+
+        # Build username → user_id + ref_message mapping
+        user_lookup: dict[str, tuple[int, discord.Message, list[discord.Message]]] = {}
+        for msg in raw_messages:
+            name = msg.author.display_name
+            if name not in user_lookup:
+                user_lookup[name] = (msg.author.id, msg, [])
+            user_lookup[name][2].append(msg)
+
+        findings: list[str] = []
+
+        # Resolve thresholds once (outside the loop)
+        dry_run = config.get("monitoring", {}).get("dry_run", False)
+        mode_config = self.bot.get_mode_config()
+        moderation_level = mode_config.get("moderation", "full")
+        if moderation_level == "relaxed" and "relaxed_thresholds" in mode_config:
+            rt = mode_config["relaxed_thresholds"]
+            warning_threshold = rt.get("warning_threshold", 0.80)
+            base_mute_threshold = rt.get("mute_threshold", 0.85)
+            spike_warn = rt.get("spike_warning_threshold", 0.70)
+            spike_mute = rt.get("spike_mute_threshold", 0.85)
+        else:
+            warning_threshold = sentiment_config.get("warning_threshold", 0.6)
+            base_mute_threshold = sentiment_config.get("mute_threshold", 0.75)
+            spike_warn = sentiment_config.get("spike_warning_threshold", 0.5)
+            spike_mute = sentiment_config.get("spike_mute_threshold", 0.8)
+
+        for finding in result.get("user_findings", []):
+            username = finding["username"]
+            score = finding["toxicity_score"]
+            categories = finding["categories"]
+            reasoning = finding["reasoning"]
+            worst_msg = finding.get("worst_message")
+            off_topic = finding.get("off_topic", False)
+            note_update = finding.get("note_update")
+
+            lookup = user_lookup.get(username)
+            if not lookup:
+                logger.warning("Mention scan: LLM returned unknown user '%s', skipping.", username)
+                continue
+
+            user_id, ref_msg, user_msgs = lookup
+
+            # Skip if all their messages were already analyzed
+            if all(m.id in self._analyzed_message_ids for m in user_msgs):
+                continue
+
+            # Mark their messages as analyzed
+            for m in user_msgs:
+                self._mark_analyzed(m.id)
+
+            self.bot.drama_tracker.add_entry(user_id, score, categories, reasoning)
+            drama_score = self.bot.drama_tracker.get_drama_score(user_id)
+
+            # Save to DB
+            content_summary = f"[Mention scan] {worst_msg}" if worst_msg else "[Mention scan] See conversation"
+            db_message_id = await self.bot.db.save_message_and_analysis(
+                guild_id=ref_msg.guild.id,
+                channel_id=ref_msg.channel.id,
+                user_id=user_id,
+                username=username,
+                content=content_summary,
+                message_ts=ref_msg.created_at.replace(tzinfo=timezone.utc),
+                toxicity_score=score,
+                drama_score=drama_score,
+                categories=categories,
+                reasoning=reasoning,
+                off_topic=off_topic,
+                topic_category="personal_drama" if off_topic else "gaming",
+                topic_reasoning=reasoning,
+                coherence_score=None,
+                coherence_flag=None,
+            )
+
+            # Log to #bcs-log
+            await self._log_analysis(
+                ref_msg, score, drama_score, categories, reasoning,
+                off_topic, "personal_drama" if off_topic else "gaming",
+            )
+
+            # Collect notable findings for summary
+            if score >= 0.3:
+                cat_str = ", ".join(c for c in categories if c != "none") or "none"
+                findings.append(f"{username}: {score:.2f} ({cat_str})")
+
+            # Update user notes
+            if note_update:
+                self.bot.drama_tracker.update_user_notes(user_id, note_update)
+                self._dirty_users.add(user_id)
+
+            # Moderation actions
+            if not dry_run:
+                mute_threshold = self.bot.drama_tracker.get_mute_threshold(
+                    user_id, base_mute_threshold
+                )
+                if drama_score >= mute_threshold or score >= spike_mute:
+                    effective_score = max(drama_score, score)
+                    await self._mute_user(ref_msg, effective_score, categories, db_message_id)
+                elif drama_score >= warning_threshold or score >= spike_warn:
+                    effective_score = max(drama_score, score)
+                    await self._warn_user(ref_msg, effective_score, db_message_id)
+
+        # Build summary for ChatCog
+        convo_summary = result.get("conversation_summary", "")
+        if findings:
+            summary = f"Scanned {len(raw_messages)} msgs. {convo_summary} Notable: " + "; ".join(findings[:5])
+        else:
+            summary = f"Scanned {len(raw_messages)} msgs. {convo_summary}"
+
+        # Prune old scan results
+        if len(self._mention_scan_results) > 20:
+            oldest = sorted(self._mention_scan_results.keys())[:len(self._mention_scan_results) - 10]
+            for k in oldest:
+                del self._mention_scan_results[k]
+
+        self._mention_scan_results[trigger_message.id] = summary
+
+        logger.info(
+            "Mention scan complete in #%s: 1 LLM call, %d messages, %d users flagged",
+            getattr(channel, "name", "unknown"),
+            len(raw_messages),
+            len(findings),
+        )

    async def _mute_user(
        self,
@@ -684,59 +1010,6 @@ class SentimentCog(commands.Cog):
            details=f"from=#{channel_name} to=#{detected_game} game={game_name}",
        ))

-    def _store_context(self, message: discord.Message):
-        ch_id = message.channel.id
-        if ch_id not in self._channel_history:
-            max_ctx = self.bot.config.get("sentiment", {}).get(
-                "context_messages", 8
-            )
-            self._channel_history[ch_id] = deque(maxlen=max_ctx)
-        self._channel_history[ch_id].append(
-            (message.author.display_name, message.content, datetime.now(timezone.utc))
-        )
-
-    def _get_context(self, message: discord.Message) -> str:
-        """Build a timestamped chat log from recent channel messages.
-
-        Excludes messages currently buffered for this user+channel
-        (those appear in the TARGET MESSAGE section instead).
-        """
-        ch_id = message.channel.id
-        history = self._channel_history.get(ch_id, deque())
-        if not history:
-            return "(no prior context)"
-
-        now = datetime.now(timezone.utc)
-
-        # Collect IDs of messages in the current debounce batch so we can skip them
-        batch_key = (ch_id, message.author.id)
-        batch_msgs = self._message_buffer.get(batch_key, [])
-        # Build a set of (author, content) from the batch for fast lookup
-        batch_set = {(m.author.display_name, m.content) for m in batch_msgs}
-
-        lines = []
-        for name, content, ts in history:
-            if (name, content) in batch_set:
-                continue
-            delta = now - ts
-            rel = self._format_relative_time(delta)
-            lines.append(f"[{rel}] {name}: {content}")
-
-        if not lines:
-            return "(no prior context)"
-        return "\n".join(lines)
-
-    @staticmethod
-    def _format_relative_time(delta: timedelta) -> str:
-        total_seconds = int(delta.total_seconds())
-        if total_seconds < 60:
-            return f"~{total_seconds}s ago"
-        minutes = total_seconds // 60
-        if minutes < 60:
-            return f"~{minutes}m ago"
-        hours = minutes // 60
-        return f"~{hours}h ago"
-
    async def _log_analysis(
        self, message: discord.Message, score: float, drama_score: float,
        categories: list[str], reasoning: str, off_topic: bool, topic_category: str,