diff --git a/bot.py b/bot.py
index 6e1b1be..fc79ade 100644
--- a/bot.py
+++ b/bot.py
@@ -97,6 +97,21 @@ class BCSBot(commands.Bot):
         await self.tree.sync()
         logger.info("Slash commands synced.")
 
+        # Warm up the LLM so the model is loaded into VRAM before messages
+        # arrive. Best-effort: a failure is only logged as a warning.
+        logger.info("Warming up LLM model...")
+        try:
+            # Only the side effect of the request matters, so the response
+            # is discarded; max_tokens=1 keeps the generated output minimal.
+            await self.llm._client.chat.completions.create(
+                model=self.llm.model,
+                messages=[{"role": "user", "content": "hi"}],
+                max_tokens=1,
+            )
+            logger.info("LLM warm-up complete.")
+        except Exception as e:
+            logger.warning("LLM warm-up failed — first messages may be slow: %s", e)
+
     async def on_message(self, message: discord.Message):
         logger.info(
             "EVENT on_message from %s in #%s: %s",