Add LLM backend support and improve debugging observability

- Add LLM_BACKEND to environment configuration
- Implement detailed debug logging for LLM request/response cycles
- Add missing llama-index dependencies for embeddings and chroma
- Update prompt constraints to prevent lore redundancy
- Enable CUDA for transcription and set logging to DEBUG level
- Add entry point for running the orchestrator directly
- Clean up unused comment in TUI context updates
2026-05-28 23:06:25 -07:00
parent 49127d695a
commit 15dfbfb467
6 changed files with 34 additions and 5 deletions
@@ -45,6 +45,7 @@ class LLMProcessor:
            final_base_url = base_url or os.environ.get("OPENAI_BASE_URL")
            final_api_key = api_key or os.environ.get("OPENAI_API_KEY")

+        logger.info(f"Using LLM backend: {backend}")
        try:
            self.client = OpenAI(
                api_key=final_api_key,
@@ -96,6 +97,14 @@ class LLMProcessor:

        messages.append({"role": "user", "content": user_prompt})

+        # Debugging: Dump inputs
+        logger.debug("--- LLM CALL START ---")
+        logger.debug(f"Model: {self.model}")
+        logger.debug(f"Messages: {messages}")
+        if response_format:
+            logger.debug(f"Response Format: {response_format}")
+        logger.debug("--- LLM CALL END ---")
+
        try:
            response = self.client.chat.completions.create(
                model=self.model,
@@ -105,6 +114,11 @@ class LLMProcessor:
            )
            content = response.choices[0].message.content

+            # Debugging: Dump outputs
+            logger.debug("--- LLM RESPONSE START ---")
+            logger.debug(f"Content: {content}")
+            logger.debug("--- LLM RESPONSE END ---")
+
            return self._strip_markdown_code_blocks(content)
        except Exception as e:
            logger.error(f"LLM Error: {e}")