Merge branch 'main' into track-token-usage

ls1intum · bassner · Oct 23, 2024 · Oct 1, 2024 · Oct 11, 2024 · Oct 11, 2024
commit c79837d2ff64c9cb6cb0fdfd20652f5a507db5ea
diff --git a/app/llm/external/openai_chat.py b/app/llm/external/openai_chat.py
@@ -127,10 +127,20 @@ def chat(
                         temperature=arguments.temperature,
                         max_tokens=arguments.max_tokens,
                     )
-                return convert_to_iris_message(
-                    response.choices[0].message, response.usage, response.model
-                )
-            except Exception as e:
+                choice = response.choices[0]
+                if choice.finish_reason == "content_filter":
+                    # I expected an OpenAI error to be raised automatically when the content filter activates,
+                    # but that does not appear to be the case.
+                    # We don't want to retry because the same message will likely be rejected again.
+                    # Raise an exception to trigger the global error handler and report a fatal error to the client.
+                    raise ContentFilterFinishReasonError()
+                return convert_to_iris_message(choice.message)
+            except (
+                APIError,
+                APITimeoutError,
+                RateLimitError,
+                InternalServerError,
+            ):
                 wait_time = initial_delay * (backoff_factor**attempt)
                 logging.exception(f"OpenAI error on attempt {attempt + 1}:")
                 logging.info(f"Retrying in {wait_time} seconds...")

diff --git a/app/web/status/status_update.py b/app/web/status/status_update.py
@@ -6,7 +6,7 @@
 from abc import ABC
 
 from app.common.token_usage_dto import TokenUsageDTO
-from ...domain.status.competency_extraction_status_update_dto import (
+from app.domain.status.competency_extraction_status_update_dto import (
     CompetencyExtractionStatusUpdateDTO,
 )
 from app.domain.chat.course_chat.course_chat_status_update_dto import (