Merge pull request #6706 from akatsoulas/create-spam-flag-llm

akatsoulas · web-flow · commit 899e78d29b62 · 2025-06-10T16:06:32.000+02:00
Create a spam flag on automatic spam classification
diff --git a/kitsune/llm/tasks.py b/kitsune/llm/tasks.py
@@ -1,6 +1,7 @@
 import waffle
 from celery import shared_task
 
+from kitsune.flagit.models import FlaggedObject
 from kitsune.llm.questions.classifiers import classify_question
 from kitsune.users.models import Profile
 
@@ -25,6 +26,8 @@ def question_classifier(question_id):
     elif waffle.switch_is_active("flagit-spam-autoflag"):
         flag_question(
             question,
+            reason=FlaggedObject.REASON_CONTENT_MODERATION,
+            status=FlaggedObject.FLAG_PENDING,
             by_user=Profile.get_sumo_bot(),
             notes=(
                 "Automatically flagged for topic moderation:"
diff --git a/kitsune/questions/utils.py b/kitsune/questions/utils.py
@@ -150,8 +150,8 @@ def flag_question(
     question: Question,
     by_user: User,
     notes: str,
-    status: int = FlaggedObject.FLAG_PENDING,
-    reason: str = FlaggedObject.REASON_CONTENT_MODERATION,
+    status: int = FlaggedObject.FLAG_ACCEPTED,
+    reason: str = FlaggedObject.REASON_SPAM,
 ) -> None:
     content_type = ContentType.objects.get_for_model(question)
     flagged_object, created = FlaggedObject.objects.get_or_create(
@@ -214,17 +214,6 @@ def update_question_fields_from_classification(question, result, sumo_bot):
         question.tags.clear()
         question.auto_tag()
 
-        if topic := update_fields.get("topic"):
-            flag_question(
-                question,
-                by_user=sumo_bot,
-                notes=(
-                    f"LLM classified as {topic.title}, for the following reason:\n"
-                    f"{topic_result.get('reason', '')}"
-                ),
-                status=FlaggedObject.FLAG_ACCEPTED,
-            )
-
 
 def process_classification_result(
     question: Question,
@@ -236,19 +225,44 @@ def process_classification_result(
     """
     sumo_bot = Profile.get_sumo_bot()
     action = result.get("action")
+    flag_kwargs = {
+        "by_user": sumo_bot,
+        "notes": "",
+        "question": question,
+    }
 
     match action:
         case ModerationAction.SPAM:
+            flag_kwargs.update(
+                {
+                    "notes": (
+                        f"LLM classified as spam, for the following reason:\n"
+                        f"{result.get('spam_result', {}).get('reason', '')}"
+                    ),
+                }
+            )
             question.mark_as_spam(sumo_bot)
         case ModerationAction.FLAG_REVIEW:
-            flag_question(
-                question,
-                by_user=sumo_bot,
-                notes=(
-                    "LLM flagged for manual review, for the following reason:\n"
-                    f"{result.get('spam_result', {}).get('reason', '')}"
-                ),
-                reason=FlaggedObject.REASON_SPAM,
+            flag_kwargs.update(
+                {
+                    "status": FlaggedObject.FLAG_PENDING,
+                    "notes": (
+                        f"LLM flagged for manual review, for the following reason:\n"
+                        f"{result.get('spam_result', {}).get('reason', '')}"
+                    ),
+                }
             )
         case _:
+            flag_kwargs.update(
+                {
+                    "reason": FlaggedObject.REASON_CONTENT_MODERATION,
+                    "notes": (
+                        f"LLM classified as {result.get('topic_result', {}).get('topic', '')}, "
+                        f"for the following reason:\n"
+                        f"{result.get('topic_result', {}).get('reason', '')}"
+                    ),
+                }
+            )
             update_question_fields_from_classification(question, result, sumo_bot)
+
+    flag_question(**flag_kwargs)