src/sentry/tasks/post_process.py

from __future__ import annotations

import logging
import uuid
from collections.abc import MutableMapping, Sequence
from datetime import datetime, timedelta
from time import time
from typing import TYPE_CHECKING, Any, TypedDict

import sentry_sdk
from django.conf import settings
from django.db.models.signals import post_save
from django.utils import timezone
from google.api_core.exceptions import ServiceUnavailable

from sentry import features, projectoptions
from sentry.exceptions import PluginError
from sentry.issues.grouptype import GroupCategory
from sentry.issues.issue_occurrence import IssueOccurrence
from sentry.killswitches import killswitch_matches_context
from sentry.replays.lib.event_linking import transform_event_for_linking_payload
from sentry.replays.lib.kafka import initialize_replays_publisher
from sentry.sentry_metrics.client import generic_metrics_backend
from sentry.sentry_metrics.use_case_id_registry import UseCaseID
from sentry.signals import event_processed, issue_unignored, transaction_processed
from sentry.silo.base import SiloMode
from sentry.tasks.base import instrumented_task
from sentry.types.group import GroupSubStatus
from sentry.utils import json, metrics
from sentry.utils.cache import cache
from sentry.utils.event_frames import get_sdk_name
from sentry.utils.locking import UnableToAcquireLock
from sentry.utils.locking.backends import LockBackend
from sentry.utils.locking.manager import LockManager
from sentry.utils.retries import ConditionalRetryPolicy, exponential_delay
from sentry.utils.safe import get_path, safe_execute
from sentry.utils.sdk import bind_organization_context, set_current_event_project
from sentry.utils.sdk_crashes.sdk_crash_detection_config import build_sdk_crash_detection_configs
from sentry.utils.services import build_instance_from_options_of_type

if TYPE_CHECKING:
    from sentry.eventstore.models import Event, GroupEvent
    from sentry.eventstream.base import GroupState
    from sentry.models.group import Group
    from sentry.models.project import Project
    from sentry.models.team import Team
    from sentry.ownership.grammar import Rule
    from sentry.services.hybrid_cloud.user import RpcUser

# Module-level logger, named after this module.
logger = logging.getLogger(__name__)

# Lock manager shared by this module, built from the backend configured in
# settings.SENTRY_POST_PROCESS_LOCKS_BACKEND_OPTIONS. In this file it is used for the
# "groupowner-bulk:<group id>" lock in `handle_group_owners` and the
# "ppg:<occurrence id>-once" lock in `post_process_group`.
locks = LockManager(
    build_instance_from_options_of_type(
        LockBackend, settings.SENTRY_POST_PROCESS_LOCKS_BACKEND_OPTIONS
    )
)

# Thresholds used by `should_issue_owners_ratelimit`: once more than this many distinct
# groups of a project have been recorded in the current cache window, the function reports
# that the project is rate limited. The higher value applies when the
# "organizations:increased-issue-owners-rate-limit" feature is enabled for the organization.
ISSUE_OWNERS_PER_PROJECT_PER_MIN_RATELIMIT = 50
HIGHER_ISSUE_OWNERS_PER_PROJECT_PER_MIN_RATELIMIT = 200


class PostProcessJob(TypedDict, total=False):
    """
    Dictionary passed to every pipeline step run by `run_post_process_job`.

    Declared with ``total=False``, so the type itself does not require any key to be
    present; `post_process_group` populates all of them when it builds the job.
    """

    # The event being post-processed, bound to its group.
    event: GroupEvent
    # Group id plus the is_new / is_regression / is_new_group_environment flags.
    group_state: GroupState
    # Result of `is_reprocessed_event(event.data)`.
    is_reprocessed: bool
    # Initialised by `post_process_group` to `not group_state["is_new"]`.
    has_reappeared: bool
    # Initialised to False by `post_process_group`.
    # NOTE(review): presumably updated by later pipeline steps -- not visible in this chunk.
    has_alert: bool
    # Initialised to False by `post_process_group`.
    # NOTE(review): presumably updated by later pipeline steps -- not visible in this chunk.
    has_escalated: bool


def _get_service_hooks(project_id):
    """
    Return ``(hook_id, events)`` pairs for the service hooks attached to a project.

    The list is cached under a per-project key for 60 seconds; the database is only
    queried when the cache has no entry.
    """
    from sentry.models.servicehook import ServiceHook

    cache_key = f"servicehooks:1:{project_id}"
    cached = cache.get(cache_key)
    if cached is not None:
        return cached

    project_hooks = ServiceHook.objects.filter(servicehookproject__project_id=project_id)
    hook_pairs = [(hook.id, hook.events) for hook in project_hooks]
    cache.set(cache_key, hook_pairs, 60)
    return hook_pairs


def _should_send_error_created_hooks(project):
    """
    Return whether ``error.created`` service hooks should be sent for ``project``.

    The answer is ``True`` only when the organization has the
    ``organizations:integrations-event-hooks`` feature and at least one of its service
    hooks subscribes to ``error.created``. The result is cached per project for 60
    seconds as ``0``/``1``.

    :param project: object exposing ``id`` and ``organization_id``.
    :return: always a ``bool``, whether the answer came from the cache or was computed.
    """
    from sentry.models.organization import Organization
    from sentry.models.servicehook import ServiceHook

    cache_key = f"servicehooks-error-created:1:{project.id}"
    cached = cache.get(cache_key)
    if cached is not None:
        # The cache holds 0/1; normalise so a cache hit returns the same type (bool)
        # as a freshly computed answer instead of leaking the raw int.
        return bool(cached)

    org = Organization.objects.get_from_cache(id=project.organization_id)
    if not features.has("organizations:integrations-event-hooks", organization=org):
        cache.set(cache_key, 0, 60)
        return False

    has_error_created_hook = (
        ServiceHook.objects.filter(organization_id=org.id)
        .extra(where=["events @> '{error.created}'"])
        .exists()
    )
    cache.set(cache_key, 1 if has_error_created_hook else 0, 60)
    return has_error_created_hook


def should_write_event_stats(event: Event | GroupEvent):
    """
    Tell whether event/group stats should be recorded for ``event``.

    Stats are limited to error events for now: writing them for other event types would
    skew existing stats and could cause alerts to fire. Other types may be added later
    under different keys or with differentiating tags.

    The result is truthy only when the event has a group, the group's issue category is
    ``GroupCategory.ERROR`` and the group has a platform. When the event has no group the
    falsy group value itself is returned.
    """
    group = event.group
    if not group:
        return group
    return group.issue_category == GroupCategory.ERROR and group.platform is not None


def format_event_platform(event: Event | GroupEvent):
    """
    Return the leading component of the event group's platform name.

    Everything from the first ``-`` onwards is dropped, then everything from the first
    ``_`` onwards. Returns ``None`` (after logging an error) when the event has no group
    or the group has no platform.
    """
    group = event.group
    if not group:
        logger.error(
            "Group not found on event during formatting", extra={"event_id": event.event_id}
        )
        return

    raw_platform = group.platform
    if not raw_platform:
        logger.error(
            "Platform not found on group during formatting",
            extra={"event_id": event.event_id, "group_id": group.id},
        )
        return

    before_dash = raw_platform.partition("-")[0]
    return before_dash.partition("_")[0]


def _capture_event_stats(event: Event) -> None:
    """
    Emit the per-event processing metrics, tagged with the formatted platform.

    Nothing is emitted unless `should_write_event_stats` accepts the event.
    """
    if should_write_event_stats(event):
        platform = format_event_platform(event)
        metrics.incr("events.processed", tags={"platform": platform}, skip_internal=False)
        metrics.incr(f"events.processed.{platform}", skip_internal=False)
        metrics.distribution(
            "events.size.data", event.size, tags={"platform": platform}, unit="byte"
        )


def _update_escalating_metrics(event: Event) -> None:
    """
    Count one ingested event for the escalating-issues use case.

    The counter is recorded against the event's organization and project and tagged with
    the event's group id.
    """
    project = event.project
    group_tag = {"group": str(event.group_id)}
    generic_metrics_backend.counter(
        UseCaseID.ESCALATING_ISSUES,
        org_id=project.organization_id,
        project_id=project.id,
        metric_name="event_ingested",
        value=1,
        tags=group_tag,
        unit=None,
    )


def _capture_group_stats(job: PostProcessJob) -> None:
    """
    Increment the ``events.unique`` metric for events that created a new group.

    Only runs when the job's group state is marked new and `should_write_event_stats`
    accepts the event.
    """
    event = job["event"]
    is_new_group = job["group_state"]["is_new"]
    if not (is_new_group and should_write_event_stats(event)):
        return

    if not event.group:
        logger.error(
            "Group not found on event while capturing group stats",
            extra={"event_id": event.event_id},
        )
        return

    metrics.incr(
        "events.unique",
        tags={"platform": format_event_platform(event)},
        skip_internal=False,
    )


def should_issue_owners_ratelimit(project_id: int, group_id: int, organization_id: int | None):
    """
    Record ``group_id`` in the project's current window and report whether the project
    has exceeded its limit of distinct groups for that window.

    The window is a cache entry holding ``(groups, window_start)``. It is created with a
    60 second timeout; later writes reuse the original start time and only keep the entry
    for whatever remains of those 60 seconds.

    :return: ``True`` when the number of distinct groups seen is above the enforced limit.
    """
    from sentry.models.organization import Organization

    organization = Organization.objects.get_from_cache(id=organization_id)
    if features.has("organizations:increased-issue-owners-rate-limit", organization=organization):
        enforced_limit = HIGHER_ISSUE_OWNERS_PER_PROJECT_PER_MIN_RATELIMIT
    else:
        enforced_limit = ISSUE_OWNERS_PER_PROJECT_PER_MIN_RATELIMIT

    cache_key = f"issue_owner_assignment_ratelimiter:{project_id}"
    window = cache.get(cache_key)

    if window is None:
        # First group in a fresh window.
        groups = {group_id}
        window_start = datetime.now()
        timeout = 60
    else:
        groups = set(window[0])
        groups.add(group_id)
        window_start = window[1]
        elapsed = (datetime.now() - window_start).total_seconds()
        timeout = max(60 - elapsed, 0)

    cache.set(cache_key, (groups, window_start), timeout)
    return len(groups) > enforced_limit


def handle_owner_assignment(job):
    """
    Compute issue owners for the job's event and store them as group owners.

    The function returns early without computing owners when any of the following holds:

    - the job is flagged as reprocessed,
    - `should_issue_owners_ratelimit` reports the project as rate limited,
    - the group already has an assignee (the lookup result is cached),
    - the issue-owners debounce cache key for the group is set.

    Otherwise owners come from `ProjectOwnership.get_issue_owners`, after which the
    debounce key is set. A non-empty result is passed to `handle_group_owners`; an empty
    one to `handle_invalid_group_owners`.

    Every exception raised inside is logged and swallowed, so this step never raises.

    :param job: post-process job; reads ``job["is_reprocessed"]`` and ``job["event"]``.
    """
    if job["is_reprocessed"]:
        return

    with sentry_sdk.start_span(op="tasks.post_process_group.handle_owner_assignment"):
        try:
            from sentry.models.groupowner import (
                ASSIGNEE_DOES_NOT_EXIST_DURATION,
                ASSIGNEE_EXISTS_DURATION,
                ASSIGNEE_EXISTS_KEY,
                ISSUE_OWNERS_DEBOUNCE_DURATION,
                ISSUE_OWNERS_DEBOUNCE_KEY,
            )
            from sentry.models.projectownership import ProjectOwnership

            event = job["event"]
            project, group = event.project, event.group
            # We want to debounce owner assignment when:
            # - GroupOwner of type Ownership Rule || CodeOwner exist with TTL 1 day
            # - we tried to calculate and could not find issue owners with TTL 1 day
            # - an Assignee has been set with TTL of infinite
            with metrics.timer("post_process.handle_owner_assignment"):
                with sentry_sdk.start_span(op="post_process.handle_owner_assignment.ratelimited"):
                    # Note: this call also records the group in the project's rate-limit window.
                    if should_issue_owners_ratelimit(
                        project_id=project.id,
                        group_id=group.id,
                        organization_id=event.project.organization_id,
                    ):
                        metrics.incr("sentry.task.post_process.handle_owner_assignment.ratelimited")
                        return

                with sentry_sdk.start_span(
                    op="post_process.handle_owner_assignment.cache_set_assignee"
                ):
                    # Is the issue already assigned to a team or user?
                    assignee_key = ASSIGNEE_EXISTS_KEY(group.id)
                    assignees_exists = cache.get(assignee_key)
                    if assignees_exists is None:
                        assignees_exists = group.assignee_set.exists()
                        # Cache for 1 day if it's assigned. We don't need to move that fast.
                        cache.set(
                            assignee_key,
                            assignees_exists,
                            (
                                ASSIGNEE_EXISTS_DURATION
                                if assignees_exists
                                else ASSIGNEE_DOES_NOT_EXIST_DURATION
                            ),
                        )

                    if assignees_exists:
                        metrics.incr(
                            "sentry.task.post_process.handle_owner_assignment.assignee_exists"
                        )
                        return

                with sentry_sdk.start_span(
                    op="post_process.handle_owner_assignment.debounce_issue_owners"
                ):
                    issue_owners_key = ISSUE_OWNERS_DEBOUNCE_KEY(group.id)
                    debounce_issue_owners = cache.get(issue_owners_key)

                    if debounce_issue_owners:
                        metrics.incr("sentry.tasks.post_process.handle_owner_assignment.debounce")
                        return

                with metrics.timer("post_process.process_owner_assignments.duration"):
                    with sentry_sdk.start_span(
                        op="post_process.handle_owner_assignment.get_issue_owners"
                    ):
                        # When the killswitch matches, the owner lookup is skipped and the
                        # debounce key is not set.
                        # NOTE(review): issue_owners is then empty, so the `else` branch
                        # further down calls handle_invalid_group_owners, which deletes the
                        # group's existing rule/codeowners owners -- confirm this is intended.
                        if killswitch_matches_context(
                            "post_process.get-autoassign-owners",
                            {
                                "project_id": project.id,
                            },
                        ):
                            # see ProjectOwnership.get_issue_owners
                            issue_owners: Sequence[tuple[Rule, Sequence[Team | RpcUser], str]] = []
                        else:
                            issue_owners = ProjectOwnership.get_issue_owners(project.id, event.data)

                            # Cache for 1 day after we calculated. We don't need to move that fast.
                            cache.set(
                                issue_owners_key,
                                True,
                                ISSUE_OWNERS_DEBOUNCE_DURATION,
                            )

                    with sentry_sdk.start_span(
                        op="post_process.handle_owner_assignment.handle_group_owners"
                    ):
                        if issue_owners:
                            # Storage failures are logged here and do not propagate.
                            try:
                                handle_group_owners(project, group, issue_owners)
                            except Exception:
                                logger.exception("Failed to store group owners")
                        else:
                            handle_invalid_group_owners(group)

        except Exception:
            logger.exception("Failed to handle owner assignments")


def handle_invalid_group_owners(group):
    """
    Delete every ownership-rule and codeowners ``GroupOwner`` row of ``group``.

    Called when no issue owners were found for the group, so previously stored
    rule-based owners are no longer valid. One log line is emitted per deleted row.

    :param group: the group whose rule-based owners are removed; ``id`` and
        ``project_id`` are read for logging.
    """
    from sentry.models.groupowner import GroupOwner, GroupOwnerType

    invalid_group_owners = GroupOwner.objects.filter(
        group=group,
        type__in=[GroupOwnerType.OWNERSHIP_RULE.value, GroupOwnerType.CODEOWNERS.value],
    )
    for owner in invalid_group_owners:
        # Read the id before deleting: Django clears the instance's primary key on
        # delete(), so reading owner.id afterwards would log None.
        group_owner_id = owner.id
        owner.delete()
        logger.info(
            "handle_invalid_group_owners.delete_group_owner",
            extra={
                "group": group.id,
                "group_owner_id": group_owner_id,
                "project": group.project_id,
            },
        )


def handle_group_owners(
    project: Project,
    group: Group,
    issue_owners: Sequence[tuple[Rule, Sequence[Team | RpcUser], str]],
):
    """
    Stores group owners generated by `ProjectOwnership.get_issue_owners` in the
    `GroupOwner` model, and handles any diffing/changes of which owners we're keeping.

    The work runs while holding the ``groupowner-bulk:<group id>`` lock. If the lock
    cannot be acquired the function logs ``handle_group_owners.lock_failed`` and does
    nothing else.

    :param project: project the group belongs to; set on newly created owners.
    :param group: group whose ownership-rule / codeowners owners are reconciled.
    :param issue_owners: ``(rule, owners, source)`` tuples to store.
    :return: None
    """
    from sentry.models.groupowner import GroupOwner, GroupOwnerType, OwnerRuleType
    from sentry.models.team import Team
    from sentry.models.user import User
    from sentry.services.hybrid_cloud.user import RpcUser

    lock = locks.get(f"groupowner-bulk:{group.id}", duration=10, name="groupowner_bulk")
    logging_params = {
        "group": group.id,
        "project": project.id,
        "organization": project.organization_id,
        "issue_owners_length": len(issue_owners) if issue_owners else 0,
    }
    try:
        logger.info("handle_group_owners.start", extra=logging_params)
        with (
            sentry_sdk.start_span(op="post_process.handle_group_owners"),
            lock.acquire(),
        ):
            current_group_owners = GroupOwner.objects.filter(
                group=group,
                type__in=[GroupOwnerType.OWNERSHIP_RULE.value, GroupOwnerType.CODEOWNERS.value],
            )
            # Maps (owner class, owner id, source) -> list of rules that produced that owner.
            new_owners: dict = {}
            for rule, owners, source in issue_owners:
                for owner in owners:
                    # Can potentially have multiple rules pointing to the same owner
                    if new_owners.get((type(owner), owner.id, source)):
                        new_owners[(type(owner), owner.id, source)].append(rule)
                    else:
                        new_owners[(type(owner), owner.id, source)] = [rule]

            # Owners already in the database that we'll keep
            keeping_owners = set()
            for group_owner in current_group_owners:
                local_logging_params = logging_params.copy()
                # Captured before any delete() call below.
                local_logging_params["group_owner_id"] = group_owner.id
                owner_rule_type = (
                    OwnerRuleType.CODEOWNERS.value
                    if group_owner.type == GroupOwnerType.CODEOWNERS.value
                    else OwnerRuleType.OWNERSHIP_RULE.value
                )
                # NOTE(review): `new_owners` is keyed by `type(owner)`. The signature says
                # user owners are `RpcUser`, and the creation loop below tests
                # `owner_type is RpcUser`; if so, a `(User, ...)` key can never be found in
                # `new_owners` -- confirm whether this should be `RpcUser`.
                lookup_key = (
                    (Team, group_owner.team_id, owner_rule_type)
                    if group_owner.team_id is not None
                    else (User, group_owner.user_id, owner_rule_type)
                )
                # Old groupowner assignments get deleted
                lookup_key_value = None
                if lookup_key not in new_owners:
                    group_owner.delete()
                    logger.info(
                        "handle_group_owners.delete_group_owner",
                        extra={**local_logging_params, "reason": "assignment_deleted"},
                    )
                else:
                    lookup_key_value = new_owners.get(lookup_key)
                # Old groupowner assignment from outdated rules get deleted
                # NOTE(review): new rows below store `context["rule"]` as `str(rule)`, while
                # `lookup_key_value` holds the rule objects taken from `issue_owners` --
                # confirm this membership test compares like with like.
                if (
                    lookup_key_value
                    and (group_owner.context or {}).get("rule") not in lookup_key_value
                ):
                    group_owner.delete()
                    logger.info(
                        "handle_group_owners.delete_group_owner",
                        extra={**local_logging_params, "reason": "outdated_rule"},
                    )
                else:
                    # This branch also runs for owners deleted as "assignment_deleted" above;
                    # their key is absent from `new_owners`, so adding it here does not
                    # affect the creation loop below.
                    keeping_owners.add(lookup_key)

            new_group_owners = []

            # Build one GroupOwner per (owner, rule) for every key that is not being kept.
            for key in new_owners.keys():
                if key not in keeping_owners:
                    owner_type, owner_id, owner_source = key
                    rules = new_owners[key]
                    group_owner_type = (
                        GroupOwnerType.OWNERSHIP_RULE.value
                        if owner_source == OwnerRuleType.OWNERSHIP_RULE.value
                        else GroupOwnerType.CODEOWNERS.value
                    )
                    user_id = None
                    team_id = None
                    if owner_type is RpcUser:
                        user_id = owner_id
                    if owner_type is Team:
                        team_id = owner_id
                    for rule in rules:
                        new_group_owners.append(
                            GroupOwner(
                                group=group,
                                type=group_owner_type,
                                user_id=user_id,
                                team_id=team_id,
                                project=project,
                                organization=project.organization,
                                context={"rule": str(rule)},
                            )
                        )
            if new_group_owners:
                GroupOwner.objects.bulk_create(new_group_owners)
                # post_save is sent explicitly for each row created by bulk_create.
                for go in new_group_owners:
                    post_save.send_robust(
                        sender=GroupOwner,
                        instance=go,
                        created=True,
                    )
                logging_params["count"] = len(new_group_owners)
                logger.info("group_owners.bulk_create", extra=logging_params)

    except UnableToAcquireLock:
        logger.info("handle_group_owners.lock_failed", extra=logging_params)
        pass


def update_existing_attachments(job):
    """
    Point every attachment of the job's event at the event's current group.

    This covers attachments that were either:

    1) ingested before the event through the standalone attachment endpoint, or
    2) tied to a different group before reprocessing started.
    """
    with sentry_sdk.start_span(op="tasks.post_process_group.update_existing_attachments"):
        from sentry.models.eventattachment import EventAttachment

        event = job["event"]

        # All attachments stored for this event, whatever group they currently reference.
        event_attachments = EventAttachment.objects.filter(
            project_id=event.project_id, event_id=event.event_id
        )
        event_attachments.update(group_id=event.group_id)


def fetch_buffered_group_stats(group):
    """
    Read the buffered ``times_seen`` value for ``group`` from the buffer backend and
    store it on the group as ``times_seen_pending``.
    """
    from sentry import buffer
    from sentry.models.group import Group

    buffered = buffer.backend.get(Group, ["times_seen"], {"id": group.id})
    pending_times_seen = buffered["times_seen"]
    group.times_seen_pending = pending_times_seen


# Highest attempt number for which `should_retry_fetch` still allows a retry.
MAX_FETCH_ATTEMPTS = 3


def should_retry_fetch(attempt: int, e: Exception) -> bool:
    """
    Decide whether a failed event fetch should be retried.

    A retry is allowed only while ``attempt`` has not gone past ``MAX_FETCH_ATTEMPTS``
    and the failure is a ``ServiceUnavailable`` or an ``EventLookupError``.
    """
    from sentry.issues.occurrence_consumer import EventLookupError

    if attempt > MAX_FETCH_ATTEMPTS:
        return False
    return isinstance(e, (ServiceUnavailable, EventLookupError))


# Retry policy built from the `should_retry_fetch` predicate and `exponential_delay(1.00)`;
# `post_process_group` uses it to fetch issue-platform events from the eventstore.
fetch_retry_policy = ConditionalRetryPolicy(should_retry_fetch, exponential_delay(1.00))


def should_update_escalating_metrics(event: Event, is_transaction_event: bool) -> bool:
    """
    Tell whether the escalating-issues counter should be updated for ``event``.

    Requires the ``organizations:escalating-metrics-backend`` feature on the event's
    organization, a non-transaction event, a group on the event, and an issue type that
    opts into escalation detection. Checks are evaluated in that order and stop at the
    first one that fails.
    """
    organization = event.project.organization
    return (
        features.has("organizations:escalating-metrics-backend", organization)
        and not is_transaction_event
        and (group := event.group) is not None
        and group.issue_type.should_detect_escalation()
    )


@instrumented_task(
    name="sentry.tasks.post_process.post_process_group",
    time_limit=120,
    soft_time_limit=110,
    silo_mode=SiloMode.REGION,
)
def post_process_group(
    is_new,
    is_regression,
    is_new_group_environment,
    cache_key,
    group_id=None,
    occurrence_id: str | None = None,
    *,
    project_id: int,
    **kwargs,
):
    """
    Fires post processing hooks for a group.

    The event is obtained in one of two ways:

    - ``occurrence_id is None``: the event payload is read from the event processing
      store under ``cache_key`` and the key is then deleted. If the payload is missing
      the task logs ``post_process.skipped`` and returns.
    - ``occurrence_id`` given: a ``ppg:<occurrence_id>-once`` lock is acquired (and never
      released) so the occurrence is processed at most once, the occurrence is fetched,
      and its event is loaded from the eventstore using ``fetch_retry_policy``.

    After that the project and organization are re-bound from cache, transaction events
    get their simplified processing, and -- when ``group_id`` is set -- the event is bound
    to its group and handed to `run_post_process_job`. Finally the
    ``events.time-to-post-process`` metric is recorded for non-reprocessed events that
    carry a ``received`` timestamp.

    :param is_new: copied into the group state's ``is_new`` flag.
    :param is_regression: copied into the group state's ``is_regression`` flag.
    :param is_new_group_environment: copied into the group state's
        ``is_new_group_environment`` flag.
    :param cache_key: key of the event payload in the event processing store; only read
        when ``occurrence_id`` is None.
    :param group_id: id of the group to post-process; when falsy no job is run.
    :param occurrence_id: id of the issue occurrence to process, if any.
    :param project_id: project the occurrence/event belongs to (keyword-only).
    :param kwargs: accepted but not read by this function.
    """
    from sentry.utils import snuba

    with snuba.options_override({"consistent": True}):
        from sentry import eventstore
        from sentry.eventstore.processing import event_processing_store
        from sentry.ingest.transaction_clusterer.datasource.redis import (
            record_span_descriptions as record_span_descriptions_for_clustering,
        )
        from sentry.ingest.transaction_clusterer.datasource.redis import (
            record_transaction_name as record_transaction_name_for_clustering,
        )
        from sentry.issues.occurrence_consumer import EventLookupError
        from sentry.models.organization import Organization
        from sentry.models.project import Project
        from sentry.reprocessing2 import is_reprocessed_event

        if occurrence_id is None:
            # We use the data being present/missing in the processing store
            # to ensure that we don't duplicate work should the forwarding consumers
            # need to rewind history.
            data = event_processing_store.get(cache_key)
            if not data:
                logger.info(
                    "post_process.skipped",
                    extra={"cache_key": cache_key, "reason": "missing_cache"},
                )
                return
            with metrics.timer("tasks.post_process.delete_event_cache"):
                event_processing_store.delete_by_key(cache_key)

            occurrence = None
            event = process_event(data, group_id)
        else:
            # Note: We attempt to acquire the lock here, but we don't release it and instead just
            # rely on the ttl. The goal here is to make sure we only ever run post process group
            # at most once per occurrence. Even though we don't use retries on the task, this is
            # still necessary since the consumer that sends these might reprocess a batch.
            # TODO: It might be better to instead set a value that we delete here, similar to what
            # we do with `event_processing_store`. If we could do this *before* the occurrence ends
            # up in Kafka (IE via the api that will sit in front of it), then we could guarantee at
            # most once running of post process group.
            lock = locks.get(
                f"ppg:{occurrence_id}-once",
                duration=600,
                name="post_process_w_o",
            )

            # NOTE(review): every exception raised by acquire() -- not only a failure to
            # take the lock -- is treated as "already processed" and ends the task silently.
            try:
                lock.acquire()
            except Exception:
                # If we fail to acquire the lock, we've already run post process group for this
                # occurrence
                return

            occurrence = (
                IssueOccurrence.fetch(occurrence_id, project_id=project_id) if project_id else None
            )
            if not occurrence:
                logger.error(
                    "Failed to fetch occurrence",
                    extra={"occurrence_id": occurrence_id, "project_id": project_id},
                )
                return
            # Issue platform events don't use `event_processing_store`. Fetch from eventstore
            # instead.

            # Raises EventLookupError when the event is missing so that the retry policy
            # (see `should_retry_fetch`) can retry the lookup.
            def get_event_raise_exception() -> Event:
                assert occurrence is not None
                retrieved = eventstore.backend.get_event_by_id(
                    project_id,
                    occurrence.event_id,
                    group_id=group_id,
                    skip_transaction_groupevent=True,
                    occurrence_id=occurrence_id,
                )
                if retrieved is None:
                    raise EventLookupError(
                        f"failed to retrieve event(project_id={project_id}, event_id={occurrence.event_id}, group_id={group_id}) from eventstore"
                    )
                return retrieved

            event = fetch_retry_policy(get_event_raise_exception)

        set_current_event_project(event.project_id)

        # Re-bind Project and Org since we're reading the Event object
        # from cache which may contain stale parent models.
        with sentry_sdk.start_span(op="tasks.post_process_group.project_get_from_cache"):
            try:
                event.project = Project.objects.get_from_cache(id=event.project_id)
            except Project.DoesNotExist:
                # project probably got deleted while this task was sitting in the queue
                return
            event.project.set_cached_field_value(
                "organization",
                Organization.objects.get_from_cache(id=event.project.organization_id),
            )

        is_reprocessed = is_reprocessed_event(event.data)
        sentry_sdk.set_tag("is_reprocessed", is_reprocessed)

        is_transaction_event = event.get_event_type() == "transaction"

        # Simplified post processing for transaction events.
        # This should eventually be completely removed and transactions
        # will not go through any post processing.
        if is_transaction_event:
            record_transaction_name_for_clustering(event.project, event.data)
            record_span_descriptions_for_clustering(event.project, event.data)
            with sentry_sdk.start_span(op="tasks.post_process_group.transaction_processed_signal"):
                transaction_processed.send_robust(
                    sender=post_process_group,
                    project=event.project,
                    event=event,
                )

        # Tags for the time-to-post-process metric; only filled in when a group is processed.
        metric_tags = {}
        if group_id:
            group_state: GroupState = {
                "id": group_id,
                "is_new": is_new,
                "is_regression": is_regression,
                "is_new_group_environment": is_new_group_environment,
            }

            # Binds the freshly loaded group to the event; may also rewrite group_state["id"].
            group_event = update_event_group(event, group_state)
            bind_organization_context(event.project.organization)
            _capture_event_stats(event)
            if should_update_escalating_metrics(event, is_transaction_event):
                _update_escalating_metrics(event)

            group_event.occurrence = occurrence

            run_post_process_job(
                {
                    "event": group_event,
                    "group_state": group_state,
                    "is_reprocessed": is_reprocessed,
                    "has_reappeared": bool(not group_state["is_new"]),
                    "has_alert": False,
                    "has_escalated": False,
                }
            )
            metric_tags["occurrence_type"] = group_event.group.issue_type.slug

        if not is_reprocessed and event.data.get("received"):
            # Seconds elapsed between the event's "received" timestamp and now.
            duration = time() - event.data["received"]
            metrics.timing(
                "events.time-to-post-process",
                duration,
                instance=event.data["platform"],
                tags=metric_tags,
            )

            # We see occasional metrics being recorded with very old data,
            # temporarily log some information about these groups to help
            # investigate.
            if duration and duration > 432_000:  # 5 days (5*24*60*60)
                logger.warning(
                    "tasks.post_process.old_time_to_post_process",
                    extra={
                        "group_id": group_id,
                        "project_id": project_id,
                        "duration": duration,
                        "received": event.data["received"],
                        "platform": event.data["platform"],
                        "reprocessing": json.dumps(
                            get_path(event.data, "contexts", "reprocessing")
                        ),
                        "original_issue_id": json.dumps(
                            get_path(event.data, "contexts", "reprocessing", "original_issue_id")
                        ),
                    },
                )


def run_post_process_job(job: PostProcessJob) -> None:
    """
    Run every step of the post-process pipeline that matches the event's issue category.

    Nothing runs when the group's issue type disallows post processing for the group's
    organization. Categories without a dedicated pipeline use the generic one. Each step
    is timed and traced; a failing step is counted and logged, and the remaining steps
    still run.
    """
    group_event = job["event"]
    group = group_event.group
    issue_category = group.issue_category if group else None
    issue_category_metric = issue_category.name.lower() if issue_category else None

    if group and not group.issue_type.allow_post_process_group(group.organization):
        return

    if issue_category in GROUP_CATEGORY_POST_PROCESS_PIPELINE:
        # specific pipelines for issue types
        pipeline = GROUP_CATEGORY_POST_PROCESS_PIPELINE[issue_category]
    else:
        # pipeline for generic issues
        pipeline = GENERIC_POST_PROCESS_PIPELINE

    for pipeline_step in pipeline:
        step_name = pipeline_step.__name__
        timer_tags = {
            "pipeline": step_name,
            "issue_category": issue_category_metric,
            "is_reprocessed": job["is_reprocessed"],
        }
        outcome_tags = {
            "issue_category": issue_category_metric,
            "pipeline": step_name,
        }
        try:
            with (
                metrics.timer(
                    "tasks.post_process.run_post_process_job.pipeline.duration",
                    tags=timer_tags,
                ),
                sentry_sdk.start_span(op=f"tasks.post_process_group.{step_name}"),
            ):
                pipeline_step(job)
        except Exception:
            metrics.incr(
                "sentry.tasks.post_process.post_process_group.exception",
                tags=outcome_tags,
            )
            logger.exception(
                "Failed to process pipeline step %s",
                step_name,
                extra={"event": group_event, "group": group_event.group},
            )
        else:
            metrics.incr(
                "sentry.tasks.post_process.post_process_group.completed",
                tags=outcome_tags,
            )


def process_event(data: MutableMapping[str, Any], group_id: int | None) -> Event:
    """
    Build an ``Event`` from a raw event payload.

    The project id and event id are taken from ``data["project"]`` and
    ``data["event_id"]``; ``group_id`` is passed through unchanged.
    """
    from sentry.eventstore.models import Event
    from sentry.models.event import EventDict

    project_id = data["project"]
    event_id = data["event_id"]
    event = Event(project_id=project_id, event_id=event_id, group_id=group_id, data=data)

    # Wrap the node data so it is not renormalized; renormalization is only wanted
    # when loading old data from the database.
    event.data = EventDict(event.data, skip_renormalization=True)  # type: ignore[assignment]  # python/mypy#3004
    return event


def update_event_group(event: Event, group_state: GroupState) -> GroupEvent:
    """
    Load the group named by ``group_state["id"]``, attach it to ``event`` and return the
    event as a ``GroupEvent`` for that group.

    ``group_state["id"]`` is overwritten with the id of the loaded group, which can differ
    from the requested id when a redirect was followed.
    """
    # NOTE: the full Event object has to be passed in rather than an event_id, because
    # sampling means the Event may never have been stored in the database.
    from sentry.models.group import get_group_with_redirect

    # The Event comes from cache and may carry a stale group and project, so the group
    # is loaded afresh here.
    group = get_group_with_redirect(group_state["id"])[0]
    # Updates to last_seen are buffered; it is at least the event's own datetime.
    group.last_seen = max(event.datetime, group.last_seen)

    # Populate buffered group aggregates on the Group. Processing of group ignores and
    # alert rules relies on these stats.
    with sentry_sdk.start_span(op="tasks.post_process_group.fetch_buffered_group_stats"):
        fetch_buffered_group_stats(group)

    group.project = event.project
    group.project.set_cached_field_value("organization", event.project.organization)
    group_state["id"] = group.id

    if event.group_id is not None:
        # deprecated event.group and event.group_id usage, kept here for backwards compatibility
        event.group = group

    event.groups = [group]
    return event.for_group(group)


def process_inbox_adds(job: PostProcessJob) -> None:
    """
    Add the event's group to the inbox with the reason matching the job state.

    * reprocessed and new: inbox reason ``REPROCESSED``
    * not reprocessed, not reappeared, new: the group row is moved to
      ``UNRESOLVED``/``NEW`` (unless its substatus is already ``NEW``) and, if
      a row was updated, added with reason ``NEW``
    * not reprocessed, not reappeared, regression: added with reason
      ``REGRESSION``

    Every other combination leaves the inbox untouched.
    """
    from sentry.models.group import Group, GroupStatus
    from sentry.types.group import GroupSubStatus

    with sentry_sdk.start_span(op="tasks.post_process_group.add_group_to_inbox"):
        event = job["event"]
        reprocessed = job["is_reprocessed"]
        group_state = job["group_state"]
        newly_created = group_state["is_new"]
        regressed = group_state["is_regression"]
        reappeared = job["has_reappeared"]

        from sentry.models.groupinbox import GroupInboxReason, add_group_to_inbox

        group = event.group
        if not group:
            logger.error(
                "Group not found on event while processing inbox adds",
                extra={"event_id": event.event_id},
            )
            return

        if reprocessed:
            if newly_created:
                # keep Group.status=UNRESOLVED and Group.substatus=ONGOING if its reprocessed
                add_group_to_inbox(group, GroupInboxReason.REPROCESSED)
            return

        if reappeared:
            # If true, we added the .ONGOING reason already
            return

        if newly_created:
            rows_changed = (
                Group.objects.filter(id=group.id)
                .exclude(substatus=GroupSubStatus.NEW)
                .update(status=GroupStatus.UNRESOLVED, substatus=GroupSubStatus.NEW)
            )
            if rows_changed:
                group.status = GroupStatus.UNRESOLVED
                group.substatus = GroupSubStatus.NEW
                add_group_to_inbox(group, GroupInboxReason.NEW)
        elif regressed:
            # no database update here: that should have been handled already
            # on event ingest
            group.status = GroupStatus.UNRESOLVED
            group.substatus = GroupSubStatus.REGRESSED
            add_group_to_inbox(group, GroupInboxReason.REGRESSION)


def process_snoozes(job: PostProcessJob) -> None:
    """
    Re-evaluate an ignored/snoozed group and record the result in ``job["has_reappeared"]``.

    Nothing happens for reprocessed events, for jobs whose ``has_reappeared``
    is already falsy, for events without a group, or for issue types that do
    not detect escalation.

    Otherwise one of two paths runs:

    * Group is ``IGNORED``/``UNTIL_ESCALATING`` (and the new-escalation logic
      does not apply): if ``is_escalating`` reports an escalation the issue
      state is updated and ``has_reappeared`` is set to True; the function
      returns either way.
    * Snooze path: ``has_reappeared`` is set to False when there is no
      ``GroupSnooze`` or the snooze is still valid. When the snooze no longer
      applies, the issue state is updated, the snooze is deleted,
      ``issue_unignored`` is sent and ``has_reappeared`` is set to True.
    """
    # we process snoozes before rules as it might create a regression
    # but not if it's new because you can't immediately snooze a new group
    if job["is_reprocessed"] or not job["has_reappeared"]:
        return

    from sentry.issues.escalating import is_escalating, manage_issue_states
    from sentry.models.group import GroupStatus
    from sentry.models.groupinbox import GroupInboxReason
    from sentry.models.groupsnooze import GroupSnooze
    from sentry.types.group import GroupSubStatus

    event = job["event"]
    group = event.group
    if not group:
        logger.error(
            "Group not found on event while processing snoozes", extra={"event_id": event.event_id}
        )
        return

    if not group.issue_type.should_detect_escalation():
        return

    # groups less than a day old should use the new -> escalating logic
    group_age_hours = (timezone.now() - group.first_seen).total_seconds() / 3600
    should_use_new_escalation_logic = (
        group_age_hours < MAX_NEW_ESCALATION_AGE_HOURS
        and features.has("projects:first-event-severity-new-escalation", group.project)
    )
    # Check if group is escalating
    if (
        not should_use_new_escalation_logic
        and group.status == GroupStatus.IGNORED
        and group.substatus == GroupSubStatus.UNTIL_ESCALATING
    ):
        escalating, forecast = is_escalating(group)
        if escalating:
            manage_issue_states(
                group, GroupInboxReason.ESCALATING, event, activity_data={"forecast": forecast}
            )

            job["has_reappeared"] = True
        return

    with metrics.timer("post_process.process_snoozes.duration"):
        key = GroupSnooze.get_cache_key(group.id)
        snooze = cache.get(key)
        if snooze is None:
            try:
                snooze = GroupSnooze.objects.get(group=group)
            except GroupSnooze.DoesNotExist:
                # False (not None) is cached so that a missing snooze is
                # distinguishable from a cache miss.
                snooze = False
            # This cache is also set in post_save|delete.
            cache.set(key, snooze, 3600)
        if not snooze:
            job["has_reappeared"] = False
            return

        # GroupSnooze row exists but the Group.status isn't ignored
        # this shouldn't be possible, if this fires, there may be a race or bug.
        # Compare by value: identity comparison of integers only works by
        # accident of the interpreter's small-int caching.
        if group.status != GroupStatus.IGNORED:
            # log a metric for now, we can potentially set the status and substatus but that might mask some other bug
            metrics.incr(
                "post_process.process_snoozes.mismatch_status",
                tags={
                    "group_status": group.status,
                    "group_substatus": group.substatus,
                },
            )

        snooze_condition_still_applies = snooze.is_valid(
            group, test_rates=True, use_pending_data=True
        )
        if snooze_condition_still_applies:
            job["has_reappeared"] = False
            return

        snooze_details = {
            "until": snooze.until,
            "count": snooze.count,
            "window": snooze.window,
            "user_count": snooze.user_count,
            "user_window": snooze.user_window,
        }

        # issues snoozed with a specific time duration should be marked ONGOING when the window expires
        reason = (
            GroupInboxReason.ONGOING if snooze.until is not None else GroupInboxReason.ESCALATING
        )
        manage_issue_states(group, reason, event, snooze_details)

        snooze.delete()

        issue_unignored.send_robust(
            project=group.project,
            user_id=None,
            group=group,
            transition_type="automatic",
            sender="process_snoozes",
        )

        job["has_reappeared"] = True


def process_replay_link(job: PostProcessJob) -> None:
    """
    Publish a replay-linking payload for events that carry a valid replay id.

    Reprocessed events, events without a replay id, and events whose replay
    id is not a valid UUID are skipped. The payload is published to the
    ``"ingest-replay-events"`` topic.
    """
    if job["is_reprocessed"]:
        return

    metrics.incr("post_process.process_replay_link.id_sampled")

    group_event = job["event"]

    # replay ids can either come as a context, or a tag.
    # right now they come as a context on non-js events,
    # and javascript transaction (through DSC context)
    # It comes as a tag on js errors.
    # TODO: normalize this upstream in relay and javascript SDK. and eventually remove the tag
    # logic.
    replay_id = get_path(
        group_event.data, "contexts", "replay", "replay_id"
    ) or group_event.get_tag("replayId")
    if not replay_id:
        return

    # Reject anything that does not parse as a UUID.
    try:
        uuid.UUID(replay_id)
    except (ValueError, TypeError):
        return

    metrics.incr("post_process.process_replay_link.id_exists")

    publisher = initialize_replays_publisher(is_async=True)
    try:
        payload = transform_event_for_linking_payload(replay_id, group_event)
    except ValueError:
        metrics.incr("post_process.process_replay_link.id_invalid")
        return

    publisher.publish("ingest-replay-events", json.dumps(payload))


def process_rules(job: PostProcessJob) -> None:
    """
    Run the rule processor for the event and execute every callback it yields.

    Sets ``job["has_alert"]`` to True when at least one callback was yielded
    by the processor, otherwise to False. Reprocessed events are skipped and
    leave ``job["has_alert"]`` untouched.
    """
    if job["is_reprocessed"]:
        return

    from sentry.rules.processing.processor import RuleProcessor

    group_event = job["event"]
    group_state = job["group_state"]

    processor = RuleProcessor(
        group_event,
        group_state["is_new"],
        group_state["is_regression"],
        group_state["is_new_group_environment"],
        job["has_reappeared"],
        job["has_escalated"],
    )

    fired = False
    with sentry_sdk.start_span(op="tasks.post_process_group.rule_processor_callbacks"):
        # TODO(dcramer): ideally this would fanout, but serializing giant
        # objects back and forth isn't super efficient
        for callback, futures in processor.apply():
            fired = True
            safe_execute(callback, group_event, futures)

    job["has_alert"] = fired


def process_code_mappings(job: PostProcessJob) -> None:
    """
    Queue a code-mapping derivation task for the event, subject to throttling.

    Skipped for reprocessed events, unsupported platforms, and whenever either
    the per-project or the per-group cache key is already set. Any exception
    raised along the way is logged instead of propagated.
    """
    if job["is_reprocessed"]:
        return

    from sentry.tasks.derive_code_mappings import SUPPORTED_LANGUAGES, derive_code_mappings

    try:
        event = job["event"]
        project = event.project
        group_id = event.group_id

        # Only supported platforms are considered.
        if event.data.get("platform") not in SUPPORTED_LANGUAGES:
            return

        # To limit the overall number of tasks, only process one issue per project per hour. In
        # order to give the most issues a chance to be processed, don't reprocess any given
        # issue for at least 24 hours.
        project_cache_key = f"code-mappings:project:{project.id}"
        issue_cache_key = f"code-mappings:group:{group_id}"
        throttled = (
            cache.get(project_cache_key) is not None or cache.get(issue_cache_key) is not None
        )
        if throttled:
            return
        cache.set(project_cache_key, True, 3600)  # 1 hour
        cache.set(issue_cache_key, True, 86400)  # 24 hours

        org = project.organization
        org_slug = org.slug
        next_time = timezone.now() + timedelta(hours=1)

        if not features.has("organizations:derive-code-mappings", org):
            return

        log_context: dict[str, Any] = {
            "organization.slug": org_slug,
            "project.slug": project.slug,
            "group_id": group_id,
            "next_time": next_time,
        }
        logger.info(
            "derive_code_mappings: Queuing code mapping derivation",
            extra=log_context,
        )
        derive_code_mappings.delay(project.id, event.data)

    except Exception:
        logger.exception("derive_code_mappings: Failed to process code mappings")


def process_commits(job: PostProcessJob) -> None:
    """
    Queue commit-context or suspect-commit processing for the event.

    Runs under a 10 second per-group lock; if the lock cannot be acquired the
    step is silently skipped. Nothing is queued when the organization has no
    commits. With an SCM integration (github, gitlab, github_enterprise) the
    commit-context task is queued for new groups only; without one the
    suspect-commits task is queued unless its debounce cache key is set.
    """
    if job["is_reprocessed"]:
        return

    from sentry.models.commit import Commit
    from sentry.tasks.commit_context import process_commit_context
    from sentry.tasks.groupowner import DEBOUNCE_CACHE_KEY as SUSPECT_COMMITS_DEBOUNCE_CACHE_KEY
    from sentry.tasks.groupowner import process_suspect_commits

    event = job["event"]

    try:
        lock = locks.get(
            f"w-o:{event.group_id}-d-l",
            duration=10,
            name="post_process_w_o",
        )
        with lock.acquire():
            organization_id = event.project.organization_id

            # "Does this organization have any commit at all?" is cached for an hour.
            has_commit_key = f"w-o:{organization_id}-h-c"
            org_has_commit = cache.get(has_commit_key)
            if org_has_commit is None:
                org_has_commit = Commit.objects.filter(organization_id=organization_id).exists()
                cache.set(has_commit_key, org_has_commit, 3600)

            if not org_has_commit:
                return

            from sentry.utils.committers import get_frame_paths

            event_frames = get_frame_paths(event)
            sdk_name = get_sdk_name(event.data)

            integration_cache_key = f"commit-context-scm-integration:{organization_id}"
            has_integrations = cache.get(integration_cache_key)
            if has_integrations is None:
                from sentry.services.hybrid_cloud.integration import integration_service

                org_integrations = integration_service.get_organization_integrations(
                    organization_id=organization_id,
                    providers=["github", "gitlab", "github_enterprise"],
                )
                has_integrations = len(org_integrations) > 0
                # Cache the integrations check for 4 hours
                cache.set(integration_cache_key, has_integrations, 14400)

            if has_integrations:
                if not job["group_state"]["is_new"]:
                    return
                task = process_commit_context
            else:
                debounce_key = SUSPECT_COMMITS_DEBOUNCE_CACHE_KEY(event.group_id)
                if cache.get(debounce_key):
                    metrics.incr("sentry.tasks.process_suspect_commits.debounce")
                    return
                task = process_suspect_commits

            # Both tasks are queued with the same keyword arguments.
            task.delay(
                event_id=event.event_id,
                event_platform=event.platform,
                event_frames=event_frames,
                group_id=event.group_id,
                project_id=event.project_id,
                sdk_name=sdk_name,
            )
    except UnableToAcquireLock:
        pass


def handle_auto_assignment(job: PostProcessJob) -> None:
    """
    Delegate auto-assignment of the event to ``ProjectOwnership``.

    Reprocessed events are skipped. Any exception raised while assigning is
    logged and not propagated.
    """
    if job["is_reprocessed"]:
        return

    from sentry.models.projectownership import ProjectOwnership

    event = job["event"]
    try:
        organization_id = event.project.organization_id
        ProjectOwnership.handle_auto_assignment(
            project_id=event.project_id,
            organization_id=organization_id,
            event=event,
            logging_extra={
                "event_id": event.event_id,
                "group_id": str(event.group_id),
                "project_id": str(event.project_id),
                "organization_id": organization_id,
                "source": "post_process",
            },
        )
    except Exception:
        logger.exception("Failed to set auto-assignment")


def process_service_hooks(job: PostProcessJob) -> None:
    """
    Queue ``process_service_hook`` for every service hook subscribed to this event.

    A hook matches when it lists ``"event.created"``, or ``"event.alert"`` if
    ``job["has_alert"]`` is truthy. Skipped for reprocessed events and for
    projects without the ``projects:servicehooks`` feature.
    """
    if job["is_reprocessed"]:
        return

    from sentry.tasks.servicehooks import process_service_hook

    event = job["event"]
    has_alert = job["has_alert"]

    if not features.has("projects:servicehooks", project=event.project):
        return

    allowed_events = {"event.created", "event.alert"} if has_alert else {"event.created"}

    for servicehook_id, subscribed in _get_service_hooks(project_id=event.project_id):
        if any(name in allowed_events for name in subscribed):
            process_service_hook.delay(servicehook_id=servicehook_id, event=event)


def process_resource_change_bounds(job: PostProcessJob) -> None:
    """
    Queue "created" resource-change tasks for the event and/or its group.

    An ``Error`` task is queued for error events when
    ``_should_send_error_created_hooks`` allows it for the project; a
    ``Group`` task is queued when the group is new. Reprocessed events are
    skipped.
    """
    if job["is_reprocessed"]:
        return

    from sentry.tasks.sentry_apps import process_resource_change_bound

    event = job["event"]
    group_is_new = job["group_state"]["is_new"]

    is_error_event = event.get_event_type() == "error"
    if is_error_event and _should_send_error_created_hooks(event.project):
        process_resource_change_bound.delay(
            action="created",
            sender="Error",
            instance_id=event.event_id,
            instance=event,
        )

    if group_is_new:
        process_resource_change_bound.delay(
            action="created",
            sender="Group",
            instance_id=event.group_id,
        )


def process_plugins(job: PostProcessJob) -> None:
    """
    Run ``plugin_post_process_group`` for every plugin enabled on the event's project.

    Each call receives the plugin slug, the event, ``is_new`` and
    ``is_regression`` from the job's group state. Reprocessed events are
    skipped.
    """
    if job["is_reprocessed"]:
        return

    from sentry.plugins.base import plugins

    event = job["event"]
    group_state = job["group_state"]
    is_new = group_state["is_new"]
    is_regression = group_state["is_regression"]

    for plugin in plugins.for_project(event.project):
        plugin_post_process_group(
            plugin_slug=plugin.slug,
            event=event,
            is_new=is_new,
            is_regression=is_regression,
            # The flag used to be passed only under this misspelled keyword;
            # it is still sent so that code reading the old name keeps working.
            is_regresion=is_regression,
        )


def process_similarity(job: PostProcessJob) -> None:
    """
    Record the event with the similarity backend.

    The call goes through ``safe_execute``; reprocessed events are skipped.
    """
    if job["is_reprocessed"]:
        return

    from sentry import similarity

    processed_event = job["event"]

    with sentry_sdk.start_span(op="tasks.post_process_group.similarity"):
        safe_execute(similarity.record, processed_event.project, [processed_event])


def fire_error_processed(job: PostProcessJob):
    """
    Send the ``event_processed`` signal for the event, unless it was reprocessed.
    """
    if not job["is_reprocessed"]:
        processed_event = job["event"]
        event_processed.send_robust(
            sender=post_process_group,
            project=processed_event.project,
            event=processed_event,
        )


def sdk_crash_monitoring(job: PostProcessJob) -> None:
    """
    Run SDK crash detection on the event.

    Skipped for reprocessed events, for organizations without the
    ``organizations:sdk-crash-detection`` feature, and when no detection
    configs are available.
    """
    from sentry.utils.sdk_crashes.sdk_crash_detection import sdk_crash_detection

    if job["is_reprocessed"]:
        return

    event = job["event"]

    if not features.has("organizations:sdk-crash-detection", event.project.organization):
        return

    configs = build_sdk_crash_detection_configs()
    # An empty (or missing) config collection is falsy, so one truthiness
    # check covers both cases.
    if not configs:
        return

    with sentry_sdk.start_span(op="tasks.post_process_group.sdk_crash_monitoring"):
        sdk_crash_detection.detect_sdk_crash(
            event=event,
            configs=configs,
        )


def plugin_post_process_group(plugin_slug, event, **kwargs):
    """
    Invoke the ``post_process`` hook of the plugin identified by ``plugin_slug``.

    Extra keyword arguments are forwarded to the hook. A ``PluginError`` is
    logged at info level, any other exception via ``logger.exception``;
    neither is propagated.
    """
    set_current_event_project(event.project_id)

    from sentry.plugins.base import plugins

    target = plugins.get(plugin_slug)
    try:
        target.post_process(
            event=event,
            group=event.group,
            **kwargs,
        )
    except PluginError as exc:
        logger.info("post_process.process_error_ignored", extra={"exception": exc})
    except Exception as exc:
        logger.exception("post_process.process_error", extra={"exception": exc})


def feedback_filter_decorator(func):
    """
    Wrap a pipeline step so it only runs when ``should_postprocess_feedback(job)`` is true.

    When the check fails the wrapped step is not called and ``None`` is
    returned. The wrapper keeps the metadata of ``func`` (``__name__``,
    ``__doc__``, ...) so that wrapped steps stay distinguishable from each
    other when introspected.
    """
    import functools

    @functools.wraps(func)
    def wrapper(job):
        if not should_postprocess_feedback(job):
            return
        return func(job)

    return wrapper


def should_postprocess_feedback(job: PostProcessJob) -> bool:
    """
    Decide whether a feedback event should go through its post-process steps.

    Returns False when the event has no occurrence, or when the occurrence is
    flagged as spam and the spam-filter-actions feature is enabled. Returns
    True for sources in the "new feedback" category, and for sources in the
    "old feedback" category when the project option
    ``sentry:feedback_user_report_notifications`` (or its well-known default)
    is truthy. Everything else yields False.
    """
    from sentry.feedback.usecases.create_feedback import FeedbackCreationSource

    event = job["event"]

    occurrence = getattr(event, "occurrence", None)
    if occurrence is None:
        return False

    evidence = occurrence.evidence_data

    flagged_as_spam = evidence.get("is_spam") is True
    if flagged_as_spam and features.has(
        "organizations:user-feedback-spam-filter-actions", event.project.organization
    ):
        metrics.incr("feedback.spam-detection-actions.dont-send-notification")
        return False

    source = evidence.get("source")
    if source in FeedbackCreationSource.new_feedback_category_values():
        return True

    project = event.project
    notify_on_old = project.get_option("sentry:feedback_user_report_notifications")
    if notify_on_old is None:
        # Option not set on the project: use the well-known default for the
        # project's option epoch.
        notify_on_old = projectoptions.get_well_known_default(
            "sentry:feedback_user_report_notifications",
            epoch=project.get_option("sentry:option-epoch"),
        )

    is_old_source = source in FeedbackCreationSource.old_feedback_category_values()
    return bool(is_old_source and notify_on_old)


def check_has_high_priority_alerts(job: PostProcessJob) -> None:
    """
    Determine if we should fire a task to check if the new issue
    threshold has been met to enable high priority alerts.

    Nothing is done when the project already has high priority alerts or when
    the per-project cache key is already set. Otherwise the check task is
    queued under a 10 second lock and the key is cached for 24 hours. Failing
    to acquire the lock is ignored; any other exception is logged as a
    warning and not propagated.
    """
    # Bound up front so the error handler can reference it even if reading
    # the job fails.
    event = None
    try:
        event = job["event"]
        if event.project.flags.has_high_priority_alerts:
            return

        from sentry.tasks.check_new_issue_threshold_met import (
            check_new_issue_threshold_met,
            new_issue_threshold_key,
        )

        # If the new issue volume has already been checked today, don't recalculate regardless of the value
        project_key = new_issue_threshold_key(event.project_id)
        threshold_met = cache.get(project_key)
        if threshold_met is not None:
            return

        try:
            lock = locks.get(project_key, duration=10)
            with lock.acquire():
                # Check again under the lock: another worker may have
                # scheduled the task since the first cache read.
                task_scheduled = cache.get(project_key)
                if task_scheduled is not None:
                    return

                check_new_issue_threshold_met.delay(event.project.id)

                # Add the key to cache for 24 hours
                cache.set(project_key, True, 60 * 60 * 24)
        except UnableToAcquireLock:
            pass
    except Exception as e:
        # The error goes into ``extra``: the message has no %-placeholder, so
        # passing it as a positional logging argument would break formatting
        # of the record.
        logger.warning(
            "Failed to check new issue threshold met",
            extra={
                "project_id": getattr(event, "project_id", None),
                "error": repr(e),
            },
        )


def link_event_to_user_report(job: PostProcessJob) -> None:
    """
    Attach the event's group and environment to user reports filed for the event.

    With the ``organizations:user-feedback-event-link-ingestion-changes``
    feature enabled and the event not reprocessed, only reports that have
    neither a group nor an environment are considered: each one is shimmed to
    feedback and then the reports are updated. In every other case all
    reports for the event are updated directly.
    """
    from sentry.feedback.usecases.create_feedback import FeedbackCreationSource, shim_to_feedback
    from sentry.models.userreport import UserReport

    event = job["event"]
    project = event.project
    group = event.group

    use_ingestion_changes = (
        features.has(
            "organizations:user-feedback-event-link-ingestion-changes", project.organization
        )
        and not job["is_reprocessed"]
    )

    if not use_ingestion_changes:
        UserReport.objects.filter(project_id=project.id, event_id=event.event_id).update(
            group_id=group.id, environment_id=event.get_environment().id
        )
        return

    metrics.incr("event_manager.save._update_user_reports_with_event_link")
    unlinked_reports = UserReport.objects.filter(
        project_id=project.id,
        event_id=event.event_id,
        group_id__isnull=True,
        environment_id__isnull=True,
    )
    for report in unlinked_reports:
        feedback_payload = {
            "name": report.name,
            "email": report.email,
            "comments": report.comments,
            "event_id": report.event_id,
            "level": "error",
        }
        shim_to_feedback(
            feedback_payload,
            event,
            project,
            FeedbackCreationSource.USER_REPORT_ENVELOPE,
        )

    updated_count = unlinked_reports.update(
        group_id=group.id, environment_id=event.get_environment().id
    )
    if updated_count:
        metrics.incr("event_manager.save._update_user_reports_with_event_link_updated")


# Age limit in hours: process_snoozes and detect_new_escalation only apply the
# new-issue escalation logic to groups younger than this.
MAX_NEW_ESCALATION_AGE_HOURS = 24
# detect_new_escalation skips groups that have been seen fewer times than this.
MIN_EVENTS_FOR_NEW_ESCALATION = 10


def detect_new_escalation(job: PostProcessJob):
    """
    Check whether a new issue is escalating and, if so, mark it as such.

    Only groups younger than MAX_NEW_ESCALATION_AGE_HOURS hours, with
    substatus NEW and at least MIN_EVENTS_FOR_NEW_ESCALATION events are
    examined, and only when the ``projects:first-event-severity-new-escalation``
    feature is enabled for the project.

    When the group's hourly event rate exceeds the project's latest threshold,
    ``job["has_escalated"]`` is set to True and the group is moved to
    UNRESOLVED/ESCALATING, together with the matching inbox entry, group
    history, activity and priority update.
    """
    from sentry.issues.issue_velocity import get_latest_threshold
    from sentry.issues.priority import PriorityChangeReason, auto_update_priority
    from sentry.models.activity import Activity
    from sentry.models.group import GroupStatus
    from sentry.models.grouphistory import GroupHistoryStatus, record_group_history
    from sentry.models.groupinbox import GroupInboxReason, add_group_to_inbox
    from sentry.types.activity import ActivityType

    event = job["event"]
    group = event.group
    if not group or not features.has(
        "projects:first-event-severity-new-escalation", event.project
    ):
        return

    log_context = {
        "org_id": group.organization.id,
        "project_id": event.project.id,
        "group_id": group.id,
    }

    # Groups younger than one hour are treated as exactly one hour old.
    age_seconds = (timezone.now() - group.first_seen).total_seconds()
    if age_seconds >= 3600:
        age_hours = age_seconds / 3600
    else:
        age_hours = 1

    times_seen = group.times_seen_with_pending
    is_new_substatus = group.substatus == GroupSubStatus.NEW
    eligible = (
        age_hours < MAX_NEW_ESCALATION_AGE_HOURS
        and is_new_substatus
        and times_seen >= MIN_EVENTS_FOR_NEW_ESCALATION
    )
    if not eligible:
        metrics.incr("tasks.post_process.detect_new_escalation.skipping_detection")
        return

    # Get escalation lock for this group. If we're unable to acquire this lock, another process is handling
    # this group at the same time. In that case, just exit early, no need to retry.
    lock = locks.get(f"detect_escalation:{group.id}", duration=10, name="detect_escalation")
    try:
        with lock.acquire():
            project_rate = get_latest_threshold(event.project)
            group_rate = times_seen / age_hours
            # a rate of 0 means there was no threshold that could be calculated
            if project_rate > 0 and group_rate > project_rate:
                job["has_escalated"] = True
                group.update(status=GroupStatus.UNRESOLVED, substatus=GroupSubStatus.ESCALATING)
                # TODO(snigdha): reuse manage_issue_states when we allow escalating from other statuses
                add_group_to_inbox(group, GroupInboxReason.ESCALATING)
                record_group_history(group, GroupHistoryStatus.ESCALATING)
                Activity.objects.create_group_activity(
                    group=group,
                    type=ActivityType.SET_ESCALATING,
                    data={"event_id": event.event_id},
                )
                auto_update_priority(group, PriorityChangeReason.ESCALATING)
            logger.info(
                "tasks.post_process.detect_new_escalation",
                extra={
                    **log_context,
                    "group_hourly_event_rate": group_rate,
                    "project_escalation_rate": project_rate,
                    "has_escalated": job["has_escalated"],
                },
            )
    except UnableToAcquireLock as error:
        log_context["error"] = error
        logger.warning(
            "tasks.post_process.detect_new_escalation.unable_to_acquire_lock", extra=log_context
        )


# Post-process step callables, keyed by GroupCategory. Each step takes the
# PostProcessJob as its only argument.
# NOTE(review): the steps are presumably run in list order by the caller;
# confirm before reordering. Several steps communicate through the job dict:
#   - process_snoozes may update job["has_reappeared"], which process_inbox_adds
#     and process_rules read.
#   - detect_new_escalation may set job["has_escalated"], which process_rules reads.
#   - process_rules sets job["has_alert"], which process_service_hooks reads.
GROUP_CATEGORY_POST_PROCESS_PIPELINE = {
    GroupCategory.ERROR: [
        _capture_group_stats,
        process_snoozes,
        process_inbox_adds,
        check_has_high_priority_alerts,
        detect_new_escalation,
        process_commits,
        handle_owner_assignment,
        handle_auto_assignment,
        process_rules,
        process_service_hooks,
        process_resource_change_bounds,
        process_plugins,
        process_code_mappings,
        process_similarity,
        update_existing_attachments,
        fire_error_processed,
        sdk_crash_monitoring,
        process_replay_link,
        link_event_to_user_report,
    ],
    # Feedback steps are wrapped so that they only run when
    # should_postprocess_feedback(job) returns True.
    GroupCategory.FEEDBACK: [
        feedback_filter_decorator(process_snoozes),
        feedback_filter_decorator(process_inbox_adds),
        feedback_filter_decorator(process_rules),
    ],
}

# Step callables for the generic pipeline: snoozes, inbox adds and rules.
# NOTE(review): presumably used for group categories that have no entry in
# GROUP_CATEGORY_POST_PROCESS_PIPELINE; confirm against the caller.
GENERIC_POST_PROCESS_PIPELINE = [
    process_snoozes,
    process_inbox_adds,
    process_rules,
]