# test_metrics_extraction.py
  1. import time
  2. import uuid
  3. import confluent_kafka as kafka
  4. import pytest
  5. from sentry.sentry_metrics.indexer.strings import SHARED_STRINGS
  6. from sentry.testutils.cases import TransactionTestCase
  7. from sentry.testutils.helpers.datetime import before_now, iso_format
  8. from sentry.testutils.helpers.features import Feature
  9. from sentry.testutils.helpers.options import override_options
  10. from sentry.testutils.relay import RelayStoreHelper
  11. from sentry.testutils.skips import requires_kafka
  12. from sentry.utils import json
# Every test in this module talks to a real Kafka broker; skip the whole
# module when one is not available.
pytestmark = [requires_kafka]
  14. class MetricsExtractionTest(RelayStoreHelper, TransactionTestCase):
  15. @pytest.mark.skip("breaks in Relay for unknown reasons")
  16. @override_options({"relay.transaction-names-client-based": 1.0})
  17. def test_all_transaction_metrics_emitted(self):
  18. with Feature(
  19. {
  20. "organizations:transaction-metrics-extraction": True,
  21. }
  22. ):
  23. event_data = {
  24. "type": "transaction",
  25. "transaction": "foo",
  26. "transaction_info": {"source": "url"}, # 'transaction' tag not extracted
  27. "timestamp": iso_format(before_now(seconds=1)),
  28. "start_timestamp": iso_format(before_now(seconds=2)),
  29. "contexts": {
  30. "trace": {
  31. "trace_id": 32 * "b",
  32. "span_id": 16 * "c",
  33. "type": "trace",
  34. }
  35. },
  36. "user": {"id": 123},
  37. "measurements": {
  38. "fp": {"value": 2258.060000000114},
  39. "fcp": {"value": 2258.060000000114},
  40. "lcp": {"value": 2807.335},
  41. "inp": {"value": 51.318},
  42. "fid": {"value": 3.4900000027846545},
  43. "cls": {"value": 0.0382},
  44. "frames_total": {"value": 100},
  45. "frames_slow": {"value": 10},
  46. "frames_frozen": {"value": 5},
  47. "stall_count": {"value": 2},
  48. "stall_total_time": {"value": 12},
  49. "stall_longest_time": {"value": 7},
  50. "app_start_warm": {"value": 0.001},
  51. "app_start_cold": {"value": 0.001},
  52. "ttfb": {"value": 5},
  53. "ttfb.requesttime": {"value": 6},
  54. },
  55. "spans": [
  56. {
  57. "op": op,
  58. "trace_id": 32 * "b",
  59. "span_id": 16 * "1",
  60. "start_timestamp": iso_format(before_now(seconds=2)),
  61. "timestamp": iso_format(before_now(seconds=1)),
  62. }
  63. for op in ("db", "http", "resource", "browser", "ui")
  64. ],
  65. }
  66. settings = {
  67. "bootstrap.servers": "127.0.0.1:9092", # TODO: read from django settings here
  68. "group.id": "test-consumer-%s" % uuid.uuid4().hex,
  69. "enable.auto.commit": True,
  70. "auto.offset.reset": "earliest",
  71. }
  72. consumer = kafka.Consumer(settings)
  73. consumer.assign([kafka.TopicPartition("ingest-metrics", 0)])
  74. self.post_and_retrieve_event(event_data)
  75. strings_emitted = set()
  76. for _ in range(1000):
  77. message = consumer.poll(timeout=1.0)
  78. if message is None:
  79. break
  80. message = json.loads(message.value())
  81. if message["project_id"] == self.project.id:
  82. strings_emitted.add(message["name"])
  83. for key, value in message["tags"].items():
  84. strings_emitted.add(key)
  85. strings_emitted.add(value)
  86. consumer.close()
  87. #: These strings should be common strings, but we cannot add them
  88. #: to the indexer because they already exist in the release health
  89. #: indexer db.
  90. known_non_common_strings = {
  91. "other",
  92. "platform",
  93. "d:transactions/measurements.inp@millisecond",
  94. }
  95. # Make sure that all the standard strings are part of the list of common strings:
  96. non_common_strings = strings_emitted - SHARED_STRINGS.keys()
  97. assert non_common_strings == known_non_common_strings
  98. def test_histogram_outliers(self):
  99. with Feature(
  100. {
  101. "organizations:transaction-metrics-extraction": True,
  102. }
  103. ):
  104. event_data = {
  105. "type": "transaction",
  106. "transaction": "foo",
  107. "transaction_info": {"source": "url"}, # 'transaction' tag not extracted
  108. "timestamp": iso_format(before_now(seconds=1)),
  109. "start_timestamp": iso_format(before_now(seconds=2)),
  110. "platform": "javascript",
  111. "contexts": {
  112. "trace": {
  113. "op": "pageload",
  114. "trace_id": 32 * "b",
  115. "span_id": 16 * "c",
  116. "type": "trace",
  117. }
  118. },
  119. "user": {"id": 123},
  120. "measurements": {
  121. "fcp": {"value": 999999999.0},
  122. "lcp": {"value": 0.0},
  123. },
  124. }
  125. settings = {
  126. "bootstrap.servers": "127.0.0.1:9092", # TODO: read from django settings here
  127. "group.id": "test-consumer-%s" % uuid.uuid4().hex,
  128. "enable.auto.commit": True,
  129. "auto.offset.reset": "earliest",
  130. }
  131. consumer = kafka.Consumer(settings)
  132. consumer.assign([kafka.TopicPartition("ingest-performance-metrics", 0)])
  133. self.post_and_retrieve_event(event_data)
  134. histogram_outlier_tags = {}
  135. buckets = []
  136. t0 = time.monotonic()
  137. for attempt in range(1000):
  138. message = consumer.poll(timeout=1.0)
  139. if message is None:
  140. break
  141. bucket = json.loads(message.value())
  142. buckets.append(bucket)
  143. try:
  144. histogram_outlier_tags[bucket["name"]] = bucket["tags"]["histogram_outlier"]
  145. except KeyError:
  146. pass
  147. consumer.close()
  148. assert histogram_outlier_tags == {
  149. "d:transactions/duration@millisecond": "inlier",
  150. "d:transactions/measurements.fcp@millisecond": "outlier",
  151. "d:transactions/measurements.lcp@millisecond": "inlier",
  152. }, {
  153. "attempts": attempt,
  154. "time_elapsed": time.monotonic() - t0,
  155. "bucket_count": len(buckets),
  156. }