123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203 |
- import copy
- import time
- import uuid
- from datetime import datetime, timedelta
- from unittest import mock
- import pytest
- from django.utils import timezone
- from snuba_sdk.column import InvalidColumnError
- from sentry.testutils.cases import SnubaTestCase, TestCase
- from sentry.testutils.helpers.datetime import before_now
- from sentry.utils import snuba
class SnubaTest(TestCase, SnubaTestCase):
    """Basic tests for ``snuba.query`` using events inserted via ``snuba_insert``."""

    def _insert_event_for_time(self, ts, hash="a" * 32, group_id=None, event_id=None):
        """Insert one minimal event for ``self.project`` timestamped at ``ts``.

        Args:
            ts: Datetime used for the event's ``datetime`` field and for the
                ``received`` value in its ``data``.
            hash: Stored as ``primary_hash``. Its first 16 hex digits are also
                parsed into the group id when ``group_id`` is falsy.
            group_id: Explicit group id; a falsy value (``None``, ``0``) falls
                back to the hash-derived id.
            event_id: Explicit event id; a random UUID hex is generated when
                omitted.
        """
        if event_id is None:
            event_id = uuid.uuid4().hex

        payload = {
            "event_id": event_id,
            "primary_hash": hash,
            "group_id": group_id if group_id else int(hash[:16], 16),
            "project_id": self.project.id,
            "message": "message",
            "platform": "python",
            "datetime": ts.strftime("%Y-%m-%dT%H:%M:%S.%fZ"),
            "data": {"received": time.mktime(ts.timetuple())},
        }
        # NOTE(review): the leading 2 / "insert" and the trailing empty dict are
        # presumably the message version, action and extra state expected by
        # snuba_insert -- confirm against that helper.
        self.snuba_insert((2, "insert", payload, {}))

    def test(self) -> None:
        """This is just a simple 'hello, world' example test."""
        # NOTE(review): datetime.now() is naive local time, but the inserted
        # event's "datetime" string carries a literal "Z" suffix. The one-day
        # margins on the query window below absorb any offset -- confirm
        # whether an aware timestamp is preferred here.
        now = datetime.now()
        self._insert_event_for_time(
            now,
            hash="1" * 32,
            group_id=1,
            event_id="a" * 32,
        )

        result = snuba.query(
            start=now - timedelta(days=1),
            end=now + timedelta(days=1),
            groupby=["project_id"],
            filter_keys={"project_id": [self.project.id]},
            referrer="testing.test",
            tenant_ids={"referrer": "testing.test", "organization_id": 1},
        )
        assert result == {self.project.id: 1}

    def test_fail(self) -> None:
        """Grouping by the malformed column name ")(" raises InvalidColumnError."""
        now = datetime.now()
        with pytest.raises(InvalidColumnError):
            snuba.query(
                start=now - timedelta(days=1),
                end=now + timedelta(days=1),
                filter_keys={"project_id": [self.project.id]},
                groupby=[")("],
                referrer="testing.test",
            )

    def test_organization_retention_respected(self) -> None:
        """The ``system.event-retention-days`` option limits which events are counted."""
        base_time = timezone.now()

        # One event a minute old and one two days old.
        self._insert_event_for_time(base_time - timedelta(minutes=1))
        self._insert_event_for_time(base_time - timedelta(days=2))

        def _get_event_count():
            # attempt to query back 90 days
            return snuba.query(
                start=base_time - timedelta(days=90),
                end=base_time + timedelta(days=1),
                groupby=["project_id"],
                filter_keys={"project_id": [self.project.id]},
                referrer="testing.test",
                tenant_ids={"referrer": "testing.test", "organization_id": 1},
            )

        # Without the option override both events are counted.
        assert _get_event_count() == {self.project.id: 2}

        # With retention set to one day only the minute-old event is counted.
        with self.options({"system.event-retention-days": 1}):
            assert _get_event_count() == {self.project.id: 1}

    def test_organization_retention_larger_than_end_date(self) -> None:
        """A window ending 60 days ago yields an empty result under 1-day retention."""
        base_time = timezone.now()

        with self.options({"system.event-retention-days": 1}):
            result = snuba.query(
                start=base_time - timedelta(days=90),
                end=base_time - timedelta(days=60),
                groupby=["project_id"],
                filter_keys={"project_id": [self.project.id]},
                referrer="testing.test",
            )
            assert result == {}
class BulkRawQueryTest(TestCase, SnubaTestCase):
    """Tests for ``snuba.bulk_raw_query``, with and without ``use_cache``."""

    def _store_fingerprinted_event(self, fingerprint, timestamp, message="hello"):
        """Store an event in ``self.project`` with a single-entry fingerprint.

        Returns whatever ``self.store_event`` returns.
        """
        return self.store_event(
            data={"fingerprint": [fingerprint], "message": message, "timestamp": timestamp},
            project_id=self.project.id,
        )

    def _params_for_group(self, group_id):
        """Build query params selecting the last day's events of one group."""
        return snuba.SnubaQueryParams(
            start=timezone.now() - timedelta(days=1),
            end=timezone.now(),
            selected_columns=["event_id", "group_id", "timestamp"],
            filter_keys={"project_id": [self.project.id], "group_id": [group_id]},
            tenant_ids={"referrer": "testing.test", "organization_id": 1},
        )

    @staticmethod
    def _group_event_pairs(results):
        """Reduce each result's ``data`` rows to a set of (group_id, event_id) pairs."""
        return [{(item["group_id"], item["event_id"]) for item in r["data"]} for r in results]

    def test_simple(self) -> None:
        """Each query in the batch returns only the event of its own group."""
        one_min_ago = before_now(minutes=1).isoformat()
        event_1 = self._store_fingerprinted_event("group-1", one_min_ago)
        event_2 = self._store_fingerprinted_event("group-2", one_min_ago)

        results = snuba.bulk_raw_query(
            [
                self._params_for_group(event_1.group.id),
                self._params_for_group(event_2.group.id),
            ],
        )

        assert self._group_event_pairs(results) == [
            {(event_1.group.id, event_1.event_id)},
            {(event_2.group.id, event_2.event_id)},
        ]

    @mock.patch("sentry.utils.snuba._bulk_snuba_query", side_effect=snuba._bulk_snuba_query)
    def test_cache(self, _bulk_snuba_query) -> None:
        """A repeated cached query returns the first results without calling the backend.

        ``_bulk_snuba_query`` is patched with the real function as its
        ``side_effect``, so calls still go through but are counted.
        """
        one_min_ago = before_now(minutes=1).isoformat()
        event_1 = self._store_fingerprinted_event("group-1", one_min_ago)
        event_2 = self._store_fingerprinted_event("group-2", one_min_ago)

        params = [
            self._params_for_group(event_1.group.id),
            self._params_for_group(event_2.group.id),
        ]
        expected = [
            {(event_1.group.id, event_1.event_id)},
            {(event_2.group.id, event_2.event_id)},
        ]

        # Each call gets its own deep copy of the params.
        results = snuba.bulk_raw_query(
            copy.deepcopy(params),
            use_cache=True,
        )
        assert self._group_event_pairs(results) == expected
        assert _bulk_snuba_query.call_count == 1
        _bulk_snuba_query.reset_mock()

        # Make sure this doesn't appear in the cached results
        self._store_fingerprinted_event("group-2", one_min_ago, message="hello there")

        results = snuba.bulk_raw_query(
            copy.deepcopy(params),
            use_cache=True,
        )
        assert self._group_event_pairs(results) == expected
        assert _bulk_snuba_query.call_count == 0
|