test_snuba.py 7.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203
  1. import copy
  2. import time
  3. import uuid
  4. from datetime import datetime, timedelta
  5. from unittest import mock
  6. import pytest
  7. from django.utils import timezone
  8. from snuba_sdk.column import InvalidColumnError
  9. from sentry.testutils.cases import SnubaTestCase, TestCase
  10. from sentry.testutils.helpers.datetime import before_now
  11. from sentry.utils import snuba
  12. class SnubaTest(TestCase, SnubaTestCase):
  13. def _insert_event_for_time(self, ts, hash="a" * 32, group_id=None):
  14. self.snuba_insert(
  15. (
  16. 2,
  17. "insert",
  18. {
  19. "event_id": uuid.uuid4().hex,
  20. "primary_hash": hash,
  21. "group_id": group_id if group_id else int(hash[:16], 16),
  22. "project_id": self.project.id,
  23. "message": "message",
  24. "platform": "python",
  25. "datetime": ts.strftime("%Y-%m-%dT%H:%M:%S.%fZ"),
  26. "data": {"received": time.mktime(ts.timetuple())},
  27. },
  28. {},
  29. )
  30. )
  31. def test(self) -> None:
  32. "This is just a simple 'hello, world' example test."
  33. now = datetime.now()
  34. self.snuba_insert(
  35. (
  36. 2,
  37. "insert",
  38. {
  39. "event_id": "a" * 32,
  40. "primary_hash": "1" * 32,
  41. "group_id": 1,
  42. "project_id": self.project.id,
  43. "message": "message",
  44. "platform": "python",
  45. "datetime": now.strftime("%Y-%m-%dT%H:%M:%S.%fZ"),
  46. "data": {"received": time.mktime(now.timetuple())},
  47. },
  48. {},
  49. )
  50. )
  51. assert snuba.query(
  52. start=now - timedelta(days=1),
  53. end=now + timedelta(days=1),
  54. groupby=["project_id"],
  55. filter_keys={"project_id": [self.project.id]},
  56. referrer="testing.test",
  57. tenant_ids={"referrer": "testing.test", "organization_id": 1},
  58. ) == {self.project.id: 1}
  59. def test_fail(self) -> None:
  60. now = datetime.now()
  61. with pytest.raises(InvalidColumnError):
  62. snuba.query(
  63. start=now - timedelta(days=1),
  64. end=now + timedelta(days=1),
  65. filter_keys={"project_id": [self.project.id]},
  66. groupby=[")("],
  67. referrer="testing.test",
  68. )
  69. def test_organization_retention_respected(self) -> None:
  70. base_time = timezone.now()
  71. self._insert_event_for_time(base_time - timedelta(minutes=1))
  72. self._insert_event_for_time(base_time - timedelta(days=2))
  73. def _get_event_count():
  74. # attempt to query back 90 days
  75. return snuba.query(
  76. start=base_time - timedelta(days=90),
  77. end=base_time + timedelta(days=1),
  78. groupby=["project_id"],
  79. filter_keys={"project_id": [self.project.id]},
  80. referrer="testing.test",
  81. tenant_ids={"referrer": "testing.test", "organization_id": 1},
  82. )
  83. assert _get_event_count() == {self.project.id: 2}
  84. with self.options({"system.event-retention-days": 1}):
  85. assert _get_event_count() == {self.project.id: 1}
  86. def test_organization_retention_larger_than_end_date(self) -> None:
  87. base_time = timezone.now()
  88. with self.options({"system.event-retention-days": 1}):
  89. assert (
  90. snuba.query(
  91. start=base_time - timedelta(days=90),
  92. end=base_time - timedelta(days=60),
  93. groupby=["project_id"],
  94. filter_keys={"project_id": [self.project.id]},
  95. referrer="testing.test",
  96. )
  97. == {}
  98. )
  99. class BulkRawQueryTest(TestCase, SnubaTestCase):
  100. def test_simple(self) -> None:
  101. one_min_ago = before_now(minutes=1).isoformat()
  102. event_1 = self.store_event(
  103. data={"fingerprint": ["group-1"], "message": "hello", "timestamp": one_min_ago},
  104. project_id=self.project.id,
  105. )
  106. event_2 = self.store_event(
  107. data={"fingerprint": ["group-2"], "message": "hello", "timestamp": one_min_ago},
  108. project_id=self.project.id,
  109. )
  110. results = snuba.bulk_raw_query(
  111. [
  112. snuba.SnubaQueryParams(
  113. start=timezone.now() - timedelta(days=1),
  114. end=timezone.now(),
  115. selected_columns=["event_id", "group_id", "timestamp"],
  116. filter_keys={"project_id": [self.project.id], "group_id": [event_1.group.id]},
  117. tenant_ids={"referrer": "testing.test", "organization_id": 1},
  118. ),
  119. snuba.SnubaQueryParams(
  120. start=timezone.now() - timedelta(days=1),
  121. end=timezone.now(),
  122. selected_columns=["event_id", "group_id", "timestamp"],
  123. filter_keys={"project_id": [self.project.id], "group_id": [event_2.group.id]},
  124. tenant_ids={"referrer": "testing.test", "organization_id": 1},
  125. ),
  126. ],
  127. )
  128. assert [{(item["group_id"], item["event_id"]) for item in r["data"]} for r in results] == [
  129. {(event_1.group.id, event_1.event_id)},
  130. {(event_2.group.id, event_2.event_id)},
  131. ]
  132. @mock.patch("sentry.utils.snuba._bulk_snuba_query", side_effect=snuba._bulk_snuba_query)
  133. def test_cache(self, _bulk_snuba_query):
  134. one_min_ago = before_now(minutes=1).isoformat()
  135. event_1 = self.store_event(
  136. data={"fingerprint": ["group-1"], "message": "hello", "timestamp": one_min_ago},
  137. project_id=self.project.id,
  138. )
  139. event_2 = self.store_event(
  140. data={"fingerprint": ["group-2"], "message": "hello", "timestamp": one_min_ago},
  141. project_id=self.project.id,
  142. )
  143. params = [
  144. snuba.SnubaQueryParams(
  145. start=timezone.now() - timedelta(days=1),
  146. end=timezone.now(),
  147. selected_columns=["event_id", "group_id", "timestamp"],
  148. filter_keys={"project_id": [self.project.id], "group_id": [event_1.group.id]},
  149. tenant_ids={"referrer": "testing.test", "organization_id": 1},
  150. ),
  151. snuba.SnubaQueryParams(
  152. start=timezone.now() - timedelta(days=1),
  153. end=timezone.now(),
  154. selected_columns=["event_id", "group_id", "timestamp"],
  155. filter_keys={"project_id": [self.project.id], "group_id": [event_2.group.id]},
  156. tenant_ids={"referrer": "testing.test", "organization_id": 1},
  157. ),
  158. ]
  159. results = snuba.bulk_raw_query(
  160. copy.deepcopy(params),
  161. use_cache=True,
  162. )
  163. assert [{(item["group_id"], item["event_id"]) for item in r["data"]} for r in results] == [
  164. {(event_1.group.id, event_1.event_id)},
  165. {(event_2.group.id, event_2.event_id)},
  166. ]
  167. assert _bulk_snuba_query.call_count == 1
  168. _bulk_snuba_query.reset_mock()
  169. # # Make sure this doesn't appear in the cached results
  170. self.store_event(
  171. data={"fingerprint": ["group-2"], "message": "hello there", "timestamp": one_min_ago},
  172. project_id=self.project.id,
  173. )
  174. results = snuba.bulk_raw_query(
  175. copy.deepcopy(params),
  176. use_cache=True,
  177. )
  178. assert [{(item["group_id"], item["event_id"]) for item in r["data"]} for r in results] == [
  179. {(event_1.group.id, event_1.event_id)},
  180. {(event_2.group.id, event_2.event_id)},
  181. ]
  182. assert _bulk_snuba_query.call_count == 0