test_organization_events_stats_mep.py 23 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558
  1. from datetime import timedelta
  2. from unittest import mock
  3. import pytest
  4. from django.urls import reverse
  5. from sentry import options
  6. from sentry.testutils import MetricsEnhancedPerformanceTestCase
  7. from sentry.testutils.helpers.datetime import before_now, iso_format
  8. pytestmark = pytest.mark.sentry_metrics
  9. class OrganizationEventsStatsMetricsEnhancedPerformanceEndpointTest(
  10. MetricsEnhancedPerformanceTestCase
  11. ):
  12. endpoint = "sentry-api-0-organization-events-stats"
  13. METRIC_STRINGS = [
  14. "foo_transaction",
  15. "d:transactions/measurements.datacenter_memory@pebibyte",
  16. ]
  def setUp(self):
      """Log in the default user and prepare the fixtures shared by every test.

      ``day_ago`` is pinned to 10:00:00.000000 one day back and doubles as the
      default metric timestamp. The endpoint URL is resolved for the
      project's organization, and the feature flags that ``do_request``
      layers onto every request are stored on ``self.features``.
      """
      super().setUp()
      self.login_as(user=self.user)

      anchor = before_now(days=1).replace(hour=10, minute=0, second=0, microsecond=0)
      self.day_ago = anchor
      self.DEFAULT_METRIC_TIMESTAMP = anchor

      org_slug = self.project.organization.slug
      self.url = reverse(
          "sentry-api-0-organization-events-stats",
          kwargs={"organization_slug": org_slug},
      )
      self.features = {"organizations:performance-use-metrics": True}
  def do_request(self, data, url=None, features=None):
      """Issue a GET request with the required feature flags enabled.

      :param data: query parameters sent with the request.
      :param url: URL to request; ``self.url`` is used when ``None``.
      :param features: mapping of feature flags to enable; defaults to
          ``{"organizations:discover-basic": True}``. The flags in
          ``self.features`` are always layered on top.
      :returns: the response returned by ``self.client.get``.
      """
      if features is None:
          features = {"organizations:discover-basic": True}
      # Merge into a fresh dict so a caller-supplied mapping is never mutated
      # (an in-place ``update`` would leak ``self.features`` into the caller).
      enabled = {**features, **self.features}
      target = self.url if url is None else url
      with self.feature(enabled):
          return self.client.get(target, data=data, format="json")
  35. # These throughput tests should roughly match the ones in OrganizationEventsStatsEndpointTest
  def test_throughput_epm_hour_rollup(self):
      """epm()/tpm() with a 1h interval report events per minute for each hour."""
      # Number of events to store in each consecutive hour.
      per_hour = [6, 0, 6, 3, 0, 3]
      for hour_offset, total in enumerate(per_hour):
          for minute_offset in range(total):
              when = self.day_ago + timedelta(hours=hour_offset, minutes=minute_offset)
              self.store_transaction_metric(1, timestamp=when)

      # One-hour buckets expressed in minutes.
      minutes_per_bucket = 3600.0 / 60.0
      for axis in ["epm()", "tpm()"]:
          params = {
              "start": iso_format(self.day_ago),
              "end": iso_format(self.day_ago + timedelta(hours=6)),
              "interval": "1h",
              "yAxis": axis,
              "project": self.project.id,
              "dataset": "metricsEnhanced",
          }
          response = self.do_request(data=params)
          assert response.status_code == 200, response.content

          buckets = response.data["data"]
          assert len(buckets) == 6
          assert response.data["isMetricsData"]

          for expected_events, bucket in zip(per_hour, buckets[0:6]):
              assert bucket[1][0]["count"] == expected_events / minutes_per_bucket
  def test_throughput_epm_day_rollup(self):
      """epm()/tpm() with a 24h interval report events per minute over the day."""
      # Number of events to store in each consecutive hour.
      per_hour = [6, 0, 6, 3, 0, 3]
      for hour_offset, total in enumerate(per_hour):
          for minute_offset in range(total):
              when = self.day_ago + timedelta(hours=hour_offset, minutes=minute_offset)
              self.store_transaction_metric(1, timestamp=when)

      for axis in ["epm()", "tpm()"]:
          params = {
              "start": iso_format(self.day_ago),
              "end": iso_format(self.day_ago + timedelta(hours=24)),
              "interval": "24h",
              "yAxis": axis,
              "project": self.project.id,
              "dataset": "metricsEnhanced",
          }
          response = self.do_request(data=params)
          assert response.status_code == 200, response.content

          buckets = response.data["data"]
          assert len(buckets) == 2
          assert response.data["isMetricsData"]

          # Every stored event lands in the first bucket; a day has 86400 / 60 minutes.
          first_bucket = buckets[0]
          assert first_bucket[1][0]["count"] == sum(per_hour) / (86400.0 / 60.0)
  def test_throughput_epm_hour_rollup_offset_of_hour(self):
      """Hourly tpm()/epm() rates hold when the window starts 30 minutes past the hour."""
      # Number of events to store in each consecutive hour.
      per_hour = [6, 0, 6, 3, 0, 3]
      for hour_offset, total in enumerate(per_hour):
          for minute_offset in range(total):
              # Shift every event by half an hour to line up with the offset window.
              when = self.day_ago + timedelta(hours=hour_offset, minutes=minute_offset + 30)
              self.store_transaction_metric(1, timestamp=when)

      # One-hour buckets expressed in minutes.
      minutes_per_bucket = 3600.0 / 60.0
      for axis in ["tpm()", "epm()"]:
          params = {
              "start": iso_format(self.day_ago + timedelta(minutes=30)),
              "end": iso_format(self.day_ago + timedelta(hours=6, minutes=30)),
              "interval": "1h",
              "yAxis": axis,
              "project": self.project.id,
              "dataset": "metricsEnhanced",
          }
          response = self.do_request(data=params)
          assert response.status_code == 200, response.content

          buckets = response.data["data"]
          assert len(buckets) == 6
          assert response.data["isMetricsData"]

          for expected_events, bucket in zip(per_hour, buckets[0:6]):
              assert bucket[1][0]["count"] == expected_events / minutes_per_bucket
  def test_throughput_eps_minute_rollup(self):
      """eps()/tps() with a 1m interval report events per second for each minute."""
      # Number of events to store in each consecutive minute.
      per_minute = [6, 0, 6, 3, 0, 3]
      for minute_offset, total in enumerate(per_minute):
          for second_offset in range(total):
              when = self.day_ago + timedelta(minutes=minute_offset, seconds=second_offset)
              self.store_transaction_metric(1, timestamp=when)

      for axis in ["eps()", "tps()"]:
          params = {
              "start": iso_format(self.day_ago),
              "end": iso_format(self.day_ago + timedelta(minutes=6)),
              "interval": "1m",
              "yAxis": axis,
              "project": self.project.id,
              "dataset": "metricsEnhanced",
          }
          response = self.do_request(data=params)
          assert response.status_code == 200, response.content

          buckets = response.data["data"]
          assert len(buckets) == 6
          assert response.data["isMetricsData"]

          for expected_events, bucket in zip(per_minute, buckets[0:6]):
              assert bucket[1][0]["count"] == expected_events / 60.0
  def test_failure_rate(self):
      """failure_rate() is 0.5 for hours with one ok plus one failed event, else 0."""
      for hour_offset in range(6):
          when = self.day_ago + timedelta(hours=hour_offset, minutes=30)
          self.store_transaction_metric(1, tags={"transaction.status": "ok"}, timestamp=when)
          if hour_offset >= 3:
              # Only the first three hours also receive a failing transaction.
              continue
          self.store_transaction_metric(
              1, tags={"transaction.status": "internal_error"}, timestamp=when
          )

      params = {
          "start": iso_format(self.day_ago),
          "end": iso_format(self.day_ago + timedelta(hours=6)),
          "interval": "1h",
          "yAxis": ["failure_rate()"],
          "project": self.project.id,
          "dataset": "metricsEnhanced",
      }
      response = self.do_request(data=params)
      assert response.status_code == 200, response.content

      buckets = response.data["data"]
      assert len(buckets) == 6
      assert response.data["isMetricsData"]

      observed = [attrs for _, attrs in response.data["data"]]
      expected = [[{"count": 0.5}] for _ in range(3)] + [[{"count": 0}] for _ in range(3)]
      assert observed == expected
  def test_percentiles_multi_axis(self):
      """Two p75 axes in one request each return their own six-bucket series."""
      for hour_offset in range(6):
          when = self.day_ago + timedelta(hours=hour_offset, minutes=30)
          self.store_transaction_metric(111, timestamp=when)
          self.store_transaction_metric(222, metric="measurements.lcp", timestamp=when)

      params = {
          "start": iso_format(self.day_ago),
          "end": iso_format(self.day_ago + timedelta(hours=6)),
          "interval": "1h",
          "yAxis": ["p75(measurements.lcp)", "p75(transaction.duration)"],
          "project": self.project.id,
          "dataset": "metricsEnhanced",
      }
      response = self.do_request(data=params)
      assert response.status_code == 200, response.content

      lcp_series = response.data["p75(measurements.lcp)"]
      duration_series = response.data["p75(transaction.duration)"]

      for series in (duration_series, lcp_series):
          assert len(series["data"]) == 6
          assert series["isMetricsData"]

      # One sample per hour, so every bucket's p75 equals the stored value.
      for series, stored_value in ((duration_series, 111), (lcp_series, 222)):
          for bucket in series["data"]:
              assert bucket[1][0]["count"] == stored_value
  @mock.patch("sentry.snuba.metrics_enhanced_performance.timeseries_query", return_value={})
  def test_multiple_yaxis_only_one_query(self, mock_query):
      """A request with several y-axes calls the patched timeseries query exactly once."""
      params = {
          "project": self.project.id,
          "start": iso_format(self.day_ago),
          "end": iso_format(self.day_ago + timedelta(hours=2)),
          "interval": "1h",
          "yAxis": ["epm()", "eps()", "tpm()", "p50(transaction.duration)"],
          "dataset": "metricsEnhanced",
      }
      # The response is irrelevant here; only the number of query calls matters.
      self.do_request(data=params)

      assert mock_query.call_count == 1
  def test_aggregate_function_user_count(self):
      """count_unique(user) reports one user in each of the two hourly buckets."""
      # One "user" metric in each of the two requested hours.
      for offset in (timedelta(minutes=30), timedelta(hours=1, minutes=30)):
          self.store_transaction_metric(1, metric="user", timestamp=self.day_ago + offset)

      params = {
          "start": iso_format(self.day_ago),
          "end": iso_format(self.day_ago + timedelta(hours=2)),
          "interval": "1h",
          "yAxis": "count_unique(user)",
          "dataset": "metricsEnhanced",
      }
      response = self.do_request(data=params)
      assert response.status_code == 200, response.content
      assert response.data["isMetricsData"]

      observed = [attrs for _, attrs in response.data["data"]]
      assert observed == [[{"count": 1}], [{"count": 1}]]

      # The meta block must agree with the top-level flag.
      assert response.data["meta"]["isMetricsData"] == response.data["isMetricsData"]
  def test_non_mep_query_fallsback(self):
      """Check, per search query, whether the response is flagged as metrics data."""

      def served_from_metrics(query):
          # Run an epm() request with the given filter and report the flag.
          params = {
              "project": self.project.id,
              "start": iso_format(self.day_ago),
              "end": iso_format(self.day_ago + timedelta(hours=2)),
              "interval": "1h",
              "query": query,
              "yAxis": ["epm()"],
              "dataset": "metricsEnhanced",
          }
          response = self.do_request(data=params)
          assert response.status_code == 200, response.content
          return response.data["isMetricsData"]

      # (query, expected isMetricsData truthiness, failure label)
      cases = [
          ("", True, "empty query"),
          ("event.type:transaction", True, "event type transaction"),
          ("event.type:error", False, "event type error"),
          ("transaction.duration:<15min", False, "outlier filter"),
          ("epm():>0.01", True, "throughput filter"),
          ("event.type:transaction OR event.type:error", False, "boolean with non-mep filter"),
          (
              "event.type:transaction OR transaction:foo_transaction",
              True,
              "boolean with mep filter",
          ),
      ]
      for query, expect_metrics, label in cases:
          assert bool(served_from_metrics(query)) == expect_metrics, label
  def test_having_condition_with_preventing_aggregates(self):
      """An aggregate filter with preventMetricAggregates=1 is not answered from metrics."""
      params = {
          "project": self.project.id,
          "start": iso_format(self.day_ago),
          "end": iso_format(self.day_ago + timedelta(hours=2)),
          "interval": "1h",
          "query": "p95():<5s",
          "yAxis": ["epm()"],
          "dataset": "metricsEnhanced",
          "preventMetricAggregates": "1",
      }
      response = self.do_request(data=params)

      assert response.status_code == 200, response.content
      payload = response.data
      assert not payload["isMetricsData"]
      # The meta block must agree with the top-level flag.
      assert payload["meta"]["isMetricsData"] == payload["isMetricsData"]
  def test_explicit_not_mep(self):
      """An explicit ``metricsEnhanced=0`` keeps a MEP-able query off metrics data."""
      response = self.do_request(
          data={
              "project": self.project.id,
              "start": iso_format(self.day_ago),
              "end": iso_format(self.day_ago + timedelta(hours=2)),
              "interval": "1h",
              # Should be a mep able query
              "query": "",
              "yAxis": ["epm()"],
              "metricsEnhanced": "0",
          },
      )

      assert response.status_code == 200, response.content
      # This must be an assertion: a ``return`` here would end the test
      # without checking the flag and would skip the meta check below.
      assert not response.data["isMetricsData"]
      meta = response.data["meta"]
      assert meta["isMetricsData"] == response.data["isMetricsData"]
  def test_sum_transaction_duration(self):
      """sum(transaction.duration) adds up durations per hour with duration/millisecond meta."""
      # (duration, offset from day_ago): one sample in hour 0, two in hour 1.
      samples = [
          (123, timedelta(minutes=30)),
          (456, timedelta(hours=1, minutes=30)),
          (789, timedelta(hours=1, minutes=30)),
      ]
      for duration, offset in samples:
          self.store_transaction_metric(duration, timestamp=self.day_ago + offset)

      params = {
          "start": iso_format(self.day_ago),
          "end": iso_format(self.day_ago + timedelta(hours=2)),
          "interval": "1h",
          "yAxis": "sum(transaction.duration)",
          "dataset": "metricsEnhanced",
      }
      response = self.do_request(data=params)
      assert response.status_code == 200, response.content
      assert response.data["isMetricsData"]

      observed = [attrs for _, attrs in response.data["data"]]
      assert observed == [[{"count": 123}], [{"count": 1245}]]

      meta = response.data["meta"]
      assert meta["isMetricsData"] == response.data["isMetricsData"]
      assert meta["fields"] == {"time": "date", "sum_transaction_duration": "duration"}
      assert meta["units"] == {"time": None, "sum_transaction_duration": "millisecond"}
  def test_custom_measurement(self):
      """sum() over a custom measurement aggregates per hour with size/pebibyte meta."""
      # (value, offset from day_ago): one sample in hour 0, two in hour 1.
      samples = [
          (123, timedelta(minutes=30)),
          (456, timedelta(hours=1, minutes=30)),
          (789, timedelta(hours=1, minutes=30)),
      ]
      for value, offset in samples:
          self.store_transaction_metric(
              value,
              metric="measurements.bytes_transfered",
              internal_metric="d:transactions/measurements.datacenter_memory@pebibyte",
              entity="metrics_distributions",
              tags={"transaction": "foo_transaction"},
              timestamp=self.day_ago + offset,
          )

      params = {
          "start": iso_format(self.day_ago),
          "end": iso_format(self.day_ago + timedelta(hours=2)),
          "interval": "1h",
          "yAxis": "sum(measurements.datacenter_memory)",
          "dataset": "metricsEnhanced",
      }
      response = self.do_request(data=params)
      assert response.status_code == 200, response.content
      assert response.data["isMetricsData"]

      observed = [attrs for _, attrs in response.data["data"]]
      assert observed == [[{"count": 123}], [{"count": 1245}]]

      meta = response.data["meta"]
      assert meta["isMetricsData"] == response.data["isMetricsData"]
      assert meta["fields"] == {"time": "date", "sum_measurements_datacenter_memory": "size"}
      assert meta["units"] == {"time": None, "sum_measurements_datacenter_memory": "pebibyte"}
  def test_does_not_fallback_if_custom_metric_is_out_of_request_time_range(self):
      """p99 over a custom kibibyte measurement is served from metrics with size meta."""
      # NOTE(review): the sample is stored at day_ago + 1h, which lies inside
      # the requested [day_ago, day_ago + 2h] window despite the test name;
      # confirm the intended timestamp.
      self.store_transaction_metric(
          123,
          timestamp=self.day_ago + timedelta(hours=1),
          internal_metric="d:transactions/measurements.custom@kibibyte",
          entity="metrics_distributions",
      )
      response = self.do_request(
          data={
              "start": iso_format(self.day_ago),
              "end": iso_format(self.day_ago + timedelta(hours=2)),
              "interval": "1h",
              "yAxis": "p99(measurements.custom)",
              "dataset": "metricsEnhanced",
          },
      )

      # Check the status before touching the payload so a failed request
      # reports ``response.content`` instead of a KeyError on "meta".
      assert response.status_code == 200, response.content
      meta = response.data["meta"]
      assert response.data["isMetricsData"]
      assert meta["isMetricsData"]
      assert meta["fields"] == {"time": "date", "p99_measurements_custom": "size"}
      assert meta["units"] == {"time": None, "p99_measurements_custom": "kibibyte"}
  def test_multi_yaxis_custom_measurement(self):
      """sum and p50 of a custom measurement share one meta covering both columns."""
      # (value, offset from day_ago): one sample in hour 0, two in hour 1.
      samples = [
          (123, timedelta(minutes=30)),
          (456, timedelta(hours=1, minutes=30)),
          (789, timedelta(hours=1, minutes=30)),
      ]
      for value, offset in samples:
          self.store_transaction_metric(
              value,
              metric="measurements.bytes_transfered",
              internal_metric="d:transactions/measurements.datacenter_memory@pebibyte",
              entity="metrics_distributions",
              tags={"transaction": "foo_transaction"},
              timestamp=self.day_ago + offset,
          )

      params = {
          "start": iso_format(self.day_ago),
          "end": iso_format(self.day_ago + timedelta(hours=2)),
          "interval": "1h",
          "yAxis": [
              "sum(measurements.datacenter_memory)",
              "p50(measurements.datacenter_memory)",
          ],
          "dataset": "metricsEnhanced",
      }
      response = self.do_request(data=params)
      assert response.status_code == 200, response.content

      sum_series = response.data["sum(measurements.datacenter_memory)"]
      p50_series = response.data["p50(measurements.datacenter_memory)"]
      assert sum_series["isMetricsData"]
      assert p50_series["isMetricsData"]

      assert [attrs for _, attrs in sum_series["data"]] == [
          [{"count": 123}],
          [{"count": 1245}],
      ]
      assert [attrs for _, attrs in p50_series["data"]] == [
          [{"count": 123}],
          [{"count": 622.5}],
      ]

      # Each axis carries a meta block describing both requested columns.
      expected_fields = {
          "time": "date",
          "sum_measurements_datacenter_memory": "size",
          "p50_measurements_datacenter_memory": "size",
      }
      expected_units = {
          "time": None,
          "sum_measurements_datacenter_memory": "pebibyte",
          "p50_measurements_datacenter_memory": "pebibyte",
      }
      for series in (sum_series, p50_series):
          series_meta = series["meta"]
          assert series_meta["isMetricsData"] == series["isMetricsData"]
          assert series_meta["fields"] == expected_fields
          assert series_meta["units"] == expected_units
  def test_dataset_metrics_does_not_fallback(self):
      """With dataset=metrics, a transaction.duration filter is answered with HTTP 400."""
      # (duration, offset from day_ago): one sample in hour 0, two in hour 1.
      samples = [
          (123, timedelta(minutes=30)),
          (456, timedelta(hours=1, minutes=30)),
          (789, timedelta(hours=1, minutes=30)),
      ]
      for duration, offset in samples:
          self.store_transaction_metric(duration, timestamp=self.day_ago + offset)

      params = {
          "start": iso_format(self.day_ago),
          "end": iso_format(self.day_ago + timedelta(hours=2)),
          "interval": "1h",
          "query": "transaction.duration:<5s",
          "yAxis": "sum(transaction.duration)",
          "dataset": "metrics",
      }
      response = self.do_request(data=params)

      assert response.status_code == 400, response.content
  def test_title_filter(self):
      """A ``title:`` filter matches the metric tagged with that transaction name."""
      self.store_transaction_metric(
          123,
          tags={"transaction": "foo_transaction"},
          timestamp=self.day_ago + timedelta(minutes=30),
      )

      params = {
          "start": iso_format(self.day_ago),
          "end": iso_format(self.day_ago + timedelta(hours=2)),
          "interval": "1h",
          "query": "title:foo_transaction",
          "yAxis": [
              "sum(transaction.duration)",
          ],
          "dataset": "metricsEnhanced",
      }
      response = self.do_request(data=params)
      assert response.status_code == 200, response.content

      # Only the first hour holds a sample; the second bucket is zero.
      observed = [attrs for _, attrs in response.data["data"]]
      assert observed == [[{"count": 123}], [{"count": 0}]]
  def test_search_query_if_environment_does_not_exist_on_indexer(self):
      """Filtering by environments absent from the stored metric yields zeroed, non-metrics data.

      Skipped when the ``sentry-metrics.performance.tags-values-are-strings``
      option is enabled.
      """
      if options.get("sentry-metrics.performance.tags-values-are-strings"):
          pytest.skip("test does not apply if tag values are in clickhouse")

      for env_name in ("prod", "dev"):
          self.create_environment(self.project, name=env_name)

      # The stored metric carries only a transaction tag, no environment.
      self.store_transaction_metric(
          123,
          tags={"transaction": "foo_transaction"},
          timestamp=self.day_ago + timedelta(minutes=30),
      )

      params = {
          "start": iso_format(self.day_ago),
          "end": iso_format(self.day_ago + timedelta(hours=2)),
          "interval": "1h",
          "yAxis": [
              "sum(transaction.duration)",
          ],
          "environment": ["prod", "dev"],
          "dataset": "metricsEnhanced",
      }
      response = self.do_request(data=params)
      assert response.status_code == 200, response.content

      observed = [attrs for _, attrs in response.data["data"]]
      assert observed == [[{"count": 0}], [{"count": 0}]]
      assert not response.data["isMetricsData"]