test_backend.py 85 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
722782279
  1. import uuid
  2. from datetime import datetime, timedelta
  3. from hashlib import md5
  4. from unittest import mock
  5. import pytest
  6. import pytz
  7. from django.utils import timezone
  8. from sentry import options
  9. from sentry.api.issue_search import convert_query_values, issue_search_config, parse_search_query
  10. from sentry.exceptions import InvalidSearchQuery
  11. from sentry.models import (
  12. Environment,
  13. Group,
  14. GroupAssignee,
  15. GroupBookmark,
  16. GroupEnvironment,
  17. GroupHistoryStatus,
  18. GroupStatus,
  19. GroupSubscription,
  20. Integration,
  21. record_group_history,
  22. )
  23. from sentry.models.groupowner import GroupOwner
  24. from sentry.search.snuba.backend import (
  25. CdcEventsDatasetSnubaSearchBackend,
  26. EventsDatasetSnubaSearchBackend,
  27. )
  28. from sentry.search.snuba.executors import InvalidQueryForExecutor
  29. from sentry.testutils import SnubaTestCase, TestCase, xfail_if_not_postgres
  30. from sentry.testutils.helpers.datetime import before_now, iso_format
  31. from sentry.utils.snuba import SENTRY_SNUBA_MAP, Dataset, SnubaError
  32. def date_to_query_format(date):
  33. return date.strftime("%Y-%m-%dT%H:%M:%S")
  34. class EventsSnubaSearchTest(TestCase, SnubaTestCase):
  35. @property
  36. def backend(self):
  37. return EventsDatasetSnubaSearchBackend()
  38. def setUp(self):
  39. super().setUp()
  40. self.base_datetime = (datetime.utcnow() - timedelta(days=3)).replace(tzinfo=pytz.utc)
  41. event1_timestamp = iso_format(self.base_datetime - timedelta(days=21))
  42. self.event1 = self.store_event(
  43. data={
  44. "fingerprint": ["put-me-in-group1"],
  45. "event_id": "a" * 32,
  46. "message": "foo. Also, this message is intended to be greater than 256 characters so that we can put some unique string identifier after that point in the string. The purpose of this is in order to verify we are using snuba to search messages instead of Postgres (postgres truncates at 256 characters and clickhouse does not). santryrox.",
  47. "environment": "production",
  48. "tags": {"server": "example.com", "sentry:user": "event1@example.com"},
  49. "timestamp": event1_timestamp,
  50. "stacktrace": {"frames": [{"module": "group1"}]},
  51. },
  52. project_id=self.project.id,
  53. )
  54. self.event3 = self.store_event(
  55. data={
  56. "fingerprint": ["put-me-in-group1"],
  57. "event_id": "c" * 32,
  58. "message": "group1",
  59. "environment": "production",
  60. "tags": {"server": "example.com", "sentry:user": "event3@example.com"},
  61. "timestamp": iso_format(self.base_datetime),
  62. "stacktrace": {"frames": [{"module": "group1"}]},
  63. },
  64. project_id=self.project.id,
  65. )
  66. self.group1 = Group.objects.get(id=self.event1.group.id)
  67. assert self.group1.id == self.event1.group.id
  68. assert self.group1.id == self.event3.group.id
  69. assert self.group1.first_seen == self.event1.datetime
  70. assert self.group1.last_seen == self.event3.datetime
  71. self.group1.times_seen = 5
  72. self.group1.status = GroupStatus.UNRESOLVED
  73. self.group1.save()
  74. self.store_group(self.group1)
  75. self.event2 = self.store_event(
  76. data={
  77. "fingerprint": ["put-me-in-group2"],
  78. "event_id": "b" * 32,
  79. "timestamp": iso_format(self.base_datetime - timedelta(days=20)),
  80. "message": "bar",
  81. "stacktrace": {"frames": [{"module": "group2"}]},
  82. "environment": "staging",
  83. "tags": {
  84. "server": "example.com",
  85. "url": "http://example.com",
  86. "sentry:user": "event2@example.com",
  87. },
  88. },
  89. project_id=self.project.id,
  90. )
  91. self.group2 = Group.objects.get(id=self.event2.group.id)
  92. assert self.group2.id == self.event2.group.id
  93. assert self.group2.first_seen == self.group2.last_seen == self.event2.datetime
  94. self.group2.status = GroupStatus.RESOLVED
  95. self.group2.times_seen = 10
  96. self.group2.save()
  97. self.store_group(self.group2)
  98. GroupBookmark.objects.create(user=self.user, group=self.group2, project=self.group2.project)
  99. GroupAssignee.objects.create(user=self.user, group=self.group2, project=self.group2.project)
  100. GroupSubscription.objects.create(
  101. user=self.user, group=self.group1, project=self.group1.project, is_active=True
  102. )
  103. GroupSubscription.objects.create(
  104. user=self.user, group=self.group2, project=self.group2.project, is_active=False
  105. )
  106. self.environments = {
  107. "production": self.event1.get_environment(),
  108. "staging": self.event2.get_environment(),
  109. }
  110. def store_event(self, data, *args, **kwargs):
  111. event = super().store_event(data, *args, **kwargs)
  112. environment_name = data.get("environment")
  113. if environment_name:
  114. GroupEnvironment.objects.filter(
  115. group_id=event.group_id,
  116. environment__name=environment_name,
  117. first_seen__gt=event.datetime,
  118. ).update(first_seen=event.datetime)
  119. return event
  120. def set_up_multi_project(self):
  121. self.project2 = self.create_project(organization=self.project.organization)
  122. self.event_p2 = self.store_event(
  123. data={
  124. "event_id": "a" * 32,
  125. "fingerprint": ["put-me-in-groupP2"],
  126. "timestamp": iso_format(self.base_datetime - timedelta(days=21)),
  127. "message": "foo",
  128. "stacktrace": {"frames": [{"module": "group_p2"}]},
  129. "tags": {"server": "example.com"},
  130. "environment": "production",
  131. },
  132. project_id=self.project2.id,
  133. )
  134. self.group_p2 = Group.objects.get(id=self.event_p2.group.id)
  135. self.group_p2.times_seen = 6
  136. self.group_p2.last_seen = self.base_datetime - timedelta(days=1)
  137. self.group_p2.save()
  138. self.store_group(self.group_p2)
  139. def create_group_with_integration_external_issue(self, environment="production"):
  140. event = self.store_event(
  141. data={
  142. "fingerprint": ["linked_group1"],
  143. "event_id": uuid.uuid4().hex,
  144. "timestamp": iso_format(self.base_datetime),
  145. "environment": environment,
  146. },
  147. project_id=self.project.id,
  148. )
  149. integration = Integration.objects.create(provider="example", name="Example")
  150. integration.add_organization(event.group.organization, self.user)
  151. self.create_integration_external_issue(
  152. group=event.group,
  153. integration=integration,
  154. key="APP-123",
  155. )
  156. return event.group
  157. def create_group_with_platform_external_issue(self, environment="production"):
  158. event = self.store_event(
  159. data={
  160. "fingerprint": ["linked_group2"],
  161. "event_id": uuid.uuid4().hex,
  162. "timestamp": iso_format(self.base_datetime),
  163. "environment": environment,
  164. },
  165. project_id=self.project.id,
  166. )
  167. self.create_platform_external_issue(
  168. group=event.group,
  169. service_type="sentry-app",
  170. display_name="App#issue-1",
  171. web_url="https://example.com/app/issues/1",
  172. )
  173. return event.group
  174. def build_search_filter(self, query, projects=None, user=None, environments=None):
  175. user = user if user is not None else self.user
  176. projects = projects if projects is not None else [self.project]
  177. return convert_query_values(parse_search_query(query), projects, user, environments)
  178. def make_query(
  179. self,
  180. projects=None,
  181. search_filter_query=None,
  182. environments=None,
  183. sort_by="date",
  184. limit=None,
  185. count_hits=False,
  186. date_from=None,
  187. date_to=None,
  188. ):
  189. search_filters = []
  190. projects = projects if projects is not None else [self.project]
  191. if search_filter_query is not None:
  192. search_filters = self.build_search_filter(
  193. search_filter_query, projects, environments=environments
  194. )
  195. kwargs = {}
  196. if limit is not None:
  197. kwargs["limit"] = limit
  198. return self.backend.query(
  199. projects,
  200. search_filters=search_filters,
  201. environments=environments,
  202. count_hits=count_hits,
  203. sort_by=sort_by,
  204. date_from=date_from,
  205. date_to=date_to,
  206. **kwargs,
  207. )
  208. def run_test_query_in_syntax(
  209. self, query, expected_groups, expected_negative_groups=None, environments=None
  210. ):
  211. results = self.make_query(search_filter_query=query, environments=environments)
  212. sort_key = lambda result: result.id
  213. print("results", results.results)
  214. assert sorted(results, key=sort_key) == sorted(expected_groups, key=sort_key)
  215. if expected_negative_groups is not None:
  216. results = self.make_query(search_filter_query=f"!{query}")
  217. assert sorted(results, key=sort_key) == sorted(expected_negative_groups, key=sort_key)
  218. def test_query(self):
  219. results = self.make_query(search_filter_query="foo")
  220. assert set(results) == {self.group1}
  221. results = self.make_query(search_filter_query="bar")
  222. assert set(results) == {self.group2}
  223. def test_query_multi_project(self):
  224. self.set_up_multi_project()
  225. results = self.make_query([self.project, self.project2], search_filter_query="foo")
  226. assert set(results) == {self.group1, self.group_p2}
  227. def test_query_with_environment(self):
  228. results = self.make_query(
  229. environments=[self.environments["production"]], search_filter_query="foo"
  230. )
  231. assert set(results) == {self.group1}
  232. results = self.make_query(
  233. environments=[self.environments["production"]], search_filter_query="bar"
  234. )
  235. assert set(results) == set()
  236. results = self.make_query(
  237. environments=[self.environments["staging"]], search_filter_query="bar"
  238. )
  239. assert set(results) == {self.group2}
  240. def test_query_for_text_in_long_message(self):
  241. results = self.make_query(
  242. [self.project],
  243. environments=[self.environments["production"]],
  244. search_filter_query="santryrox",
  245. )
  246. assert set(results) == {self.group1}
  247. def test_multi_environments(self):
  248. self.set_up_multi_project()
  249. results = self.make_query(
  250. [self.project, self.project2],
  251. environments=[self.environments["production"], self.environments["staging"]],
  252. )
  253. assert set(results) == {self.group1, self.group2, self.group_p2}
  254. def test_query_with_environment_multi_project(self):
  255. self.set_up_multi_project()
  256. results = self.make_query(
  257. [self.project, self.project2],
  258. environments=[self.environments["production"]],
  259. search_filter_query="foo",
  260. )
  261. assert set(results) == {self.group1, self.group_p2}
  262. results = self.make_query(
  263. [self.project, self.project2],
  264. environments=[self.environments["production"]],
  265. search_filter_query="bar",
  266. )
  267. assert set(results) == set()
  268. def test_sort(self):
  269. results = self.make_query(sort_by="date")
  270. assert list(results) == [self.group1, self.group2]
  271. results = self.make_query(sort_by="new")
  272. assert list(results) == [self.group2, self.group1]
  273. results = self.make_query(sort_by="freq")
  274. assert list(results) == [self.group1, self.group2]
  275. results = self.make_query(sort_by="priority")
  276. assert list(results) == [self.group1, self.group2]
  277. results = self.make_query(sort_by="user")
  278. assert list(results) == [self.group1, self.group2]
  279. def test_sort_with_environment(self):
  280. for dt in [
  281. self.group1.first_seen + timedelta(days=1),
  282. self.group1.first_seen + timedelta(days=2),
  283. self.group1.last_seen + timedelta(days=1),
  284. ]:
  285. self.store_event(
  286. data={
  287. "fingerprint": ["put-me-in-group2"],
  288. "timestamp": iso_format(dt),
  289. "stacktrace": {"frames": [{"module": "group2"}]},
  290. "environment": "production",
  291. "message": "group2",
  292. },
  293. project_id=self.project.id,
  294. )
  295. results = self.make_query(environments=[self.environments["production"]], sort_by="date")
  296. assert list(results) == [self.group2, self.group1]
  297. results = self.make_query(environments=[self.environments["production"]], sort_by="new")
  298. assert list(results) == [self.group2, self.group1]
  299. results = self.make_query(environments=[self.environments["production"]], sort_by="freq")
  300. assert list(results) == [self.group2, self.group1]
  301. results = self.make_query(
  302. environments=[self.environments["production"]], sort_by="priority"
  303. )
  304. assert list(results) == [self.group2, self.group1]
  305. results = self.make_query(environments=[self.environments["production"]], sort_by="user")
  306. assert list(results) == [self.group1, self.group2]
  307. def test_status(self):
  308. results = self.make_query(search_filter_query="is:unresolved")
  309. assert set(results) == {self.group1}
  310. results = self.make_query(search_filter_query="is:resolved")
  311. assert set(results) == {self.group2}
  312. event_3 = self.store_event(
  313. data={
  314. "fingerprint": ["put-me-in-group3"],
  315. "event_id": "c" * 32,
  316. "timestamp": iso_format(self.base_datetime - timedelta(days=20)),
  317. },
  318. project_id=self.project.id,
  319. )
  320. group_3 = event_3.group
  321. group_3.status = GroupStatus.MUTED
  322. group_3.save()
  323. self.run_test_query_in_syntax(
  324. "status:[unresolved, resolved]", [self.group1, self.group2], [group_3]
  325. )
  326. self.run_test_query_in_syntax(
  327. "status:[resolved, muted]", [self.group2, group_3], [self.group1]
  328. )
  329. def test_status_with_environment(self):
  330. results = self.make_query(
  331. environments=[self.environments["production"]], search_filter_query="is:unresolved"
  332. )
  333. assert set(results) == {self.group1}
  334. results = self.make_query(
  335. environments=[self.environments["staging"]], search_filter_query="is:resolved"
  336. )
  337. assert set(results) == {self.group2}
  338. results = self.make_query(
  339. environments=[self.environments["production"]], search_filter_query="is:resolved"
  340. )
  341. assert set(results) == set()
  342. def test_tags(self):
  343. results = self.make_query(search_filter_query="environment:staging")
  344. assert set(results) == {self.group2}
  345. results = self.make_query(search_filter_query="environment:example.com")
  346. assert set(results) == set()
  347. results = self.make_query(search_filter_query="has:environment")
  348. assert set(results) == {self.group2, self.group1}
  349. results = self.make_query(search_filter_query="environment:staging server:example.com")
  350. assert set(results) == {self.group2}
  351. results = self.make_query(search_filter_query='url:"http://example.com"')
  352. assert set(results) == {self.group2}
  353. results = self.make_query(search_filter_query="environment:staging has:server")
  354. assert set(results) == {self.group2}
  355. results = self.make_query(search_filter_query="environment:staging server:bar.example.com")
  356. assert set(results) == set()
  357. def test_tags_with_environment(self):
  358. results = self.make_query(
  359. environments=[self.environments["production"]], search_filter_query="server:example.com"
  360. )
  361. assert set(results) == {self.group1}
  362. results = self.make_query(
  363. environments=[self.environments["staging"]], search_filter_query="server:example.com"
  364. )
  365. assert set(results) == {self.group2}
  366. results = self.make_query(
  367. environments=[self.environments["staging"]], search_filter_query="has:server"
  368. )
  369. assert set(results) == {self.group2}
  370. results = self.make_query(
  371. environments=[self.environments["production"]],
  372. search_filter_query='url:"http://example.com"',
  373. )
  374. assert set(results) == set()
  375. results = self.make_query(
  376. environments=[self.environments["staging"]],
  377. search_filter_query='url:"http://example.com"',
  378. )
  379. assert set(results) == {self.group2}
  380. results = self.make_query(
  381. environments=[self.environments["staging"]],
  382. search_filter_query="server:bar.example.com",
  383. )
  384. assert set(results) == set()
  385. def test_bookmarked_by(self):
  386. results = self.make_query(search_filter_query="bookmarks:%s" % self.user.username)
  387. assert set(results) == {self.group2}
  388. def test_bookmarked_by_in_syntax(self):
  389. self.run_test_query_in_syntax(
  390. f"bookmarks:[{self.user.username}]", [self.group2], [self.group1]
  391. )
  392. user_2 = self.create_user()
  393. GroupBookmark.objects.create(user=user_2, group=self.group1, project=self.group2.project)
  394. self.run_test_query_in_syntax(
  395. f"bookmarks:[{self.user.username}, {user_2.username}]", [self.group2, self.group1], []
  396. )
  397. def test_bookmarked_by_with_environment(self):
  398. results = self.make_query(
  399. environments=[self.environments["staging"]],
  400. search_filter_query="bookmarks:%s" % self.user.username,
  401. )
  402. assert set(results) == {self.group2}
  403. results = self.make_query(
  404. environments=[self.environments["production"]],
  405. search_filter_query="bookmarks:%s" % self.user.username,
  406. )
  407. assert set(results) == set()
  408. def test_search_filter_query_with_custom_priority_tag(self):
  409. priority = "high"
  410. self.store_event(
  411. data={
  412. "fingerprint": ["put-me-in-group2"],
  413. "timestamp": iso_format(self.group2.first_seen + timedelta(days=1)),
  414. "stacktrace": {"frames": [{"module": "group2"}]},
  415. "message": "group2",
  416. "tags": {"priority": priority},
  417. },
  418. project_id=self.project.id,
  419. )
  420. results = self.make_query(search_filter_query="priority:%s" % priority)
  421. assert set(results) == {self.group2}
  422. def test_search_filter_query_with_custom_priority_tag_and_priority_sort(self):
  423. priority = "high"
  424. for i in range(1, 3):
  425. self.store_event(
  426. data={
  427. "fingerprint": ["put-me-in-group1"],
  428. "timestamp": iso_format(self.group2.last_seen + timedelta(days=i)),
  429. "stacktrace": {"frames": [{"module": "group1"}]},
  430. "message": "group1",
  431. "tags": {"priority": priority},
  432. },
  433. project_id=self.project.id,
  434. )
  435. self.store_event(
  436. data={
  437. "fingerprint": ["put-me-in-group2"],
  438. "timestamp": iso_format(self.group2.last_seen + timedelta(days=2)),
  439. "stacktrace": {"frames": [{"module": "group2"}]},
  440. "message": "group2",
  441. "tags": {"priority": priority},
  442. },
  443. project_id=self.project.id,
  444. )
  445. results = self.make_query(search_filter_query="priority:%s" % priority, sort_by="priority")
  446. assert list(results) == [self.group1, self.group2]
  447. def test_search_tag_overlapping_with_internal_fields(self):
  448. # Using a tag of email overlaps with the promoted user.email column in events.
  449. # We don't want to bypass public schema limits in issue search.
  450. self.store_event(
  451. data={
  452. "fingerprint": ["put-me-in-group2"],
  453. "timestamp": iso_format(self.group2.first_seen + timedelta(days=1)),
  454. "stacktrace": {"frames": [{"module": "group2"}]},
  455. "message": "group2",
  456. "tags": {"email": "tags@example.com"},
  457. },
  458. project_id=self.project.id,
  459. )
  460. results = self.make_query(search_filter_query="email:tags@example.com")
  461. assert set(results) == {self.group2}
  462. def test_project(self):
  463. results = self.make_query([self.create_project(name="other")])
  464. assert set(results) == set()
  465. def test_pagination(self):
  466. for options_set in [
  467. {"snuba.search.min-pre-snuba-candidates": None},
  468. {"snuba.search.min-pre-snuba-candidates": 500},
  469. ]:
  470. with self.options(options_set):
  471. results = self.backend.query([self.project], limit=1, sort_by="date")
  472. assert set(results) == {self.group1}
  473. assert not results.prev.has_results
  474. assert results.next.has_results
  475. results = self.backend.query(
  476. [self.project], cursor=results.next, limit=1, sort_by="date"
  477. )
  478. assert set(results) == {self.group2}
  479. assert results.prev.has_results
  480. assert not results.next.has_results
  481. # note: previous cursor
  482. results = self.backend.query(
  483. [self.project], cursor=results.prev, limit=1, sort_by="date"
  484. )
  485. assert set(results) == {self.group1}
  486. assert results.prev.has_results
  487. assert results.next.has_results
  488. # note: previous cursor, paging too far into 0 results
  489. results = self.backend.query(
  490. [self.project], cursor=results.prev, limit=1, sort_by="date"
  491. )
  492. assert set(results) == set()
  493. assert not results.prev.has_results
  494. assert results.next.has_results
  495. results = self.backend.query(
  496. [self.project], cursor=results.next, limit=1, sort_by="date"
  497. )
  498. assert set(results) == {self.group1}
  499. assert results.prev.has_results
  500. assert results.next.has_results
  501. results = self.backend.query(
  502. [self.project], cursor=results.next, limit=1, sort_by="date"
  503. )
  504. assert set(results) == {self.group2}
  505. assert results.prev.has_results
  506. assert not results.next.has_results
  507. results = self.backend.query(
  508. [self.project], cursor=results.next, limit=1, sort_by="date"
  509. )
  510. assert set(results) == set()
  511. assert results.prev.has_results
  512. assert not results.next.has_results
  513. def test_pagination_with_environment(self):
  514. for dt in [
  515. self.group1.first_seen + timedelta(days=1),
  516. self.group1.first_seen + timedelta(days=2),
  517. self.group1.last_seen + timedelta(days=1),
  518. ]:
  519. self.store_event(
  520. data={
  521. "fingerprint": ["put-me-in-group2"],
  522. "timestamp": iso_format(dt),
  523. "environment": "production",
  524. "message": "group2",
  525. "stacktrace": {"frames": [{"module": "group2"}]},
  526. },
  527. project_id=self.project.id,
  528. )
  529. results = self.backend.query(
  530. [self.project],
  531. environments=[self.environments["production"]],
  532. sort_by="date",
  533. limit=1,
  534. count_hits=True,
  535. )
  536. assert list(results) == [self.group2]
  537. assert results.hits == 2
  538. results = self.backend.query(
  539. [self.project],
  540. environments=[self.environments["production"]],
  541. sort_by="date",
  542. limit=1,
  543. cursor=results.next,
  544. count_hits=True,
  545. )
  546. assert list(results) == [self.group1]
  547. assert results.hits == 2
  548. results = self.backend.query(
  549. [self.project],
  550. environments=[self.environments["production"]],
  551. sort_by="date",
  552. limit=1,
  553. cursor=results.next,
  554. count_hits=True,
  555. )
  556. assert list(results) == []
  557. assert results.hits == 2
  558. def test_age_filter(self):
  559. results = self.make_query(
  560. search_filter_query="firstSeen:>=%s" % date_to_query_format(self.group2.first_seen)
  561. )
  562. assert set(results) == {self.group2}
  563. results = self.make_query(
  564. search_filter_query="firstSeen:<=%s"
  565. % date_to_query_format(self.group1.first_seen + timedelta(minutes=1))
  566. )
  567. assert set(results) == {self.group1}
  568. results = self.make_query(
  569. search_filter_query="firstSeen:>=%s firstSeen:<=%s"
  570. % (
  571. date_to_query_format(self.group1.first_seen),
  572. date_to_query_format(self.group1.first_seen + timedelta(minutes=1)),
  573. )
  574. )
  575. assert set(results) == {self.group1}
  def test_age_filter_with_environment(self):
      """Check ``firstSeen`` filtering when the query is scoped to an environment."""
      production = self.environments["production"]

      # The reference timestamp is group1's first_seen as stored on its
      # production GroupEnvironment row. The queries below vary the comparison
      # operator (>=, <=, >) against that one timestamp.
      group1_first_seen = GroupEnvironment.objects.get(
          environment=production, group=self.group1
      ).first_seen
      first_seen_text = date_to_query_format(group1_first_seen)
      at_or_after = "firstSeen:>=%s" % first_seen_text
      at_or_before = "firstSeen:<=%s" % first_seen_text
      strictly_after = "firstSeen:>%s" % first_seen_text

      matched = self.make_query(
          environments=[production], search_filter_query=at_or_after
      )
      assert set(matched) == {self.group1}

      matched = self.make_query(
          environments=[production], search_filter_query=at_or_before
      )
      assert set(matched) == {self.group1}

      matched = self.make_query(
          environments=[production], search_filter_query=strictly_after
      )
      assert set(matched) == set()

      # Store a group1 event one day later, in the "development" environment.
      self.store_event(
          data={
              "fingerprint": ["put-me-in-group1"],
              "timestamp": iso_format(group1_first_seen + timedelta(days=1)),
              "message": "group1",
              "stacktrace": {"frames": [{"module": "group1"}]},
              "environment": "development",
          },
          project_id=self.project.id,
      )

      # Production is expected to be unaffected by the development event.
      matched = self.make_query(
          environments=[production], search_filter_query=strictly_after
      )
      assert set(matched) == set()

      # Scoped to development, group1 now counts as first seen after the reference.
      development = Environment.objects.get(name="development")
      matched = self.make_query(
          environments=[development], search_filter_query=strictly_after
      )
      assert set(matched) == {self.group1}
  def test_times_seen_filter(self):
      """Match groups on ``times_seen`` with exact, ``>=`` and ``<=`` comparisons."""
      expectations = (
          ("times_seen:2", {self.group1}),
          ("times_seen:>=2", {self.group1}),
          ("times_seen:<=1", {self.group2}),
      )
      for query, expected_groups in expectations:
          matched = self.make_query([self.project], search_filter_query=query)
          assert set(matched) == expected_groups
  def test_last_seen_filter(self):
      """Filter on ``lastSeen`` with a lower bound alone and with both bounds."""
      # Lower bound at group1's last_seen: only group1 is expected.
      lower_bound = date_to_query_format(self.group1.last_seen)
      matched = self.make_query(search_filter_query="lastSeen:>=%s" % lower_bound)
      assert set(matched) == {self.group1}

      # A one-minute window starting at group1's last_seen.
      window = (
          date_to_query_format(self.group1.last_seen),
          date_to_query_format(self.group1.last_seen + timedelta(minutes=1)),
      )
      matched = self.make_query(
          search_filter_query="lastSeen:>=%s lastSeen:<=%s" % window
      )
      assert set(matched) == {self.group1}
  def test_last_seen_filter_with_environment(self):
      """Check ``lastSeen`` filtering when the query is scoped to an environment."""
      production = self.environments["production"]
      one_day = timedelta(days=1)

      last_seen_text = date_to_query_format(self.group1.last_seen)

      matched = self.make_query(
          environments=[production],
          search_filter_query="lastSeen:>=%s" % last_seen_text,
      )
      assert set(matched) == {self.group1}

      matched = self.make_query(
          environments=[production],
          search_filter_query="lastSeen:<=%s" % last_seen_text,
      )
      assert set(matched) == {self.group1}

      matched = self.make_query(
          environments=[production],
          search_filter_query="lastSeen:>%s" % last_seen_text,
      )
      assert set(matched) == set()

      # Store a group1 event one day later, in the "development" environment,
      # and move the group's own last_seen forward by the same amount.
      self.store_event(
          data={
              "fingerprint": ["put-me-in-group1"],
              "timestamp": iso_format(self.group1.last_seen + one_day),
              "message": "group1",
              "stacktrace": {"frames": [{"module": "group1"}]},
              "environment": "development",
          },
          project_id=self.project.id,
      )
      self.group1.update(last_seen=self.group1.last_seen + one_day)

      # last_seen is read again here, after update(), in case the call changed
      # the value held on the instance; the remaining queries use this reading.
      bumped_text = date_to_query_format(self.group1.last_seen)

      matched = self.make_query(
          environments=[production],
          search_filter_query="lastSeen:>%s" % bumped_text,
      )
      assert set(matched) == set()

      matched = self.make_query(
          environments=[Environment.objects.get(name="development")],
          search_filter_query="lastSeen:>%s" % bumped_text,
      )
      assert set(matched) == set()

      matched = self.make_query(
          environments=[Environment.objects.get(name="development")],
          search_filter_query="lastSeen:>=%s" % bumped_text,
      )
      assert set(matched) == {self.group1}
  def test_date_filter(self):
      """Filter on event ``timestamp`` together with matching date_from/date_to."""
      first_event_at = self.event1.datetime
      second_event_at = self.event2.datetime
      one_minute = timedelta(minutes=1)

      # Lower bound only, starting at event2.
      matched = self.make_query(
          date_from=second_event_at,
          search_filter_query="timestamp:>=%s" % date_to_query_format(second_event_at),
      )
      assert set(matched) == {self.group1, self.group2}

      # Upper bound only, one minute after event1.
      first_plus_minute = first_event_at + one_minute
      matched = self.make_query(
          date_to=first_plus_minute,
          search_filter_query="timestamp:<=%s" % date_to_query_format(first_plus_minute),
      )
      assert set(matched) == {self.group1}

      # Both bounds: from event1 to one minute after event2.
      second_plus_minute = second_event_at + one_minute
      range_start = date_to_query_format(first_event_at)
      range_end = date_to_query_format(second_plus_minute)
      matched = self.make_query(
          date_from=first_event_at,
          date_to=second_plus_minute,
          search_filter_query="timestamp:>=%s timestamp:<=%s" % (range_start, range_end),
      )
      assert set(matched) == {self.group1, self.group2}

      # Test with `Z` utc marker, should be equivalent
      matched = self.make_query(
          date_from=first_event_at,
          date_to=second_plus_minute,
          search_filter_query="timestamp:>=%s timestamp:<=%s"
          % (range_start + "Z", range_end + "Z"),
      )
      assert set(matched) == {self.group1, self.group2}
  def test_date_filter_with_environment(self):
      """Combine date_from/date_to bounds with an environment on the raw backend."""
      production = self.environments["production"]
      staging = self.environments["staging"]
      one_minute = timedelta(minutes=1)

      # Production, lower bound at event2.
      matched = self.backend.query(
          [self.project], environments=[production], date_from=self.event2.datetime
      )
      assert set(matched) == {self.group1}

      # Production, upper bound one minute after event1.
      matched = self.backend.query(
          [self.project],
          environments=[production],
          date_to=self.event1.datetime + one_minute,
      )
      assert set(matched) == {self.group1}

      # Staging, bounded on both sides.
      matched = self.backend.query(
          [self.project],
          environments=[staging],
          date_from=self.event1.datetime,
          date_to=self.event2.datetime + one_minute,
      )
      assert set(matched) == {self.group2}
  def test_linked(self):
      """``is:linked`` / ``is:unlinked`` with both kinds of external issue present."""
      via_integration = self.create_group_with_integration_external_issue()
      via_platform = self.create_group_with_platform_external_issue()

      unlinked = self.make_query(search_filter_query="is:unlinked")
      assert set(unlinked) == {self.group1, self.group2}

      linked = self.make_query(search_filter_query="is:linked")
      assert set(linked) == {via_integration, via_platform}
  def test_linked_with_only_integration_external_issue(self):
      """``is:linked`` finds a group linked through an integration external issue."""
      via_integration = self.create_group_with_integration_external_issue()

      unlinked = self.make_query(search_filter_query="is:unlinked")
      assert set(unlinked) == {self.group1, self.group2}

      linked = self.make_query(search_filter_query="is:linked")
      assert set(linked) == {via_integration}
  def test_linked_with_only_platform_external_issue(self):
      """``is:linked`` finds a group linked through a platform external issue."""
      via_platform = self.create_group_with_platform_external_issue()

      unlinked = self.make_query(search_filter_query="is:unlinked")
      assert set(unlinked) == {self.group1, self.group2}

      linked = self.make_query(search_filter_query="is:linked")
      assert set(linked) == {via_platform}
  def test_linked_with_environment(self):
      """``is:linked`` / ``is:unlinked`` respect the environment the query is scoped to."""
      linked_in_production = self.create_group_with_integration_external_issue(
          environment="production"
      )
      linked_in_staging = self.create_group_with_platform_external_issue(
          environment="staging"
      )

      # (environment name, query, groups expected back), checked in this order.
      cases = (
          ("production", "is:unlinked", {self.group1}),
          ("staging", "is:unlinked", {self.group2}),
          ("production", "is:linked", {linked_in_production}),
          ("staging", "is:linked", {linked_in_staging}),
      )
      for environment_name, query, expected_groups in cases:
          matched = self.make_query(
              environments=[self.environments[environment_name]],
              search_filter_query=query,
          )
          assert set(matched) == expected_groups
  def test_unassigned(self):
      """``is:unassigned`` returns group1 and ``is:assigned`` returns group2."""
      unassigned = self.make_query(search_filter_query="is:unassigned")
      assert set(unassigned) == {self.group1}

      assigned = self.make_query(search_filter_query="is:assigned")
      assert set(assigned) == {self.group2}
  def test_unassigned_with_environment(self):
      """``is:assigned`` / ``is:unassigned`` scoped to a single environment."""
      # (environment name, query, groups expected back), checked in this order.
      cases = (
          ("production", "is:unassigned", {self.group1}),
          ("staging", "is:assigned", {self.group2}),
          ("production", "is:assigned", set()),
      )
      for environment_name, query, expected_groups in cases:
          matched = self.make_query(
              environments=[self.environments[environment_name]],
              search_filter_query=query,
          )
          assert set(matched) == expected_groups
  def test_assigned_to(self):
      """``assigned:<username>`` for a direct assignee, a team assignee, and non-assignees."""

      def groups_assigned_to(user):
          # Run an ``assigned:`` search for the given user's username.
          found = self.make_query(search_filter_query="assigned:%s" % user.username)
          return set(found)

      assert groups_assigned_to(self.user) == {self.group2}

      # test team assignee: move group2's assignment from the user to the team.
      # The user is still expected to match (presumably as a member of that
      # team -- the membership itself is set up outside this method).
      assignment = GroupAssignee.objects.get(
          user=self.user, group=self.group2, project=self.group2.project
      )
      assignment.update(team=self.team, user=None)
      assert GroupAssignee.objects.get(id=assignment.id).user is None
      assert groups_assigned_to(self.user) == {self.group2}

      # test when there should be no results
      unrelated_user = self.create_user()
      assert groups_assigned_to(unrelated_user) == set()

      owner = self.create_user()
      self.create_member(
          organization=self.project.organization, user=owner, role="owner", teams=[]
      )

      # test that owners don't see results for all teams
      assert groups_assigned_to(owner) == set()
  def test_assigned_to_in_syntax(self):
      """``assigned:[...]`` list syntax with users, a team, ``me`` and ``none``."""
      muted_group = self.store_event(
          data={
              "fingerprint": ["put-me-in-group3"],
              "event_id": "c" * 32,
              "timestamp": iso_format(self.base_datetime - timedelta(days=20)),
          },
          project_id=self.project.id,
      ).group
      muted_group.status = GroupStatus.MUTED
      muted_group.save()

      second_user = self.create_user()
      either_user = f"assigned:[{self.user.username}, {second_user.username}]"
      team_or_second_user = f"assigned:[#{self.team.slug}, {second_user.username}]"

      # Only group2 has an assignee so far.
      self.run_test_query_in_syntax(
          either_user, [self.group2], [self.group1, muted_group]
      )

      # Assign the new group to the second user.
      GroupAssignee.objects.create(
          project=self.project, group=muted_group, user=second_user
      )
      self.run_test_query_in_syntax(
          either_user, [self.group2, muted_group], [self.group1]
      )
      self.run_test_query_in_syntax(
          team_or_second_user, [muted_group], [self.group1, self.group2]
      )

      # Move group2's assignment from the user to the team.
      group2_assignment = GroupAssignee.objects.get(
          user=self.user, group=self.group2, project=self.group2.project
      )
      group2_assignment.update(team=self.team, user=None)
      self.run_test_query_in_syntax(
          either_user, [self.group2, muted_group], [self.group1]
      )
      self.run_test_query_in_syntax(
          team_or_second_user, [self.group2, muted_group], [self.group1]
      )

      # ``me``, ``none`` and the second user together cover every group.
      self.run_test_query_in_syntax(
          f"assigned:[me, none, {second_user.username}]",
          [self.group1, self.group2, muted_group],
          [],
      )
  def test_assigned_or_suggested_in_syntax(self):
      """``assigned_or_suggested:[...]`` across suggested owners and assignees."""
      Group.objects.all().delete()

      def new_group(seconds_ago, fingerprint):
          # Store a single event and return the group it lands in.
          return self.store_event(
              data={
                  "timestamp": iso_format(before_now(seconds=seconds_ago)),
                  "fingerprint": [fingerprint],
              },
              project_id=self.project.id,
          ).group

      def suggest_owner(group, user_id=None, team_id=None):
          # Record a GroupOwner row (type 0) for either a user or a team.
          GroupOwner.objects.create(
              group=group,
              project=self.project,
              organization=self.organization,
              type=0,
              team_id=team_id,
              user_id=user_id,
          )

      first_group = new_group(180, "group-1")
      second_group = new_group(185, "group-2")
      third_group = new_group(190, "group-3")
      self_assigned_group = new_group(195, "group-4")
      other_assigned_group = new_group(195, "group-5")

      # No owners or assignees exist yet, so "me" matches nothing.
      self.run_test_query_in_syntax(
          "assigned_or_suggested:[me]",
          [],
          [
              first_group,
              second_group,
              third_group,
              self_assigned_group,
              other_assigned_group,
          ],
      )

      suggest_owner(other_assigned_group, user_id=self.user.id)
      suggest_owner(first_group, user_id=self.user.id)
      self.run_test_query_in_syntax(
          "assigned_or_suggested:[me]",
          [first_group, other_assigned_group],
          [second_group, third_group, self_assigned_group],
      )

      # Once other_assigned_group is assigned to other_user, it should not show
      # up in an assigned_or_suggested search for anyone but other_user
      # (i.e. the assignee is now treated as its only owner).
      other_user = self.create_user("other@user.com", is_superuser=False)
      GroupAssignee.objects.create(
          group=other_assigned_group,
          project=self.project,
          user=other_user,
      )
      self.run_test_query_in_syntax(
          "assigned_or_suggested:[me]",
          [first_group],
          [second_group, third_group, self_assigned_group, other_assigned_group],
      )
      self.run_test_query_in_syntax(
          f"assigned_or_suggested:[{other_user.email}]",
          [other_assigned_group],
          [first_group, second_group, third_group, self_assigned_group],
      )

      GroupAssignee.objects.create(
          group=self_assigned_group, project=self.project, user=self.user
      )
      self.run_test_query_in_syntax(
          f"assigned_or_suggested:[{self.user.email}]",
          [self_assigned_group, first_group],
      )

      # Add the team as a second suggested owner of first_group.
      suggest_owner(first_group, team_id=self.team.id)
      self.run_test_query_in_syntax(
          f"assigned_or_suggested:[#{self.team.slug}]",
          [first_group],
      )
      self.run_test_query_in_syntax(
          "assigned_or_suggested:[me, none]",
          [first_group, second_group, third_group, self_assigned_group],
          [other_assigned_group],
      )

      # Give third_group a suggested owner who is neither "me" nor "none".
      not_me = self.create_user(email="notme@sentry.io")
      suggest_owner(third_group, user_id=not_me.id)
      self.run_test_query_in_syntax(
          "assigned_or_suggested:[me, none]",
          [first_group, second_group, self_assigned_group],
          [other_assigned_group, third_group],
      )

      # Drop the user's own suggestion on first_group; the team one remains.
      GroupOwner.objects.filter(group=first_group, user=self.user).delete()
      self.run_test_query_in_syntax(
          f"assigned_or_suggested:[me, none, #{self.team.slug}]",
          [first_group, second_group, self_assigned_group],
          [other_assigned_group, third_group],
      )
      self.run_test_query_in_syntax(
          f"assigned_or_suggested:[me, none, #{self.team.slug}, {not_me.email}]",
          [first_group, second_group, self_assigned_group, third_group],
          [other_assigned_group],
      )
  def test_assigned_to_with_environment(self):
      """``assigned:<username>`` scoped to staging and then to production."""
      assigned_to_user = "assigned:%s" % self.user.username

      in_staging = self.make_query(
          environments=[self.environments["staging"]],
          search_filter_query=assigned_to_user,
      )
      assert set(in_staging) == {self.group2}

      in_production = self.make_query(
          environments=[self.environments["production"]],
          search_filter_query=assigned_to_user,
      )
      assert set(in_production) == set()
  def test_subscribed_by(self):
      """``subscribed:<username>`` returns the group the user is subscribed to."""
      subscribed_query = "subscribed:%s" % self.user.username
      matched = self.make_query(
          [self.group1.project], search_filter_query=subscribed_query
      )
      assert set(matched) == {self.group1}
  def test_subscribed_by_in_syntax(self):
      """``subscribed:[...]`` list syntax with one user and then two users."""
      self.run_test_query_in_syntax(
          f"subscribed:[{self.user.username}]", [self.group1], [self.group2]
      )

      # Subscribe a second user to group2 so the two-user list covers both groups.
      second_subscriber = self.create_user()
      GroupSubscription.objects.create(
          user=second_subscriber,
          group=self.group2,
          project=self.project,
          is_active=True,
      )
      self.run_test_query_in_syntax(
          f"subscribed:[{self.user.username}, {second_subscriber.username}]",
          [self.group1, self.group2],
          [],
      )
  def test_subscribed_by_with_environment(self):
      """``subscribed:<username>`` scoped to production and then to staging."""
      subscribed_query = "subscribed:%s" % self.user.username

      in_production = self.make_query(
          [self.group1.project],
          environments=[self.environments["production"]],
          search_filter_query=subscribed_query,
      )
      assert set(in_production) == {self.group1}

      in_staging = self.make_query(
          [self.group1.project],
          environments=[self.environments["staging"]],
          search_filter_query=subscribed_query,
      )
      assert set(in_staging) == set()
  @mock.patch("sentry.utils.snuba.raw_query")
  def test_snuba_not_called_optimization(self, query_mock):
      """A status-only search must not call Snuba; a ``last_seen`` search must."""
      status_only = self.make_query(search_filter_query="status:unresolved")
      assert status_only.results == [self.group1]
      assert not query_mock.called

      last_seen_query = "last_seen:>%s" % date_to_query_format(timezone.now())
      with_last_seen = self.make_query(
          search_filter_query=last_seen_query, sort_by="date"
      )
      assert with_last_seen.results == []
      assert query_mock.called
  @mock.patch("sentry.utils.snuba.raw_query")
  def test_optimized_aggregates(self, query_mock):
      """Pin the keyword arguments passed to ``raw_query`` for each sort order."""
      # TODO this test is annoyingly fragile and breaks in hard-to-see ways
      # any time anything about the snuba query changes
      query_mock.return_value = {"data": [], "totals": {"total": 0}}

      def instance_of(expected_type):
          # Build a matcher that compares equal to any instance of expected_type.
          class _InstanceMatcher:
              def __eq__(self, other):
                  return isinstance(other, expected_type)

          return _InstanceMatcher()

      default_limit = 100
      growth_rate = options.get("snuba.search.chunk-growth-rate")
      expected_limit = int(default_limit * growth_rate)

      # Keyword arguments expected to be identical for every call checked below.
      shared_kwargs = {
          "arrayjoin": None,
          "dataset": Dataset.Events,
          "start": instance_of(datetime),
          "end": instance_of(datetime),
          "filter_keys": {
              "project_id": [self.project.id],
              "group_id": [self.group1.id, self.group2.id],
          },
          "referrer": "search",
          "groupby": ["group_id"],
          "conditions": [[["positionCaseInsensitive", ["message", "'foo'"]], "!=", 0]],
          "selected_columns": [],
          "limit": expected_limit,
          "offset": 0,
          "totals": True,
          "turbo": False,
          "sample": 1,
      }

      def last_call_with_sorted_aggregations():
          # Sort the recorded aggregations in place so that the comparison does
          # not depend on the order in which they were passed.
          query_mock.call_args[1]["aggregations"].sort()
          return query_mock.call_args

      # A status-only search should not reach Snuba at all.
      self.make_query(search_filter_query="status:unresolved")
      assert not query_mock.called

      # sort_by="date" with a last_seen filter.
      self.make_query(
          search_filter_query="last_seen:>=%s foo" % date_to_query_format(timezone.now()),
          sort_by="date",
      )
      assert last_call_with_sorted_aggregations() == mock.call(
          orderby=["-last_seen", "group_id"],
          aggregations=[
              ["multiply(toUInt64(max(timestamp)), 1000)", "", "last_seen"],
              ["uniq", "group_id", "total"],
          ],
          having=[["last_seen", ">=", instance_of(int)]],
          **shared_kwargs,
      )

      # sort_by="priority".
      self.make_query(search_filter_query="foo", sort_by="priority")
      assert last_call_with_sorted_aggregations() == mock.call(
          orderby=["-priority", "group_id"],
          aggregations=[
              ["count()", "", "times_seen"],
              ["multiply(toUInt64(max(timestamp)), 1000)", "", "last_seen"],
              ["toUInt64(plus(multiply(log(times_seen), 600), last_seen))", "", "priority"],
              ["uniq", "group_id", "total"],
          ],
          having=[],
          **shared_kwargs,
      )

      # sort_by="freq" with a times_seen filter.
      self.make_query(search_filter_query="times_seen:5 foo", sort_by="freq")
      assert last_call_with_sorted_aggregations() == mock.call(
          orderby=["-times_seen", "group_id"],
          aggregations=[["count()", "", "times_seen"], ["uniq", "group_id", "total"]],
          having=[["times_seen", "=", 5]],
          **shared_kwargs,
      )

      # sort_by="user".
      self.make_query(search_filter_query="foo", sort_by="user")
      assert last_call_with_sorted_aggregations() == mock.call(
          orderby=["-user_count", "group_id"],
          aggregations=[
              ["uniq", "group_id", "total"],
              ["uniq", "tags[sentry:user]", "user_count"],
          ],
          having=[],
          **shared_kwargs,
      )
  def test_pre_and_post_filtering(self):
      """Run searches with ``snuba.search.max-pre-snuba-candidates`` set to 1.

      The option is overridden with the ``self.options`` context manager, so
      the override is scoped to the ``with`` block and nothing has to be
      written back by hand afterwards.
      """
      with self.options({"snuba.search.max-pre-snuba-candidates": 1}):
          # normal queries work as expected
          matched = self.make_query(search_filter_query="foo")
          assert set(matched) == {self.group1}

          matched = self.make_query(search_filter_query="bar")
          assert set(matched) == {self.group2}

          # no candidate matches in Sentry, immediately return empty paginator
          matched = self.make_query(search_filter_query="NO MATCHES IN SENTRY")
          assert set(matched) == set()

          # too many candidates, skip pre-filter, requires >1 postfilter queries
          matched = self.make_query()
          assert set(matched) == {self.group1, self.group2}
  def test_optimizer_enabled(self):
      """Run a tag search with ``snuba.search.pre-snuba-candidates-optimizer`` on.

      The option is overridden with the ``self.options`` context manager, so
      the override is scoped to the ``with`` block and nothing has to be
      written back by hand afterwards.
      """
      with self.options({"snuba.search.pre-snuba-candidates-optimizer": True}):
          matched = self.make_query(
              search_filter_query="server:example.com",
              environments=[self.environments["production"]],
          )
          assert set(matched) == {self.group1}
  def test_search_out_of_range(self):
      """A search pinned to one instant in the year 2000 returns no groups."""
      the_date = datetime(2000, 1, 1, 0, 0, 0, tzinfo=pytz.utc)
      # The same instant is used for both filter bounds and for date_from/date_to.
      impossible_range = f"event.timestamp:>{the_date} event.timestamp:<{the_date}"

      matched = self.make_query(
          search_filter_query=impossible_range,
          date_from=the_date,
          date_to=the_date,
      )
      assert set(matched) == set()
  def test_hits_estimate(self):
      """Check that sampled hit counts are plausible and stable for a given query."""
      # 400 Groups/Events
      # Every 3rd one is Unresolved
      # Every 2nd one has tag match=1
      event_timestamp = iso_format(self.base_datetime - timedelta(days=21))
      for index in range(400):
          stored_event = self.store_event(
              data={
                  "event_id": md5(f"event {index}".encode()).hexdigest(),
                  "fingerprint": [f"put-me-in-group{index}"],
                  "timestamp": event_timestamp,
                  "message": f"group {index} event",
                  "stacktrace": {"frames": [{"module": f"module {index}"}]},
                  "tags": {"match": f"{index % 2}"},
                  "environment": "production",
              },
              project_id=self.project.id,
          )
          group = stored_event.group
          group.times_seen = 5
          if index % 3 == 0:
              group.status = GroupStatus.UNRESOLVED
          else:
              group.status = GroupStatus.RESOLVED
          group.save()
          self.store_group(group)

      # Of the 200 groups tagged match=1, about a third are unresolved, so the
      # estimate should land somewhere around 66 matching groups. It is derived
      # from a sample of the snuba matches ("snuba.search.hits-sample-size" is
      # set to 50 below).
      overrides = {
          # Too small to pass all django candidates down to snuba
          "snuba.search.max-pre-snuba-candidates": 5,
          "snuba.search.hits-sample-size": 50,
      }
      with self.options(overrides):
          unresolved_match_1 = "is:unresolved match:1"
          first_results = self.make_query(
              search_filter_query=unresolved_match_1, limit=10, count_hits=True
          )

          # Deliberately do not assert that the value is within some margin
          # of error, as this will fail tests at some rate corresponding to
          # our confidence interval.
          assert first_results.hits > 10

          # When searching for the same tags, we should get the same set of
          # hits as the sampling is based on the hash of the query.
          second_results = self.make_query(
              search_filter_query=unresolved_match_1, limit=10, count_hits=True
          )
          assert first_results.results == second_results.results

          # When using a different search, we should get a different sample
          # but still should have some hits.
          third_results = self.make_query(
              search_filter_query="is:unresolved match:0", limit=10, count_hits=True
          )
          assert third_results.hits > 10
          assert third_results.results != second_results.results
  def test_regressed_in_release(self):
      """``regressed_in_release:<version>`` only matches groups with a recorded regression."""

      def regressed_in(release):
          # Search for groups that regressed in the given release.
          found = self.make_query(
              search_filter_query="regressed_in_release:%s" % release.version
          )
          return set(found)

      # expect no groups within the results since there are no releases
      matched = self.make_query(search_filter_query="regressed_in_release:fake")
      assert set(matched) == set()

      # expect no groups even though there is a release; since no group regressed in this release
      first_release = self.create_release()
      assert regressed_in(first_release) == set()

      # Create a new event so that we get a group in this release
      first_group = self.store_event(
          data={
              "release": first_release.version,
          },
          project_id=self.project.id,
      ).group

      # Should still be no group since we didn't regress in this release
      assert regressed_in(first_release) == set()

      record_group_history(first_group, GroupHistoryStatus.REGRESSED, release=first_release)
      assert regressed_in(first_release) == {first_group}

      # Make sure this works correctly with multiple releases
      second_release = self.create_release()
      second_group = self.store_event(
          data={
              "fingerprint": ["put-me-in-group9001"],
              "event_id": "a" * 32,
              "release": second_release.version,
          },
          project_id=self.project.id,
      ).group
      record_group_history(second_group, GroupHistoryStatus.REGRESSED, release=second_release)

      assert regressed_in(first_release) == {first_group}
      assert regressed_in(second_release) == {second_group}
  def test_first_release(self):
      """``first_release:<version>`` matches a group once an event ties it to the release."""
      # expect no groups within the results since there are no releases
      matched = self.make_query(search_filter_query="first_release:%s" % "fake")
      assert set(matched) == set()

      # expect no groups even though there is a release; since no group
      # is attached to a release
      release = self.create_release(self.project)
      release_query = "first_release:%s" % release.version
      matched = self.make_query(search_filter_query=release_query)
      assert set(matched) == set()

      # Create a new event so that we get a group in this release
      released_group = self.store_event(
          data={
              "fingerprint": ["put-me-in-group9001"],
              "event_id": "a" * 32,
              "message": "hello",
              "environment": "production",
              "tags": {"server": "example.com"},
              "release": release.version,
              "stacktrace": {"frames": [{"module": "group1"}]},
          },
          project_id=self.project.id,
      ).group

      matched = self.make_query(search_filter_query=release_query)
      assert set(matched) == {released_group}
  def test_first_release_in_syntax(self):
      """``first_release:[...]`` list syntax with zero, one and two matching groups."""

      def new_group_in(release, fingerprint):
          # Store one event in the given release and return the group it lands in.
          # NOTE(review): every event stored here uses the same event_id
          # ("a" * 32) -- confirm that the collision is intended.
          return self.store_event(
              data={
                  "fingerprint": [fingerprint],
                  "event_id": "a" * 32,
                  "message": "hello",
                  "environment": "production",
                  "tags": {"server": "example.com"},
                  "release": release.version,
                  "stacktrace": {"frames": [{"module": "group1"}]},
              },
              project_id=self.project.id,
          ).group

      # expect no groups within the results since there are no releases
      self.run_test_query_in_syntax("first_release:[fake, fake2]", [])

      # expect no groups even though there is a release; since no group
      # is attached to a release
      release_1 = self.create_release(self.project)
      release_2 = self.create_release(self.project)
      either_release = f"first_release:[{release_1.version}, {release_2.version}]"
      self.run_test_query_in_syntax(either_release, [])

      # Create a new event so that we get a group in the first release
      group_in_release_1 = new_group_in(release_1, "put-me-in-group9001")
      self.run_test_query_in_syntax(
          either_release,
          [group_in_release_1],
          [self.group1, self.group2],
      )

      # Create a new event so that we get a group in the second release
      group_in_release_2 = new_group_in(release_2, "put-me-in-group9002")
      self.run_test_query_in_syntax(
          either_release,
          [group_in_release_1, group_in_release_2],
      )
  def test_first_release_environments(self):
      """``first_release`` scoped to an environment uses that environment's first release."""
      production = self.environments["production"]

      # Unknown release version: nothing matches.
      matched = self.make_query(
          environments=[production],
          search_filter_query="first_release:fake",
      )
      assert set(matched) == set()

      release = self.create_release(self.project)
      production_row = GroupEnvironment.get_or_create(
          group_id=self.group1.id, environment_id=production.id
      )[0]

      # The release exists, but group1's production row does not point at it yet.
      matched = self.make_query(
          environments=[production],
          search_filter_query=f"first_release:{release.version}",
      )
      assert set(matched) == set()

      # Point group1's production row at the release and search again.
      production_row.first_release = release
      production_row.save()

      matched = self.make_query(
          environments=[production],
          search_filter_query=f"first_release:{release.version}",
      )
      assert set(matched) == {self.group1}
  def test_first_release_environments_in_syntax(self):
      """``first_release:[...]`` list syntax combined with one or two environments."""
      production = self.environments["production"]
      staging = self.environments["staging"]

      # Neither version exists, so nothing matches in production.
      self.run_test_query_in_syntax(
          "first_release:[fake, fake2]",
          [],
          [self.group1, self.group2],
          environments=[production],
      )

      release = self.create_release(self.project)
      release_or_fake = f"first_release:[{release.version}, fake2]"

      # Point group1's production row at the release.
      group1_production = GroupEnvironment.objects.get(
          group_id=self.group1.id, environment_id=production.id
      )
      group1_production.update(first_release=release)
      self.run_test_query_in_syntax(
          release_or_fake,
          [self.group1],
          [self.group2],
          environments=[production],
      )

      # Point group2's staging row at the same release and search both environments.
      group2_staging = GroupEnvironment.objects.get(
          group_id=self.group2.id, environment_id=staging.id
      )
      group2_staging.update(first_release=release)
      self.run_test_query_in_syntax(
          release_or_fake,
          [self.group1, self.group2],
          [],
          environments=[production, staging],
      )

      # Make sure we don't get duplicate groups
      GroupEnvironment.objects.create(
          group_id=self.group1.id,
          environment_id=staging.id,
          first_release=release,
      )
      self.run_test_query_in_syntax(
          release_or_fake,
          [self.group1, self.group2],
          [],
          environments=[production, staging],
      )
  def test_query_enclosed_in_quotes(self):
      """A double-quoted free-text query returns exactly the expected group."""
      expectations = (
          ('"foo"', self.group1),
          ('"bar"', self.group2),
      )
      for quoted_query, expected_group in expectations:
          results = self.make_query(search_filter_query=quoted_query)
          assert set(results) == {expected_group}
  @xfail_if_not_postgres("Wildcard searching only supported in Postgres")
  def test_wildcard(self):
      """Run `*` wildcard searches over message text and the `server` tag."""
      # The message deliberately contains square brackets.
      wildcard_event = self.store_event(
          data={
              "fingerprint": ["hello-there"],
              "event_id": "f" * 32,
              "message": "somet[hing]",
              "environment": "production",
              "tags": {"server": "example.net"},
              "timestamp": iso_format(self.base_datetime),
              "stacktrace": {"frames": [{"module": "group1"}]},
          },
          project_id=self.project.id,
      )
      wildcard_group = wildcard_event.group

      # Note: Adding in `environment:production` so that we make sure we query
      # in both snuba and postgres
      cases = (
          ("environment:production so*t", {wildcard_group}),
          # Make sure it's case insensitive
          ("environment:production SO*t", {wildcard_group}),
          ("environment:production so*zz", set()),
          ("environment:production [hing]", {wildcard_group}),
          ("environment:production s*]", {wildcard_group}),
          ("environment:production server:example.*", {self.group1, wildcard_group}),
          ("environment:production !server:*net", {self.group1}),
      )
      for query, expected_groups in cases:
          results = self.make_query(search_filter_query=query)
          assert set(results) == expected_groups

      # TODO: Disabling tests that use [] syntax for the moment. Re-enable
      # these if we decide to add back in, or remove if this comment has been
      # here a while.
      # results = self.make_query(
      #     search_filter_query='environment:production [s][of][mz]',
      # )
      # assert set(results) == set([escaped_event.group])
      # results = self.make_query(
      #     search_filter_query='environment:production [z][of][mz]',
      # )
      # assert set(results) == set()
  def test_null_tags(self):
      """Search on the `server` tag when one production event has it and another does not."""
      timestamp = iso_format(self.base_datetime)

      tagged_event = self.store_event(
          data={
              "fingerprint": ["hello-there"],
              "event_id": "f" * 32,
              "message": "something",
              "environment": "production",
              "tags": {"server": "example.net"},
              "timestamp": timestamp,
              "stacktrace": {"frames": [{"module": "group1"}]},
          },
          project_id=self.project.id,
      )
      # Same shape as above, but with no "tags" entry at all.
      untagged_event = self.store_event(
          data={
              "fingerprint": ["hello-there-2"],
              "event_id": "5" * 32,
              "message": "something",
              "environment": "production",
              "timestamp": timestamp,
              "stacktrace": {"frames": [{"module": "group2"}]},
          },
          project_id=self.project.id,
      )
      tagged_group = tagged_event.group
      untagged_group = untagged_event.group

      cases = (
          ("environment:production !server:*net", {self.group1, untagged_group}),
          ("environment:production server:*net", {tagged_group}),
          ("environment:production !server:example.net", {self.group1, untagged_group}),
          ("environment:production server:example.net", {tagged_group}),
          ("environment:production has:server", {self.group1, tagged_group}),
          ("environment:production !has:server", {untagged_group}),
      )
      for query, expected_groups in cases:
          results = self.make_query(search_filter_query=query)
          assert set(results) == expected_groups
  def test_null_promoted_tags(self):
      """Search on the `logger` tag when one production event has it and another does not."""
      timestamp = iso_format(self.base_datetime)

      tagged_event = self.store_event(
          data={
              "fingerprint": ["hello-there"],
              "event_id": "f" * 32,
              "message": "something",
              "environment": "production",
              "tags": {"logger": "csp"},
              "timestamp": timestamp,
              "stacktrace": {"frames": [{"module": "group1"}]},
          },
          project_id=self.project.id,
      )
      # Same shape as above, but with no "tags" entry at all.
      untagged_event = self.store_event(
          data={
              "fingerprint": ["hello-there-2"],
              "event_id": "5" * 32,
              "message": "something",
              "environment": "production",
              "timestamp": timestamp,
              "stacktrace": {"frames": [{"module": "group2"}]},
          },
          project_id=self.project.id,
      )
      tagged_group = tagged_event.group
      untagged_group = untagged_event.group

      cases = (
          ("environment:production !logger:*sp", {self.group1, untagged_group}),
          ("environment:production logger:*sp", {tagged_group}),
          ("environment:production !logger:csp", {self.group1, untagged_group}),
          ("environment:production logger:csp", {tagged_group}),
          ("environment:production has:logger", {tagged_group}),
          ("environment:production !has:logger", {self.group1, untagged_group}),
      )
      for query, expected_groups in cases:
          results = self.make_query(search_filter_query=query)
          assert set(results) == expected_groups
  def test_sort_multi_project(self):
      """Check the result ordering of every sort mode when querying two projects."""
      self.set_up_multi_project()

      # Sort key -> exact expected group order.
      expected_by_sort = (
          ("date", [self.group1, self.group_p2, self.group2]),
          ("new", [self.group2, self.group_p2, self.group1]),
          ("freq", [self.group1, self.group_p2, self.group2]),
          ("priority", [self.group1, self.group2, self.group_p2]),
          ("user", [self.group1, self.group2, self.group_p2]),
      )
      for sort_key, expected_order in expected_by_sort:
          results = self.make_query([self.project, self.project2], sort_by=sort_key)
          assert list(results) == expected_order
  def test_sort_trend(self):
      """Check the ordering produced by `sort_by="trend"` over a fixed date window."""
      start = self.group1.first_seen - timedelta(days=1)
      end = before_now(days=1).replace(tzinfo=pytz.utc)
      middle = start + ((end - start) / 2)
      before_middle = middle - timedelta(days=1)

      def store(fingerprint, event_id, when):
          # Every event in this test differs only in these three fields.
          return self.store_event(
              data={
                  "fingerprint": [fingerprint],
                  "event_id": event_id,
                  "message": "something",
                  "timestamp": iso_format(when),
              },
              project_id=self.project.id,
          )

      # Two more events for the "put-me-in-group1" fingerprint.
      store("put-me-in-group1", "2" * 32, self.base_datetime)
      store("put-me-in-group1", "3" * 32, self.base_datetime)

      # Two events one day before the window's midpoint, one at base_datetime.
      fewer_events_group = store("put-me-in-group4", "4" * 32, before_middle).group
      store("put-me-in-group4", "5" * 32, before_middle)
      store("put-me-in-group4", "6" * 32, self.base_datetime)

      # NOTE(review): the next two event ids repeat ids already used above
      # ("3" * 32 and "4" * 32) -- confirm this reuse is intentional.
      no_before_group = store("put-me-in-group5", "3" * 32, self.base_datetime).group
      no_after_group = store("put-me-in-group6", "4" * 32, before_middle).group

      self.set_up_multi_project()

      results = self.make_query([self.project], sort_by="trend", date_from=start, date_to=end)
      assert results[:2] == [self.group1, fewer_events_group]
      # These will be arbitrarily ordered since their trend values are all 0
      assert set(results[2:]) == {self.group2, no_before_group, no_after_group}
  def test_in_syntax_is_invalid(self):
      """The list ("in") form is rejected for `is:` searches with InvalidSearchQuery."""
      expected_message = '"in" syntax invalid for "is" search'
      with pytest.raises(InvalidSearchQuery, match=expected_message):
          self.make_query(search_filter_query="is:[unresolved, resolved]")
  def test_first_release_any_or_no_environments(self):
      """Check `first_release:` results with and without environment filters."""
      # test scenarios for tickets:
      # SEN-571
      # ISSUE-432
      #
      # given the following setup:
      #
      # groups table:
      #   group    first_release
      #   A        1
      #   B        1
      #   C        2
      #
      # groupenvironments table:
      #   group    environment    first_release
      #   A        staging        1
      #   A        production     2
      #
      # when querying by first release, the appropriate set of groups should be displayed:
      #
      # first_release: 1
      #   env=[]: A, B
      #   env=[production, staging]: A
      #   env=[staging]: A
      #   env=[production]: nothing
      #
      # first_release: 2
      #   env=[]: A, C
      #   env=[production, staging]: A
      #   env=[staging]: nothing
      #   env=[production]: A

      # Group A: one issue whose events occur in two distinct environments.
      group_a_staging_event = self.store_event(
          data={
              "fingerprint": ["group_a"],
              "event_id": "aaa" + ("1" * 29),
              "environment": "example_staging",
              "release": "release_1",
          },
          project_id=self.project.id,
      )
      group_a_prod_event = self.store_event(
          data={
              "fingerprint": ["group_a"],
              "event_id": "aaa" + ("2" * 29),
              "environment": "example_production",
              "release": "release_2",
          },
          project_id=self.project.id,
      )
      group_a = group_a_staging_event.group

      # The environments group A's events were stored under.
      prod_env = group_a_prod_event.get_environment()
      staging_env = group_a_staging_event.get_environment()

      # Group B: one event with no environment, tied to release_1.
      group_b_event = self.store_event(
          data={
              "fingerprint": ["group_b"],
              "event_id": "bbb" + ("1" * 29),
              "release": "release_1",
          },
          project_id=self.project.id,
      )
      assert group_b_event.get_environment().name == ""  # has no environment
      group_b = group_b_event.group

      # Group C: one event with no environment, tied to release_2.
      group_c_event = self.store_event(
          data={
              "fingerprint": ["group_c"],
              "event_id": "ccc" + ("1" * 29),
              "release": "release_2",
          },
          project_id=self.project.id,
      )
      assert group_c_event.get_environment().name == ""  # has no environment
      group_c = group_c_event.group

      release_1_query = "first_release:%s" % "release_1"
      release_2_query = "first_release:%s" % "release_2"

      # (query, extra make_query kwargs, expected groups). An empty kwargs dict
      # means the query runs with make_query's default environment handling.
      cases = (
          # query by release release_1
          (release_1_query, {}, {group_a, group_b}),
          (release_1_query, {"environments": [staging_env, prod_env]}, {group_a}),
          (release_1_query, {"environments": [staging_env]}, {group_a}),
          (release_1_query, {"environments": [prod_env]}, set()),
          # query by release release_2
          (release_2_query, {}, {group_a, group_c}),
          (release_2_query, {"environments": [staging_env, prod_env]}, {group_a}),
          (release_2_query, {"environments": [staging_env]}, set()),
          (release_2_query, {"environments": [prod_env]}, {group_a}),
      )
      for query, env_kwargs, expected_groups in cases:
          results = self.make_query(search_filter_query=query, **env_kwargs)
          assert set(results) == expected_groups
  def test_all_fields_do_not_error(self):
      """Sanity check that every key in SENTRY_SNUBA_MAP can be searched on.

      The goal is only to confirm the queries run without type errors and
      other schema related issues; no results are asserted.
      """

      def assert_query_runs(query):
          # Convert a SnubaError into a test failure naming the offending query.
          try:
              self.make_query(search_filter_query=query)
          except SnubaError as exc:
              self.fail(f"Query {query} errored. Error info: {exc}")

      skipped_keys = ("project.id", "issue.id")
      for key in SENTRY_SNUBA_MAP:
          if key in skipped_keys:
              continue

          assert_query_runs("has:%s" % key)
          assert_query_runs("!has:%s" % key)

          # Choose a value matching the key's category. Only the last two
          # categories are additionally exercised in negated form.
          also_negated = False
          if key == "error.handled":
              val = 1
          elif key in issue_search_config.numeric_keys:
              val = "123"
          elif key in issue_search_config.date_keys:
              val = self.base_datetime.isoformat()
          elif key in issue_search_config.boolean_keys:
              val = "true"
          elif key in {"trace.span", "trace.parent_span"}:
              val = "abcdef1234abcdef"
              also_negated = True
          else:
              val = "abadcafedeadbeefdeaffeedabadfeed"
              also_negated = True

          if also_negated:
              assert_query_runs(f"!{key}:{val}")
          assert_query_runs(f"{key}:{val}")
  1714. class CdcEventsSnubaSearchTest(TestCase, SnubaTestCase):
  @property
  def backend(self):
      """Return a new CdcEventsDatasetSnubaSearchBackend on every access."""
      search_backend = CdcEventsDatasetSnubaSearchBackend()
      return search_backend
  def setUp(self):
      """Store three events under two fingerprints and keep their groups and environments."""
      super().setUp()
      self.base_datetime = (datetime.utcnow() - timedelta(days=3)).replace(tzinfo=pytz.utc)

      group1_first_seen = self.base_datetime - timedelta(days=21)
      group2_first_seen = self.base_datetime - timedelta(days=20)

      # First fingerprint: oldest event, in production.
      self.event1 = self.store_event(
          data={
              "fingerprint": ["put-me-in-group1"],
              "event_id": "a" * 32,
              "environment": "production",
              "timestamp": iso_format(group1_first_seen),
              "tags": {"sentry:user": "user1"},
          },
          project_id=self.project.id,
      )
      self.env1 = self.event1.get_environment()
      self.group1 = self.event1.group

      # First fingerprint again: a later event, in staging, from another user.
      self.event3 = self.store_event(
          data={
              "fingerprint": ["put-me-in-group1"],
              "environment": "staging",
              "timestamp": iso_format(self.base_datetime),
              "tags": {"sentry:user": "user2"},
          },
          project_id=self.project.id,
      )

      # Second fingerprint: a single staging event.
      self.event2 = self.store_event(
          data={
              "fingerprint": ["put-me-in-group2"],
              "timestamp": iso_format(group2_first_seen),
              "environment": "staging",
              "tags": {"sentry:user": "user1"},
          },
          project_id=self.project.id,
      )
      self.group2 = self.event2.group
      self.env2 = self.event2.get_environment()
  def build_search_filter(self, query, projects=None, user=None, environments=None):
      """Parse `query` and convert its values, defaulting to the test's user and project."""
      if user is None:
          user = self.user
      if projects is None:
          projects = [self.project]
      parsed_query = parse_search_query(query)
      return convert_query_values(parsed_query, projects, user, environments)
  def make_query(
      self,
      projects=None,
      search_filter_query=None,
      environments=None,
      sort_by="date",
      limit=None,
      count_hits=False,
      date_from=None,
      date_to=None,
      cursor=None,
  ):
      """Run a query against `self.backend` and return whatever it returns.

      `projects` defaults to `[self.project]`. A `search_filter_query` string,
      when given, is turned into search filters via `build_search_filter`;
      otherwise an empty filter list is used. `limit` is only forwarded to the
      backend when it is not None.
      """
      if projects is None:
          projects = [self.project]

      if search_filter_query is None:
          search_filters = []
      else:
          search_filters = self.build_search_filter(
              search_filter_query, projects, environments=environments
          )

      query_kwargs = {
          "search_filters": search_filters,
          "environments": environments,
          "count_hits": count_hits,
          "sort_by": sort_by,
          "date_from": date_from,
          "date_to": date_to,
          "cursor": cursor,
      }
      # Omit `limit` entirely when the caller did not set one.
      if limit is not None:
          query_kwargs["limit"] = limit

      return self.backend.query(projects, **query_kwargs)
  def run_test(
      self,
      search_filter_query,
      expected_groups,
      expected_hits,
      projects=None,
      environments=None,
      sort_by="date",
      limit=None,
      count_hits=False,
      date_from=None,
      date_to=None,
      cursor=None,
  ):
      """Run `make_query`, assert on its groups and hit count, and return the results.

      `expected_groups` is compared against `list(results)`, so order matters;
      `expected_hits` is compared against `results.hits`.
      """
      query_options = {
          "projects": projects,
          "search_filter_query": search_filter_query,
          "environments": environments,
          "sort_by": sort_by,
          "limit": limit,
          "count_hits": count_hits,
          "date_from": date_from,
          "date_to": date_to,
          "cursor": cursor,
      }
      results = self.make_query(**query_options)

      actual_groups = list(results)
      assert actual_groups == expected_groups
      assert results.hits == expected_hits
      return results
  def test(self):
      """`is:unresolved` returns group1 then group2, with `hits` left as None."""
      expected_order = [self.group1, self.group2]
      self.run_test("is:unresolved", expected_order, None)
  def test_invalid(self):
      """The query `is:unresolved abc:123` raises InvalidQueryForExecutor."""
      unsupported_query = "is:unresolved abc:123"
      with self.assertRaises(InvalidQueryForExecutor):
          self.make_query(search_filter_query=unsupported_query)
  def test_resolved_group(self):
      """Resolve group2, store it, and check the `is:` status filters."""
      resolved_group = self.group2
      resolved_group.status = GroupStatus.RESOLVED
      resolved_group.save()
      self.store_group(resolved_group)

      self.run_test("is:unresolved", [self.group1], None)
      self.run_test("is:resolved", [resolved_group], None)
      # Both status filters together are expected to match nothing.
      self.run_test("is:unresolved is:resolved", [], None)
  def test_environment(self):
      """Restrict `is:unresolved` to a single environment at a time."""
      expected_by_environment = (
          (self.env1, [self.group1]),
          (self.env2, [self.group1, self.group2]),
      )
      for environment, expected_groups in expected_by_environment:
          self.run_test("is:unresolved", expected_groups, None, environments=[environment])
  def test_sort_times_seen(self):
      """`sort_by="freq"` ordering flips after two more events are stored for group2's fingerprint."""
      self.run_test(
          "is:unresolved",
          [self.group1, self.group2],
          None,
          sort_by="freq",
          date_from=self.base_datetime - timedelta(days=30),
      )

      # Two additional events carrying the "put-me-in-group2" fingerprint.
      self.store_event(
          data={
              "fingerprint": ["put-me-in-group2"],
              "timestamp": iso_format(self.base_datetime - timedelta(days=15)),
          },
          project_id=self.project.id,
      )
      self.store_event(
          data={
              "fingerprint": ["put-me-in-group2"],
              "timestamp": iso_format(self.base_datetime - timedelta(days=10)),
              "tags": {"sentry:user": "user2"},
          },
          project_id=self.project.id,
      )

      # Change the date range to bust the cache
      cache_busting_start = self.base_datetime - timedelta(days=29)
      self.run_test(
          "is:unresolved",
          [self.group2, self.group1],
          None,
          sort_by="freq",
          date_from=cache_busting_start,
      )
  def test_sort_first_seen(self):
      """`sort_by="new"` puts a group stored with a later timestamp first."""
      self.run_test(
          "is:unresolved",
          [self.group2, self.group1],
          None,
          sort_by="new",
          date_from=self.base_datetime - timedelta(days=30),
      )

      # A new fingerprint whose only event is one day after base_datetime.
      newest_event = self.store_event(
          data={
              "fingerprint": ["put-me-in-group3"],
              "timestamp": iso_format(self.base_datetime + timedelta(days=1)),
          },
          project_id=self.project.id,
      )
      group3 = newest_event.group

      # Change the date range to bust the cache
      cache_busting_start = self.base_datetime - timedelta(days=29)
      self.run_test(
          "is:unresolved",
          [group3, self.group2, self.group1],
          None,
          sort_by="new",
          date_from=cache_busting_start,
      )
  def test_sort_user(self):
      """Check `sort_by="user"` ordering before and after storing more tagged events."""
      self.run_test(
          "is:unresolved",
          [self.group1, self.group2],
          None,
          sort_by="user",
          date_from=self.base_datetime - timedelta(days=30),
      )

      # Two events per fingerprint, all one day after base_datetime; each
      # fingerprint gets the same user tag on both of its new events.
      additional_events = (
          ("put-me-in-group2", "user2"),
          ("put-me-in-group2", "user2"),
          ("put-me-in-group1", "user1"),
          ("put-me-in-group1", "user1"),
      )
      for fingerprint, user_tag in additional_events:
          self.store_event(
              data={
                  "fingerprint": [fingerprint],
                  "timestamp": iso_format(self.base_datetime + timedelta(days=1)),
                  "tags": {"sentry:user": user_tag},
              },
              project_id=self.project.id,
          )

      # Test group with no users, which can return a null count
      userless_event = self.store_event(
          data={
              "fingerprint": ["put-me-in-group3"],
              "timestamp": iso_format(self.base_datetime + timedelta(days=1)),
          },
          project_id=self.project.id,
      )
      group3 = userless_event.group

      # Change the date range to bust the cache
      cache_busting_start = self.base_datetime - timedelta(days=29)
      self.run_test(
          "is:unresolved",
          [self.group2, self.group1, group3],
          None,
          sort_by="user",
          date_from=cache_busting_start,
      )
  def test_sort_priority(self):
      """`sort_by="priority"` returns group1 before group2 for the fixture events."""
      window_start = self.base_datetime - timedelta(days=30)
      expected_order = [self.group1, self.group2]
      self.run_test(
          "is:unresolved",
          expected_order,
          None,
          sort_by="priority",
          date_from=window_start,
      )
  def test_cursor(self):
      """Page forwards and backwards through `is:unresolved` results using cursors."""
      group3 = self.store_event(
          data={
              "fingerprint": ["put-me-in-group3"],
              "timestamp": iso_format(self.base_datetime + timedelta(days=1)),
              "tags": {"sentry:user": "user2"},
          },
          project_id=self.project.id,
      ).group
      group4 = self.store_event(
          data={
              "fingerprint": ["put-me-in-group7"],
              "timestamp": iso_format(self.base_datetime + timedelta(days=2)),
              "tags": {"sentry:user": "user2"},
          },
          project_id=self.project.id,
      ).group

      query = "is:unresolved"
      # Every page is expected to report 4 total hits.
      total_hits = 4

      first_page = self.run_test(query, [group4], total_hits, limit=1, count_hits=True)
      second_page = self.run_test(
          query, [group3], total_hits, limit=1, cursor=first_page.next, count_hits=True
      )
      # Stepping back from the second page returns the first page's group.
      first_page_again = self.run_test(
          query, [group4], total_hits, limit=1, cursor=second_page.prev, count_hits=True
      )
      # A larger page size from the same position returns the next two groups.
      self.run_test(
          query,
          [group3, self.group1],
          total_hits,
          limit=2,
          cursor=first_page_again.next,
          count_hits=True,
      )
  def test_rechecking(self):
      """A group resolved only in the database is still excluded from `is:unresolved`."""
      resolved_group = self.group2
      resolved_group.status = GroupStatus.RESOLVED
      resolved_group.save()

      # Explicitly avoid calling `store_group` here. This means that Clickhouse will still see
      # this group as `UNRESOLVED` and it will be returned in the snuba results. This group
      # should still be filtered out by our recheck.
      self.run_test("is:unresolved", [self.group1], None)