3 лет назад · d0ec2a94ba
--- a/src/sentry/api/endpoints/organization_events_facets_performance.py
+++ b/src/sentry/api/endpoints/organization_events_facets_performance.py
@@ -1,5 +1,5 @@
 
				 import math
			
 
				-from typing import Any, Dict, Mapping, Optional
			
 
				+from typing import Any, Dict, List, Mapping, Optional
			
 
				 
			
 
				 import sentry_sdk
			
 
				 from django.http import Http404
			
@@ -9,6 +9,7 @@ from rest_framework.response import Response
 
				 from sentry import features, tagstore
			
 
				 from sentry.api.bases import NoProjects, OrganizationEventsV2EndpointBase
			
 
				 from sentry.api.paginator import GenericOffsetPaginator
			
 
				+from sentry.search.events.filter import get_filter
			
 
				 from sentry.snuba import discover
			
 
				 from sentry.utils.snuba import Dataset
			
 
				 
			
@@ -128,32 +129,53 @@ class OrganizationEventsFacetsPerformanceHistogramEndpoint(
 
				             return Response([])
			
 
				 
			
 
				         tag_key = request.GET.get("tagKey")
			
 
				+        tag_key_limit = request.GET.get("tagKeyLimit")
			
 
				+        num_buckets_per_key = request.GET.get("numBucketsPerKey")
			
 
				+
			
 
				+        if not tag_key_limit:
			
 
				+            raise ParseError(detail="'tagKeyLimit' must be provided for the performance histogram.")
			
 
				+        if not num_buckets_per_key:
			
 
				+            raise ParseError(
			
 
				+                detail="'numBucketsPerKey' must be provided for the performance histogram."
			
 
				+            )
			
 
				+        try:
			
 
				+            tag_key_limit = int(tag_key_limit)
			
 
				+            num_buckets_per_key = int(num_buckets_per_key)
			
 
				+        except ValueError:
			
 
				+            raise ParseError(detail="Bucket and tag key limits must be numeric.")
			
 
				+
			
 
				+        if tag_key_limit * num_buckets_per_key > 500:
			
 
				+            raise ParseError(
			
 
				+                detail="The number of total buckets ('tagKeyLimit' * 'numBucketsPerKey') cannot exceed 500"
			
 
				+            )
			
 
				 
			
 
				         if not tag_key:
			
 
				             raise ParseError(detail="'tagKey' must be provided when using histograms.")
			
 
				 
			
 
				-        def data_fn(offset, limit):
			
 
				+        def data_fn():
			
 
				             with sentry_sdk.start_span(op="discover.endpoint", description="discover_query"):
			
 
				-                referrer = "api.organization-events-facets-performance-histogram.top-tags"
			
 
				-                tag_data = query_tag_data(
			
 
				+                referrer = "api.organization-events-facets-performance-histogram"
			
 
				+                top_tags = query_top_tags(
			
 
				+                    tag_key=tag_key,
			
 
				+                    limit=tag_key_limit,
			
 
				                     filter_query=filter_query,
			
 
				-                    aggregate_column=aggregate_column,
			
 
				-                    referrer=referrer,
			
 
				                     params=params,
			
 
				+                    referrer=referrer,
			
 
				                 )
			
 
				 
			
 
				-                if not tag_data:
			
 
				+                if not top_tags:
			
 
				                     return {"data": []}
			
 
				 
			
 
				                 results = query_facet_performance_key_histogram(
			
 
				-                    tag_data=tag_data,
			
 
				+                    top_tags=top_tags,
			
 
				                     tag_key=tag_key,
			
 
				                     filter_query=filter_query,
			
 
				                     aggregate_column=aggregate_column,
			
 
				                     referrer=referrer,
			
 
				                     orderby=self.get_orderby(request),
			
 
				                     params=params,
			
 
				-                    limit=limit,
			
 
				+                    limit=tag_key_limit,
			
 
				+                    num_buckets_per_key=num_buckets_per_key,
			
 
				                 )
			
 
				 
			
 
				                 if not results:
			
@@ -167,23 +189,17 @@ class OrganizationEventsFacetsPerformanceHistogramEndpoint(
 
				 
			
 
				                 return results
			
 
				 
			
 
				-        with self.handle_query_errors():
			
 
				-            return self.paginate(
			
 
				-                request=request,
			
 
				-                paginator=GenericOffsetPaginator(data_fn=data_fn),
			
 
				-                on_results=lambda results: self.handle_results_with_meta(
			
 
				-                    request, organization, params["project_id"], results
			
 
				-                ),
			
 
				-                default_per_page=10,
			
 
				-                max_per_page=50,
			
 
				-            )
			
 
				+        results = data_fn()
			
 
				+        return Response(
			
 
				+            self.handle_results_with_meta(request, organization, params["project_id"], results)
			
 
				+        )
			
 
				 
			
 
				 
			
 
				 def query_tag_data(
			
 
				     params: Mapping[str, str],
			
 
				+    referrer: str,
			
 
				     filter_query: Optional[str] = None,
			
 
				     aggregate_column: Optional[str] = None,
			
 
				-    referrer: Optional[str] = None,
			
 
				 ) -> Optional[Dict]:
			
 
				     """
			
 
				     Fetch general data about all the transactions with this transaction name to feed into the facet query
			
@@ -194,7 +210,7 @@ def query_tag_data(
 
				         op="discover.discover", description="facets.filter_transform"
			
 
				     ) as span:
			
 
				         span.set_data("query", filter_query)
			
 
				-        snuba_filter = discover.get_filter(filter_query, params)
			
 
				+        snuba_filter = get_filter(filter_query, params)
			
 
				 
			
 
				         # Resolve the public aliases into the discover dataset names.
			
 
				         snuba_filter, translated_columns = discover.resolve_discover_aliases(snuba_filter)
			
@@ -229,13 +245,64 @@ def query_tag_data(
 
				     return tag_data["data"][0]
			
 
				 
			
 
				 
			
 
				+def query_top_tags(
			
 
				+    params: Mapping[str, str],
			
 
				+    tag_key: str,
			
 
				+    limit: int,
			
 
				+    referrer: str,
			
 
				+    filter_query: Optional[str] = None,
			
 
				+) -> Optional[List[Any]]:
			
 
				+    """
			
 
				+    Fetch counts by tag value, finding the top tag values for a tag key by a limit.
			
 
				+    :return: Returns the row with the value, the aggregate and the count if the query was successful
			
 
				+             Returns None if query was not successful which causes the endpoint to return early
			
 
				+    """
			
 
				+    with sentry_sdk.start_span(
			
 
				+        op="discover.discover", description="facets.filter_transform"
			
 
				+    ) as span:
			
 
				+        span.set_data("query", filter_query)
			
 
				+        snuba_filter = get_filter(filter_query, params)
			
 
				+
			
 
				+        # Resolve the public aliases into the discover dataset names.
			
 
				+        snuba_filter, translated_columns = discover.resolve_discover_aliases(snuba_filter)
			
 
				+
			
 
				+    with sentry_sdk.start_span(op="discover.discover", description="facets.top_tags"):
			
 
				+
			
 
				+        # Get the average and count to use to filter the next request to facets
			
 
				+        tag_data = discover.query(
			
 
				+            selected_columns=[
			
 
				+                "count()",
			
 
				+                "array_join(tags.value) as tags_value",
			
 
				+            ],
			
 
				+            query=filter_query,
			
 
				+            params=params,
			
 
				+            orderby=["-count"],
			
 
				+            conditions=[["tags_key", "IN", [tag_key]]],
			
 
				+            functions_acl=["array_join"],
			
 
				+            referrer=f"{referrer}.top_tags",
			
 
				+            limit=limit,
			
 
				+        )
			
 
				+
			
 
				+        if len(tag_data["data"]) <= 0:
			
 
				+            return None
			
 
				+
			
 
				+        counts = [r["count"] for r in tag_data["data"]]
			
 
				+
			
 
				+        # Return early to avoid doing more queries with 0 count transactions or aggregates for columns that dont exist
			
 
				+        if counts[0] == 0:
			
 
				+            return None
			
 
				+    if not tag_data["data"]:
			
 
				+        return None
			
 
				+    return tag_data["data"]
			
 
				+
			
 
				+
			
 
				 def query_facet_performance(
			
 
				     params: Mapping[str, str],
			
 
				     tag_data: Mapping[str, Any],
			
 
				+    referrer: str,
			
 
				     aggregate_column: Optional[str] = None,
			
 
				     filter_query: Optional[str] = None,
			
 
				     orderby: Optional[str] = None,
			
 
				-    referrer: Optional[str] = None,
			
 
				     limit: Optional[int] = None,
			
 
				     offset: Optional[int] = None,
			
 
				     all_tag_keys: Optional[bool] = None,
			
@@ -245,7 +312,7 @@ def query_facet_performance(
 
				         op="discover.discover", description="facets.filter_transform"
			
 
				     ) as span:
			
 
				         span.set_data("query", filter_query)
			
 
				-        snuba_filter = discover.get_filter(filter_query, params)
			
 
				+        snuba_filter = get_filter(filter_query, params)
			
 
				 
			
 
				         # Resolve the public aliases into the discover dataset names.
			
 
				         snuba_filter, translated_columns = discover.resolve_discover_aliases(snuba_filter)
			
@@ -337,18 +404,20 @@ def query_facet_performance(
 
				 
			
 
				 def query_facet_performance_key_histogram(
			
 
				     params: Mapping[str, str],
			
 
				-    tag_data: Mapping[str, Any],
			
 
				+    top_tags: List[Any],
			
 
				     tag_key: str,
			
 
				+    num_buckets_per_key: int,
			
 
				+    limit: int,
			
 
				+    referrer: str,
			
 
				     aggregate_column: Optional[str] = None,
			
 
				     filter_query: Optional[str] = None,
			
 
				     orderby: Optional[str] = None,
			
 
				-    referrer: Optional[str] = None,
			
 
				-    limit: Optional[int] = None,
			
 
				 ) -> Dict:
			
 
				     precision = 0
			
 
				-    num_buckets = 100
			
 
				-    min_value = tag_data["min"]
			
 
				-    max_value = tag_data["max"]
			
 
				+
			
 
				+    tag_values = [x["tags_value"] for x in top_tags]
			
 
				+
			
 
				+    num_buckets = num_buckets_per_key * limit
			
 
				 
			
 
				     results = discover.histogram_query(
			
 
				         [aggregate_column],
			
@@ -356,12 +425,13 @@ def query_facet_performance_key_histogram(
 
				         params,
			
 
				         num_buckets,
			
 
				         precision,
			
 
				-        min_value=min_value,
			
 
				-        max_value=max_value,
			
 
				         referrer="api.organization-events-facets-performance-histogram",
			
 
				-        limit_by=[limit, "tags_key"] if limit else None,
			
 
				         group_by=["tags_value", "tags_key"],
			
 
				-        extra_conditions=[["tags_key", "IN", [tag_key]]],
			
 
				+        limit_by=[num_buckets_per_key, "tags_value"],
			
 
				+        extra_conditions=[
			
 
				+            ["tags_key", "IN", [tag_key]],
			
 
				+            ["tags_value", "IN", tag_values],
			
 
				+        ],
			
 
				         normalize_results=False,
			
 
				     )
			
 
				     return results
			
--- a/src/sentry/snuba/discover.py
+++ b/src/sentry/snuba/discover.py
@@ -940,7 +940,7 @@ def histogram_query(
 
				         conditions.append([key_alias, "IN", field_names])
			
 
				 
			
 
				     if extra_conditions:
			
 
				-        conditions.append(extra_conditions)
			
 
				+        conditions.extend(extra_conditions)
			
 
				 
			
 
				     histogram_params = find_histogram_params(num_buckets, min_value, max_value, multiplier)
			
 
				     histogram_column = get_histogram_column(fields, key_column, histogram_params, array_column)
			
--- a/static/app/utils/performance/segmentExplorer/tagKeyHistogramQuery.tsx
+++ b/static/app/utils/performance/segmentExplorer/tagKeyHistogramQuery.tsx
@@ -34,6 +34,8 @@ type ChildrenProps = Omit<GenericChildrenProps<TableData>, 'tableData'> & {
 
				 type QueryProps = DiscoverQueryProps & {
			
 
				   aggregateColumn: string;
			
 
				   tagKey: string;
			
 
				+  tagKeyLimit: number;
			
 
				+  numBucketsPerKey: number;
			
 
				   sort?: string | string[];
			
 
				   children: (props: ChildrenProps) => React.ReactNode;
			
 
				 };
			
@@ -41,6 +43,8 @@ type QueryProps = DiscoverQueryProps & {
 
				 type FacetQuery = LocationQuery &
			
 
				   EventQuery & {
			
 
				     tagKey?: string;
			
 
				+    tagKeyLimit?: number;
			
 
				+    numBucketsPerKey?: number;
			
 
				     sort?: string | string[];
			
 
				     aggregateColumn?: string;
			
 
				   };
			
@@ -53,6 +57,8 @@ export function getRequestFunction(_props: QueryProps) {
 
				     apiPayload.aggregateColumn = aggregateColumn;
			
 
				     apiPayload.sort = _props.sort ? _props.sort : '-sumdelta';
			
 
				     apiPayload.tagKey = _props.tagKey;
			
 
				+    apiPayload.tagKeyLimit = _props.tagKeyLimit;
			
 
				+    apiPayload.numBucketsPerKey = _props.numBucketsPerKey;
			
 
				     return apiPayload;
			
 
				   }
			
 
				   return getTagExplorerRequestPayload;
			
--- a/static/app/views/performance/transactionSummary/transactionTags/tagsDisplay.tsx
+++ b/static/app/views/performance/transactionSummary/transactionTags/tagsDisplay.tsx
@@ -23,7 +23,9 @@ type Props = {
 
				 };
			
 
				 
			
 
				 const TAG_VALUE_LIMIT = 10;
			
 
				-const HISTOGRAM_BUCKET_LIMIT = 20;
			
 
				+
			
 
				+const HISTOGRAM_TAG_KEY_LIMIT = 8;
			
 
				+const HISTOGRAM_BUCKET_LIMIT = 50;
			
 
				 
			
 
				 const TagsDisplay = (props: Props) => {
			
 
				   const {eventView, location, organization, projects, tagKey} = props;
			
@@ -42,7 +44,8 @@ const TagsDisplay = (props: Props) => {
 
				         orgSlug={organization.slug}
			
 
				         location={location}
			
 
				         aggregateColumn={aggregateColumn}
			
 
				-        limit={HISTOGRAM_BUCKET_LIMIT}
			
 
				+        tagKeyLimit={HISTOGRAM_TAG_KEY_LIMIT}
			
 
				+        numBucketsPerKey={HISTOGRAM_BUCKET_LIMIT}
			
 
				         tagKey={tagKey}
			
 
				         sort="-frequency"
			
 
				       >
			
--- a/tests/snuba/api/endpoints/test_organization_events_facets_performance_histogram.py
+++ b/tests/snuba/api/endpoints/test_organization_events_facets_performance_histogram.py
@@ -107,12 +107,51 @@ class OrganizationEventsFacetsPerformanceHistogramEndpointTest(SnubaTestCase, AP
 
				         )
			
 
				         assert error_response.status_code == 404
			
 
				 
			
 
				+    def test_tag_key_limit_error(self):
			
 
				+        request = {
			
 
				+            "aggregateColumn": "transaction.duration",
			
 
				+            "sort": "-frequency",
			
 
				+            "per_page": 5,
			
 
				+            "statsPeriod": "14d",
			
 
				+            "query": "(color:red or color:blue)",
			
 
				+        }
			
 
				+        # With feature access, no tag key
			
 
				+        error_response = self.do_request(
			
 
				+            request, feature_list=self.feature_list + ("organizations:performance-tag-page",)
			
 
				+        )
			
 
				+
			
 
				+        assert error_response.status_code == 400, error_response.content
			
 
				+        assert error_response.data == {
			
 
				+            "detail": "'tagKeyLimit' must be provided for the performance histogram."
			
 
				+        }
			
 
				+
			
 
				+    def test_num_buckets_error(self):
			
 
				+        request = {
			
 
				+            "aggregateColumn": "transaction.duration",
			
 
				+            "sort": "-frequency",
			
 
				+            "per_page": 5,
			
 
				+            "statsPeriod": "14d",
			
 
				+            "query": "(color:red or color:blue)",
			
 
				+            "tagKeyLimit": 5,
			
 
				+        }
			
 
				+        # With feature access, no tag key
			
 
				+        error_response = self.do_request(
			
 
				+            request, feature_list=self.feature_list + ("organizations:performance-tag-page",)
			
 
				+        )
			
 
				+
			
 
				+        assert error_response.status_code == 400, error_response.content
			
 
				+        assert error_response.data == {
			
 
				+            "detail": "'numBucketsPerKey' must be provided for the performance histogram."
			
 
				+        }
			
 
				+
			
 
				     def test_tag_key_histograms(self):
			
 
				         request = {
			
 
				             "aggregateColumn": "transaction.duration",
			
 
				             "sort": "-frequency",
			
 
				             "per_page": 5,
			
 
				             "statsPeriod": "14d",
			
 
				+            "tagKeyLimit": 10,
			
 
				+            "numBucketsPerKey": 10,
			
 
				             "query": "(color:red or color:blue)",
			
 
				         }
			
 
				         # With feature access, no tag key
			
@@ -139,3 +178,48 @@ class OrganizationEventsFacetsPerformanceHistogramEndpointTest(SnubaTestCase, AP
 
				         assert histogram_data[1]["histogram_transaction_duration_50000_1000000_1"] == 4000000.0
			
 
				         assert histogram_data[1]["tags_value"] == "blue"
			
 
				         assert histogram_data[1]["tags_key"] == "color"
			
 
				+
			
 
				+    def test_tag_key_histogram_buckets(self):
			
 
				+        request = {
			
 
				+            "aggregateColumn": "transaction.duration",
			
 
				+            "sort": "-frequency",
			
 
				+            "per_page": 5,
			
 
				+            "statsPeriod": "14d",
			
 
				+            "tagKeyLimit": 1,
			
 
				+            "numBucketsPerKey": 2,
			
 
				+            "tagKey": "color",
			
 
				+            "query": "(color:red or color:blue or color:green)",
			
 
				+        }
			
 
				+
			
 
				+        data_response = self.do_request(
			
 
				+            request, feature_list=self.feature_list + ("organizations:performance-tag-page",)
			
 
				+        )
			
 
				+
			
 
				+        histogram_data = data_response.data["data"]
			
 
				+        assert len(histogram_data) == 1
			
 
				+        assert histogram_data[0]["count"] == 14
			
 
				+        assert histogram_data[0]["histogram_transaction_duration_2500000_0_1"] == 0.0
			
 
				+        assert histogram_data[0]["tags_value"] == "red"
			
 
				+        assert histogram_data[0]["tags_key"] == "color"
			
 
				+
			
 
				+        request["tagKeyLimit"] = 3
			
 
				+        data_response = self.do_request(
			
 
				+            request, feature_list=self.feature_list + ("organizations:performance-tag-page",)
			
 
				+        )
			
 
				+
			
 
				+        histogram_data = data_response.data["data"]
			
 
				+        assert len(histogram_data) == 3
			
 
				+        assert histogram_data[0]["count"] == 14
			
 
				+        assert histogram_data[0]["histogram_transaction_duration_750000_750000_1"] == 750000.0
			
 
				+        assert histogram_data[0]["tags_value"] == "red"
			
 
				+        assert histogram_data[0]["tags_key"] == "color"
			
 
				+
			
 
				+        assert histogram_data[1]["count"] == 5
			
 
				+        assert histogram_data[1]["histogram_transaction_duration_750000_750000_1"] == 3750000.0
			
 
				+        assert histogram_data[1]["tags_value"] == "blue"
			
 
				+        assert histogram_data[1]["tags_key"] == "color"
			
 
				+
			
 
				+        assert histogram_data[2]["count"] == 1
			
 
				+        assert histogram_data[2]["histogram_transaction_duration_750000_750000_1"] == 4500000.0
			
 
				+        assert histogram_data[2]["tags_value"] == "green"
			
 
				+        assert histogram_data[2]["tags_key"] == "color"