123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206 |
- import copy
- import itertools
- import re
- from os.path import splitext
- from typing import TYPE_CHECKING
- from urllib.parse import urlsplit
- from symbolic import SourceMapView, SourceView
- from apps.sourcecode.models import DebugSymbolBundle
- from sentry.utils.safe import get_path
- if TYPE_CHECKING:
- from .schema import IssueEventSchema, StackTrace, StackTraceFrame
- UNKNOWN_MODULE = "<unknown module>"
- CLEAN_MODULE_RE = re.compile(
- r"""^
- (?:/| # Leading slashes
- (?:
- (?:java)?scripts?|js|build|static|node_modules|bower_components|[_\.~].*?| # common folder prefixes
- v?(?:\d+\.)*\d+| # version numbers, v1, 1.0.0
- [a-f0-9]{7,8}| # short sha
- [a-f0-9]{32}| # md5
- [a-f0-9]{40} # sha1
- )/)+|
- (?:[-\.][a-f0-9]{7,}$) # Ending in a commitish
- """,
- re.X | re.I,
- )
- VERSION_RE = re.compile(r"^[a-f0-9]{32}|[a-f0-9]{40}$", re.I)
- NODE_MODULES_RE = re.compile(r"\bnode_modules/")
- def generate_module(src):
- """
- Converts a url into a made-up module name by doing the following:
- * Extract just the path name ignoring querystrings
- * Trimming off the initial /
- * Trimming off the file extension
- * Removes off useless folder prefixes
- e.g. http://google.com/js/v1.0/foo/bar/baz.js -> foo/bar/baz
- """
- if not src:
- return UNKNOWN_MODULE
- filename, _ = splitext(urlsplit(src).path)
- if filename.endswith(".min"):
- filename = filename[:-4]
- tokens = filename.split("/")
- for idx, token in enumerate(tokens):
- # a SHA
- if VERSION_RE.match(token):
- return "/".join(tokens[idx + 1 :])
- return CLEAN_MODULE_RE.sub("", filename) or UNKNOWN_MODULE
- class JavascriptEventProcessor:
- """
- Based partially on sentry/lang/javascript/processor.py
- """
- def __init__(
- self,
- release_id: int,
- data: "IssueEventSchema",
- debug_bundles: list[DebugSymbolBundle],
- ):
- self.release_id = release_id
- self.data = data
- self.debug_bundles = debug_bundles
- def get_stacktraces(self) -> list["StackTrace"]:
- data = self.data
- if data.exception and not isinstance(data.exception, list):
- return [e.stacktrace for e in data.exception.values if e.stacktrace]
- return []
- def get_valid_frames(self, stacktraces) -> list["StackTraceFrame"]:
- frames = [stacktrace.frames for stacktrace in stacktraces]
- merged = list(itertools.chain(*frames))
- return [f for f in merged if f is not None and f.lineno is not None]
- def process_frame(self, frame, map_file, minified_source):
- # Required to determine source
- if not frame.abs_path or not frame.lineno:
- return
- minified_source.blob.blob.seek(0)
- map_file.blob.blob.seek(0)
- sourcemap_view = SourceMapView.from_json_bytes(map_file.blob.blob.read())
- minified_source_view = SourceView.from_bytes(minified_source.blob.blob.read())
- token = sourcemap_view.lookup(
- frame.lineno - 1,
- frame.colno - 1,
- frame.function,
- minified_source_view,
- )
- if not token:
- return
- frame.lineno = token.src_line + 1
- frame.colno = token.src_col + 1
- if token.function_name:
- frame.function = token.function_name
- filename = token.src
- abs_path = frame.abs_path
- in_app = None
- # special case webpack support
- # abs_path will always be the full path with webpack:/// prefix.
- # filename will be relative to that
- if abs_path.startswith("webpack:"):
- filename = abs_path
- # webpack seems to use ~ to imply "relative to resolver root"
- # which is generally seen for third party deps
- # (i.e. node_modules)
- if "/~/" in filename:
- filename = "~/" + abs_path.split("/~/", 1)[-1]
- else:
- filename = filename.split("webpack:///", 1)[-1]
- # As noted above:
- # * [js/node] '~/' means they're coming from node_modules, so these are not app dependencies
- # * [node] sames goes for `./node_modules/` and '../node_modules/', which is used when bundling node apps
- # * [node] and webpack, which includes it's own code to bootstrap all modules and its internals
- # eg. webpack:///webpack/bootstrap, webpack:///external
- if (
- filename.startswith("~/")
- or "/node_modules/" in filename
- or not filename.startswith("./")
- ):
- in_app = False
- # And conversely, local dependencies start with './'
- elif filename.startswith("./"):
- in_app = True
- # We want to explicitly generate a webpack module name
- frame["module"] = generate_module(filename)
- elif "/node_modules/" in abs_path:
- in_app = False
- if abs_path.startswith("app:"):
- if filename and NODE_MODULES_RE.search(filename):
- in_app = False
- else:
- in_app = True
- frame.filename = filename
- if not frame.module and abs_path.startswith(
- ("http:", "https:", "webpack:", "app:")
- ):
- frame.module = generate_module(abs_path)
- if in_app is not None:
- frame.in_app = in_app
- # Extract frame context
- source_result = next(
- (x for x in sourcemap_view.iter_sources() if x[1] == token.src), None
- )
- if source_result is not None:
- sourceview = sourcemap_view.get_sourceview(source_result[0])
- source = sourceview.get_source().splitlines()
- pre_lines = max(0, token.src_line - 5)
- past_lines = min(len(source), token.src_line + 5)
- frame.context_line = source[token.src_line]
- frame.pre_context = source[pre_lines : token.src_line]
- frame.post_context = source[token.src_line + 1 : past_lines]
- def transform(self):
- stacktraces = self.get_stacktraces()
- frames = self.get_valid_frames(stacktraces)
- if not self.debug_bundles:
- return
- # Copy original stacktrace before modifying them
- for exception in get_path(
- self.data, "exception", "values", filter=True, default=()
- ):
- exception["raw_stacktrace"] = copy.deepcopy(exception["stacktrace"])
- frames_with_source = []
- for frame in frames:
- minified_filename = frame.abs_path.split("/")[-1] if frame.abs_path else ""
- minified_file = None
- map_file = None
- for debug_bundle in self.debug_bundles:
- # File name as given. When debug ids are used, this is based on the debug id
- file_name = debug_bundle.file.name
- # The code file name is the one given by the debug_meta source code image
- # When debug id is used, we must match on this name
- code_file = debug_bundle.data.get("code_file")
- if code_file: # Get name, not full path
- code_file = code_file.split("/")[-1]
- if minified_filename in [file_name, code_file]:
- minified_file = debug_bundle.file
- map_file = debug_bundle.sourcemap_file
- if map_file:
- frames_with_source.append((frame, map_file, minified_file))
- for frame_with_source in frames_with_source:
- self.process_frame(*frame_with_source)
|