123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371 |
- #!/usr/bin/env sh
- # Please, keep this script in sync with arcadia/ya
- # Shell commands follow
- # Next line is bilingual: it starts a comment in Python, but do nothing in shell
- """:"
- # Find a suitable python interpreter
- for cmd in python3 python; do
- command -v > /dev/null $cmd && exec "$(command -v $cmd)" "$0" "$@"
- done
- echo "Python interpreter is not found in this system, please, install python" >&2
- exit 2
- ":"""
- # Previous line is bilingual: it ends a comment in Python, but do nothing in shell
- # Shell commands end here
- # Python script follows
- import os
- import sys
- import platform
- RETRIES = 5
- HASH_PREFIX = 10
- REGISTRY_ENDPOINT = os.environ.get("YA_REGISTRY_ENDPOINT", "https://devtools-registry.s3.yandex.net")
- # Please do not change this dict, it is updated automatically
- # Start of mapping
- PLATFORM_MAP = {
- "data": {
- "darwin": {
- "md5": "f8eb20c1a507736a81834a17d047652b",
- "urls": [
- f"{REGISTRY_ENDPOINT}/5923491707"
- ]
- },
- "darwin-arm64": {
- "md5": "6a990034f3f6e23e5fbdbdb91302b523",
- "urls": [
- f"{REGISTRY_ENDPOINT}/5923490842"
- ]
- },
- "linux-aarch64": {
- "md5": "96beea81023bb48e268519a50c07419a",
- "urls": [
- f"{REGISTRY_ENDPOINT}/5923490453"
- ]
- },
- "win32-clang-cl": {
- "md5": "87eb5f132bcb294f0127a505d00f0735",
- "urls": [
- f"{REGISTRY_ENDPOINT}/5923492435"
- ]
- },
- "linux": {
- "md5": "6062cf519b6899fcd49422749e8f35ae",
- "urls": [
- f"{REGISTRY_ENDPOINT}/5923493257"
- ]
- }
- }
- } # End of mapping
- def create_dirs(path):
- try:
- os.makedirs(path)
- except OSError as e:
- import errno
- if e.errno != errno.EEXIST:
- raise
- return path
- def home_dir():
- # Do not trust $HOME, as it is unreliable in certain environments
- # Temporarily delete os.environ["HOME"] to force reading current home directory from /etc/passwd
- home_from_env = os.environ.pop("HOME", None)
- try:
- home_from_passwd = os.path.expanduser("~")
- if os.path.isabs(home_from_passwd):
- # This home dir is valid, prefer it over $HOME
- return home_from_passwd
- else:
- # When python is built with musl (this is quire weird though),
- # only users from /etc/passwd will be properly resolved,
- # as musl does not have nss module for LDAP integration.
- return home_from_env
- finally:
- if home_from_env is not None:
- os.environ["HOME"] = home_from_env
- def misc_root():
- return create_dirs(os.getenv('YA_CACHE_DIR') or os.path.join(home_dir(), '.ya'))
- def tool_root():
- return create_dirs(os.getenv('YA_CACHE_DIR_TOOLS') or os.path.join(misc_root(), 'tools'))
- # TODO: remove when switched to S3, won't be needed in OSS
- def ya_token():
- def get_token_from_file():
- try:
- with open(os.environ.get('YA_TOKEN_PATH', os.path.join(home_dir(), '.ya_token')), 'r') as f:
- return f.read().strip()
- except:
- pass
- return os.getenv('YA_TOKEN') or get_token_from_file()
- TOOLS_DIR = tool_root()
- def uniq(size=6):
- import string
- import random
- return ''.join(random.choice(string.ascii_lowercase + string.digits) for _ in range(size))
- _ssl_is_tuned = False
- def _tune_ssl():
- global _ssl_is_tuned
- if _ssl_is_tuned:
- return
- try:
- import ssl
- ssl._create_default_https_context = ssl._create_unverified_context
- except AttributeError:
- pass
- try:
- import urllib3
- urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
- except (AttributeError, ImportError):
- pass
- _ssl_is_tuned = True
- def _fetch(url, into):
- import hashlib
- _tune_ssl()
- from urllib.request import urlopen
- from urllib.request import Request
- from urllib.parse import urlparse
- request = Request(str(url))
- # TODO: Remove when switched to S3 distribution
- request.add_header('User-Agent', 'ya-bootstrap')
- token = ya_token()
- if token:
- request.add_header('Authorization', 'OAuth {}'.format(token))
- md5 = hashlib.md5()
- sys.stderr.write('Downloading %s ' % url)
- sys.stderr.flush()
- conn = urlopen(request, timeout=10)
- sys.stderr.write('[')
- sys.stderr.flush()
- try:
- with open(into, 'wb') as f:
- while True:
- block = conn.read(1024 * 1024)
- sys.stderr.write('.')
- sys.stderr.flush()
- if block:
- md5.update(block)
- f.write(block)
- else:
- break
- return md5.hexdigest()
- finally:
- sys.stderr.write('] ')
- sys.stderr.flush()
- def _atomic_fetch(url, into, md5):
- tmp_dest = into + '.' + uniq()
- try:
- real_md5 = _fetch(url, tmp_dest)
- if real_md5 != md5:
- raise Exception('MD5 mismatched: %s differs from %s' % (real_md5, md5))
- os.rename(tmp_dest, into)
- sys.stderr.write('OK\n')
- except Exception as e:
- sys.stderr.write('ERROR: ' + str(e) + '\n')
- raise
- finally:
- try:
- os.remove(tmp_dest)
- except OSError:
- pass
- def _extract(path, into):
- import tarfile
- tar = tarfile.open(path, errorlevel=2)
- # tar.extractall() will try to set file ownership according to the attributes stored in the archive
- # by calling TarFile.chown() method.
- # As this information is hardly relevant to the point of deployment / extraction,
- # it will just fail (python2) if ya is executed with root euid, or silently set non-existent numeric owner (python3)
- # to the files being extracted.
- # mock it with noop to retain current user ownership.
- tar.chown = lambda *args, **kwargs: None
- tar.extractall(path=into)
- tar.close()
- def _get(urls, md5):
- dest_path = os.path.join(TOOLS_DIR, md5[:HASH_PREFIX])
- if not os.path.exists(dest_path):
- for iter in range(RETRIES):
- try:
- _atomic_fetch(urls[iter % len(urls)], dest_path, md5)
- break
- except Exception:
- if iter + 1 == RETRIES:
- raise
- else:
- import time
- time.sleep(iter)
- return dest_path
- def _get_dir(urls, md5, ya_name):
- dest_dir = os.path.join(TOOLS_DIR, md5[:HASH_PREFIX] + '_d')
- if os.path.isfile(os.path.join(dest_dir, ya_name)):
- return dest_dir
- try:
- packed_path = _get(urls, md5)
- except Exception:
- if os.path.isfile(os.path.join(dest_dir, ya_name)):
- return dest_dir
- raise
- tmp_dir = dest_dir + '.' + uniq()
- try:
- try:
- _extract(packed_path, tmp_dir)
- except Exception:
- if os.path.isfile(os.path.join(dest_dir, ya_name)):
- return dest_dir
- raise
- try:
- os.rename(tmp_dir, dest_dir)
- except OSError as e:
- import errno
- if e.errno != errno.ENOTEMPTY:
- raise
- return dest_dir
- finally:
- import shutil
- shutil.rmtree(tmp_dir, ignore_errors=True)
- try:
- os.remove(packed_path)
- except Exception:
- pass
- def _mine_repo_root():
- # We think that this script is located in the root of the repo.
- return os.path.dirname(os.path.realpath(__file__))
- def main():
- if not os.path.exists(TOOLS_DIR):
- os.makedirs(TOOLS_DIR)
- result_args = sys.argv[1:]
- meta = PLATFORM_MAP['data']
- my_platform = platform.system().lower()
- my_machine = platform.machine().lower()
- if my_platform == 'linux':
- if 'ppc64le' in platform.platform():
- my_platform = 'linux-ppc64le'
- elif 'aarch64' in platform.platform():
- my_platform = 'linux-aarch64'
- else:
- my_platform = 'linux_musl'
- if my_platform == 'darwin' and my_machine == 'arm64':
- my_platform = 'darwin-arm64'
- def _platform_key(target_platform):
- """match by max prefix length, prefer shortest"""
- def _key_for_platform(platform):
- return len(os.path.commonprefix([target_platform, platform])), -len(platform)
- return _key_for_platform
- best_key = max(meta.keys(), key=_platform_key(my_platform))
- value = meta[best_key]
- ya_name = {'win32': 'ya-bin.exe', 'win32-clang-cl': 'ya-bin.exe'}.get(best_key, 'ya-bin') # XXX
- ya_dir = _get_dir(value['urls'], value['md5'], ya_name)
- # Popen `args` must have `str` type
- ya_path = str(os.path.join(ya_dir, ya_name))
- env = os.environ.copy()
- if 'YA_SOURCE_ROOT' not in env:
- src_root = _mine_repo_root()
- if src_root is not None:
- env['YA_SOURCE_ROOT'] = src_root
- # Disable respawn for opensource/ya
- if __file__.endswith('ya/opensource/ya'):
- env['YA_NO_RESPAWN'] = os.environ.get('YA_NO_RESPAWN', '1')
- for env_name in [
- 'LD_PRELOAD',
- 'Y_PYTHON_SOURCE_ROOT',
- ]:
- if env_name in os.environ:
- sys.stderr.write(
- "Warn: {}='{}' is specified and may affect the correct operation of the ya\n".format(
- env_name, env[env_name]
- )
- )
- if os.name == 'nt':
- import subprocess
- p = subprocess.Popen([ya_path] + result_args, env=env)
- p.wait()
- sys.exit(p.returncode)
- else:
- os.execve(ya_path, [ya_path] + result_args, env)
- if __name__ == '__main__':
- try:
- main()
- except Exception as e:
- sys.stderr.write('ERROR: ' + str(e) + '\n')
- from traceback import format_exc
- sys.stderr.write(format_exc() + "\n")
- sys.exit(1)
|