#!/usr/bin/env python3

"""
Update a Python package expression by passing in the `.nix` file, or the
directory containing it. You can pass in multiple files or paths.

You'll likely want to use
``
  $ ./update-python-libraries ../../pkgs/development/python-modules/*
``
to update all libraries in that folder.
"""

import argparse
import logging
import os
import re
import requests
import toolz
from concurrent.futures import ThreadPoolExecutor as Pool
from packaging.version import Version as _Version
from packaging.version import InvalidVersion
from packaging.specifiers import SpecifierSet
import collections
import collections.abc
import subprocess

# URL of the PyPI JSON index.
INDEX = "https://pypi.io/pypi"

# Permitted file extensions. These are evaluated from left to right and the
# first occurrence is returned.
EXTENSIONS = ['tar.gz', 'tar.bz2', 'tar', 'zip', '.whl']

PRERELEASES = False

# Name of the git executable used for committing updates.
GIT = "git"

logging.basicConfig(level=logging.INFO)


class Version(_Version, collections.abc.Sequence):
    """A `packaging` version that also behaves as a sequence of its release parts.

    Indexing, `len()` and iteration operate on the release tuple of the
    parsed version. The string the instance was built from is kept in
    `raw_version`.
    """

    def __init__(self, version):
        super().__init__(version)
        # We cannot use `str(Version(0.04.21))` because that becomes `0.4.21`
        # https://github.com/avian2/unidecode/issues/13#issuecomment-354538882
        self.raw_version = version

    # The public `release` property is used instead of the private
    # `_version` attribute so the class does not depend on `packaging`
    # internals.
    def __getitem__(self, i):
        return self.release[i]

    def __len__(self):
        return len(self.release)

    def __iter__(self):
        yield from self.release


def _get_values(attribute, text):
    """Match attribute in text and return all matches.

    Looks for occurrences of `<attribute> = "<value>";`.

    :param attribute: Attribute name; it is inserted into the regular
        expression as-is.
    :param text: Text of the Nix expression.
    :returns: List of matched values.
    """
    # Raw string: `\s` in a normal string literal is an invalid escape sequence.
    pattern = re.compile(r'{}\s+=\s+"(.*)";'.format(attribute))
    return pattern.findall(text)


def _get_unique_value(attribute, text):
    """Match attribute in text and return unique match.

    :returns: Single match.
    :raises ValueError: If the attribute is matched zero times or more than once.
    """
    values = _get_values(attribute, text)
    n = len(values)
    if n > 1:
        raise ValueError("found too many values for {}".format(attribute))
    elif n == 1:
        return values[0]
    else:
        raise ValueError("no value found for {}".format(attribute))


def _get_line_and_value(attribute, text):
    """Match attribute in text. Return the line and the value of the attribute.

    :returns: Tuple `(matched_assignment, value)`.
    :raises ValueError: If the attribute is matched zero times or more than once.
    """
    # Raw string: `\s` in a normal string literal is an invalid escape sequence.
    pattern = re.compile(r'({}\s+=\s+"(.*)";)'.format(attribute))
    matches = pattern.findall(text)
    n = len(matches)
    if n > 1:
        raise ValueError("found too many values for {}".format(attribute))
    elif n == 1:
        return matches[0]
    else:
        raise ValueError("no value found for {}".format(attribute))


def _replace_value(attribute, value, text):
    """Search and replace value of attribute in text.

    :returns: The text with the attribute's value replaced by `value`.
    :raises ValueError: If the attribute is not matched exactly once.
    """
    old_line, old_value = _get_line_and_value(attribute, text)
    # Replace the quoted value rather than the bare value: a bare replace
    # would also rewrite the attribute name when the old value happens to be
    # a substring of it, and would insert `value` between every character
    # when the old value is empty.
    new_line = old_line.replace('"{}"'.format(old_value), '"{}"'.format(value))
    return text.replace(old_line, new_line)


def _fetch_page(url):
    """Fetch `url` and return the decoded JSON body.

    :raises ValueError: If the response status is not OK.
    """
    r = requests.get(url)
    if r.status_code == requests.codes.ok:
        return r.json()
    else:
        raise ValueError("request for {} failed".format(url))


SEMVER = {
    'major' : 0,
    'minor' : 1,
    'patch' : 2,
}


def _get_latest_version_pypi(package, extension, current_version, target):
    """Get latest version and hash from PyPI.

    `current_version` and `target` are accepted so that all fetchers share
    one signature; this function does not use them.

    :returns: Tuple `(version, sha256)`; `sha256` is `None` when no release
        file ends with `extension`.
    :raises KeyError: If the index lists no releases for the latest version.
    :raises ValueError: If the index request fails.
    """
    url = "{}/{}/json".format(INDEX, package)
    data = _fetch_page(url)
    version = data['info']['version']
    try:
        releases = data['releases'][version]
    except KeyError as e:
        raise KeyError('Could not find version {} for {}'.format(version, package)) from e

    for release in releases:
        if release['filename'].endswith(extension):
            # TODO: In case of wheel we need to do further checks!
            sha256 = release['digests']['sha256']
            break
    else:
        logging.error("Release not found for extension: {}".format(extension))
        sha256 = None
    return version, sha256


def _get_latest_version_github(package, extension, current_version, target):
    """Placeholder fetcher for GitHub sources; always raises `ValueError`."""
    raise ValueError("updating from GitHub is not yet supported.")


# Maps the fetcher name used in a Nix expression to the function that looks
# up the latest version for it.
FETCHERS = {
    'fetchFromGitHub' : _get_latest_version_github,
    'fetchPypi' : _get_latest_version_pypi,
    'fetchurl' : _get_latest_version_pypi,
}


DEFAULT_SETUPTOOLS_EXTENSION = 'tar.gz'


# Maps the `format` attribute of an expression to a file extension.
FORMATS = {
    'setuptools' : DEFAULT_SETUPTOOLS_EXTENSION,
    'wheel' : 'whl'
}


def _determine_fetcher(text):
    """Return the name of the single fetcher used as `src` in the expression.

    :raises ValueError: If `src = <fetcher>` occurs zero times or more than
        once (counting every occurrence of every known fetcher).
    """
    # Count occurrences of fetchers.
    counts = {
        fetcher: text.count('src = {}'.format(fetcher))
        for fetcher in FETCHERS
    }
    nfetchers = sum(counts.values())
    if nfetchers == 0:
        raise ValueError("no fetcher.")
    elif nfetchers > 1:
        raise ValueError("multiple fetchers.")
    # Exactly one occurrence in total, so exactly one fetcher has a count.
    return next(fetcher for fetcher, count in counts.items() if count)


def _determine_extension(text, fetcher):
    """Determine what extension is used in the expression.

    If we use:
    - fetchPypi, we use the `extension` attribute if given, otherwise the
      extension implied by the `format` attribute (default: setuptools).
    - fetchurl, we determine the extension from the url.
    - fetchFromGitHub, we raise because it is not implemented.

    :raises ValueError: For Flit packages, non-PyPI urls and GitHub sources.
    """
    if fetcher == 'fetchPypi':
        try:
            src_format = _get_unique_value('format', text)
        except ValueError:
            src_format = None  # format was not given

        try:
            extension = _get_unique_value('extension', text)
        except ValueError:
            extension = None  # extension was not given

        if extension is None:
            if src_format is None:
                src_format = 'setuptools'
            elif src_format == 'flit':
                raise ValueError("Don't know how to update a Flit package.")
            extension = FORMATS[src_format]

    elif fetcher == 'fetchurl':
        url = _get_unique_value('url', text)
        # Only the last suffix is returned (including its leading dot).
        extension = os.path.splitext(url)[1]
        if 'pypi' not in url:
            raise ValueError('url does not point to PyPI.')

    elif fetcher == 'fetchFromGitHub':
        raise ValueError('updating from GitHub is not yet implemented.')

    return extension


def _update_package(path, target):
    """Update the expression at `path` to the latest available version.

    The file is rewritten only after both the new version and the new hash
    have been substituted successfully.

    :returns: `False` when no update is available, otherwise a dict with the
        keys `path`, `target`, `pname`, `old_version` and `new_version`.
    :raises ValueError: If the expression cannot be parsed, the new version
        would be a downgrade, or no matching file is available.
    """
    # Read the expression
    with open(path, 'r') as f:
        text = f.read()

    # Determine pname.
    pname = _get_unique_value('pname', text)

    # Determine version.
    version = _get_unique_value('version', text)

    # First we check how many fetchers are mentioned.
    fetcher = _determine_fetcher(text)

    extension = _determine_extension(text, fetcher)

    new_version, new_sha256 = FETCHERS[fetcher](pname, extension, version, target)

    if new_version == version:
        logging.info("Path {}: no update available for {}.".format(path, pname))
        return False
    elif Version(new_version) <= Version(version):
        raise ValueError("downgrade for {}.".format(pname))
    if not new_sha256:
        raise ValueError("no file available for {}.".format(pname))

    text = _replace_value('version', new_version, text)
    text = _replace_value('sha256', new_sha256, text)

    with open(path, 'w') as f:
        f.write(text)

    logging.info("Path {}: updated {} from {} to {}".format(path, pname, version, new_version))

    result = {
        'path' : path,
        'target': target,
        'pname': pname,
        'old_version' : version,
        'new_version' : new_version,
        #'fetcher' : fetcher,
    }

    return result


def _update(path, target):
    """Update the package at `path`, logging instead of raising on failure.

    :param path: A `.nix` file, or a directory containing `default.nix`.
    :returns: The result of `_update_package`, or `False` when the path is
        unusable or the update failed.
    """
    # We need to read and modify a Nix expression.
    if os.path.isdir(path):
        path = os.path.join(path, 'default.nix')

    # If a default.nix does not exist, we quit.
    if not os.path.isfile(path):
        logging.info("Path {}: does not exist.".format(path))
        return False

    # If file is not a Nix expression, we quit.
    if not path.endswith(".nix"):
        logging.info("Path {}: does not end with `.nix`.".format(path))
        return False

    try:
        return _update_package(path, target)
    except (ValueError, KeyError) as e:
        # KeyError is raised by the PyPI fetcher when the index has no
        # releases for the latest version; one such package must not abort
        # the update of all the others.
        logging.warning("Path {}: {}".format(path, e))
        return False


def _commit(path, pname, old_version, new_version, **kwargs):
    """Commit result.

    Extra keyword arguments are ignored so that a result dict from
    `_update_package` can be passed with `**`.

    :returns: `True` when the commit was created.
    :raises subprocess.CalledProcessError: If a git command fails.
    """
    msg = f'python: {pname}: {old_version} -> {new_version}'

    try:
        subprocess.check_call([GIT, 'add', path])
        subprocess.check_call([GIT, 'commit', '-m', msg])
    except subprocess.CalledProcessError:
        subprocess.check_call([GIT, 'checkout', path])
        # CalledProcessError cannot be constructed from a message alone (it
        # requires `returncode` and `cmd`), so log the message and re-raise
        # the original error, which carries the failing command.
        logging.error(f'Could not commit {path}')
        raise

    return True


def main():
    """Parse the command line, update all packages and optionally commit."""
    parser = argparse.ArgumentParser()
    parser.add_argument('package', type=str, nargs='+')
    parser.add_argument('--target', type=str, choices=list(SEMVER), default='major')
    parser.add_argument('--commit', action='store_true', help='Create a commit for each package update')

    args = parser.parse_args()
    target = args.target

    packages = list(map(os.path.abspath, args.package))

    logging.info("Updating packages...")

    # Use threads to update packages concurrently
    with Pool() as p:
        results = list(p.map(lambda pkg: _update(pkg, target), packages))

    logging.info("Finished updating packages.")

    # Commits are created sequentially.
    if args.commit:
        logging.info("Committing updates...")
        # Failed or skipped updates are `False`; only result dicts are committed.
        for result in results:
            if result:
                _commit(**result)
        logging.info("Finished committing updates")

    count = sum(map(bool, results))
    logging.info("{} package(s) updated".format(count))


if __name__ == '__main__':
    main()