Source code for conda_pypi.translate

"""
Convert Python `*.dist-info/METADATA` to conda `info/index.json`
"""

import dataclasses
import json
import logging
import pkgutil
import sys
import time
from importlib.metadata import Distribution, PackageMetadata, PathDistribution
from pathlib import Path
from typing import Any, Optional, List, Dict, Callable

from conda.exceptions import ArgumentError
from conda.models.match_spec import MatchSpec
from packaging.requirements import Requirement
from packaging.utils import canonicalize_name

log = logging.getLogger(__name__)


[docs] class FileDistribution(Distribution): """ From a file e.g. a single `.metadata` fetched from pypi instead of a `*.dist-info` folder. """ def __init__(self, raw_text): self.raw_text = raw_text
[docs] def read_text(self, filename: str) -> Optional[str]: if filename == "METADATA": return self.raw_text else: return None
[docs] def locate_file(self, path): """ Given a path to a file in this distribution, return a path to it. """ return None
[docs] @dataclasses.dataclass class PackageRecord: # what goes in info/index.json name: str version: str subdir: str depends: List[str] extras: Dict[str, List[str]] build_number: int = 0 build_text: str = "pypi" # e.g. hash license_family: str = "" license: str = "" noarch: str = "" timestamp: int = 0
[docs] def to_index_json(self): return { "build_number": self.build_number, "build": self.build, "depends": self.depends, "extras": self.extras, "license_family": self.license_family, "license": self.license, "name": self.name, "noarch": self.noarch, "subdir": self.subdir, "timestamp": self.timestamp, "version": self.version, }
@property def build(self): return f"{self.build_text}_{self.build_number}" @property def stem(self): return f"{self.name}-{self.version}-{self.build}"
[docs] @dataclasses.dataclass class CondaMetadata: metadata: PackageMetadata console_scripts: List[str] package_record: PackageRecord about: Dict[str, Any]
[docs] @classmethod def from_distribution( cls, distribution: Distribution, pypi_to_conda_name_mapping: dict | None = None ): metadata = distribution.metadata python_version = metadata.get("requires-python") requires_python = "python" if python_version: requires_python = f"python {python_version}" requirements, extras = requires_to_conda(distribution.requires, pypi_to_conda_name_mapping) # conda does support ~=3.0.0 "compatibility release" matches depends = [requires_python] + requirements console_scripts = [ f"{ep.name} = {ep.value}" for ep in distribution.entry_points if ep.group == "console_scripts" ] noarch = "python" # Common "about" keys # ['channels', 'conda_build_version', 'conda_version', 'description', # 'dev_url', 'doc_url', 'env_vars', 'extra', 'home', 'identifiers', # 'keywords', 'license', 'license_family', 'license_file', 'root_pkgs', # 'summary', 'tags', 'conda_private', 'doc_source_url', 'license_url'] about = { "summary": metadata.get("summary") or "", "description": metadata.get("description") or "", # https://packaging.python.org/en/latest/specifications/core-metadata/#license-expression "license": metadata.get("license_expression") or metadata.get("license") or "", } if project_urls := metadata.get_all("project-url"): urls = dict(url.split(", ", 1) for url in project_urls) for py_name, conda_name in ( ("Home", "home"), ("Development", "dev_url"), ("Documentation", "doc_url"), ): if py_name in urls: about[conda_name] = urls[py_name] name = pypi_to_conda_name( getattr(distribution, "name", None) or distribution.metadata.get("name"), pypi_to_conda_name_mapping, ) version = getattr(distribution, "version", None) or distribution.metadata.get("version") package_record = PackageRecord( build_number=0, depends=depends, extras=extras, license=about["license"] or "", license_family="", name=name, version=version, subdir="noarch", noarch=noarch, timestamp=time.time_ns() // 1000000, ) return cls( metadata=metadata, package_record=package_record, console_scripts=console_scripts, about=about, )
# The keys are pypi names # conda_pypi.dist_repodata.grayskull_pypi_mapping['zope-hookable'] # { # "pypi_name": "zope-hookable", # "conda_name": "zope.hookable", # "import_name": "zope.hookable", # "mapping_source": "regro-bot", # } grayskull_pypi_mapping = json.loads( pkgutil.get_data("conda_pypi", "grayskull_pypi_mapping.json") or "{}" )
[docs] def requires_to_conda( requires: Optional[List[str]], pypi_to_conda_name_mapping: dict | None = None ): from collections import defaultdict extras: Dict[str, List[str]] = defaultdict(list) requirements = [] for requirement in [Requirement(dep) for dep in requires or []]: # requirement.marker.evaluate # if requirement.marker and not requirement.marker.evaluate(): # # excluded by environment marker # # see also marker evaluation according to given sys.executable # continue name = canonicalize_name(requirement.name) requirement.name = pypi_to_conda_name(name, pypi_to_conda_name_mapping) as_conda = f"{requirement.name} {requirement.specifier}" if (marker := requirement.marker) is not None: # for var, _, value in marker._markers: for mark in marker._markers: if isinstance(mark, tuple): var, _, value = mark if str(var) == "extra": extras[str(value)].append(as_conda) else: requirements.append(f"{requirement.name} {requirement.specifier}".strip()) return requirements, dict(extras)
# if there is a url or extras= here we have extra work, may need to # yield Requirement not str # sorted(packaging.requirements.SpecifierSet("<5,>3")._specs, key=lambda x: x.version) # or just sorted lexicographically in str(SpecifierSet) # yield f"{requirement.name} {requirement.specifier}"
[docs] def conda_to_requires(match_spec: MatchSpec) -> Requirement | None: match_spec = remap_match_spec_name(match_spec, conda_to_pypi_name) name = match_spec.name if name == "*": return None version = match_spec.version if version: version_str = str(version) if version_str == "*": return Requirement(name) if version_str.endswith(".*"): version_str = version_str[:-2] if version_str and version_str[0] not in "<>=!~": version_str = f"=={version_str}" return Requirement(f"{name}{version_str}") return Requirement(name)
[docs] def remap_match_spec_name(match_spec: MatchSpec, name_map: Callable[[str], str]) -> MatchSpec: name = match_spec.name if name == "*": return match_spec mapped_name = name_map(name) if mapped_name == name: return match_spec return MatchSpec(match_spec, name=mapped_name)
[docs] def validate_name_mapping_format(mapping: dict) -> None: """ Validate that the name mapping dict has the correct format. Expected format: - A dict where keys are PyPI package names (strings) - Values are dicts with at least "conda_name" key (string) - Optionally can have "pypi_name", "import_name", "mapping_source" keys - Empty dict is allowed Raises ArgumentError if format is invalid. """ # Check that mapping is a dict and has .items() method if not isinstance(mapping, dict): raise ArgumentError(f"Name mapping must be a dictionary, got {type(mapping).__name__}") try: items = mapping.items() except AttributeError: raise ArgumentError( f"Name mapping must be a dictionary with .items() method, got {type(mapping).__name__}" ) for pypi_name, value in items: if not isinstance(pypi_name, str): raise ArgumentError( f"Name mapping keys must be strings, got {type(pypi_name).__name__} for key: {pypi_name!r}" ) if not isinstance(value, dict): raise ArgumentError( f"Name mapping values must be dictionaries, got {type(value).__name__} for key {pypi_name!r}" ) if "conda_name" not in value: raise ArgumentError( f"Name mapping entry for {pypi_name!r} is missing required key 'conda_name'" ) if not isinstance(value["conda_name"], str): raise ArgumentError( f"Name mapping entry for {pypi_name!r} has invalid 'conda_name' type: expected str, got {type(value['conda_name']).__name__}" )
[docs] def pypi_to_conda_name(pypi_name: str, pypi_to_conda_name_mapping: dict | None = None): pypi_name = canonicalize_name(pypi_name) return ( pypi_to_conda_name_mapping if pypi_to_conda_name_mapping is not None else grayskull_pypi_mapping ).get( pypi_name, { "pypi_name": pypi_name, "conda_name": pypi_name, "import_name": None, "mapping_source": None, }, )["conda_name"]
_to_pypi_name_map = {}
[docs] def conda_to_pypi_name(name: str): if not _to_pypi_name_map: for value in grayskull_pypi_mapping.values(): conda_name = value["conda_name"] # XXX sometimes conda:pypi is n:1 _to_pypi_name_map[conda_name] = value found = _to_pypi_name_map.get(name) if found: name = found["pypi_name"] return canonicalize_name(name)
if __name__ == "__main__": # pragma: no cover base = sys.argv[1] for path in Path(base).glob("*.dist-info"): print(CondaMetadata.from_distribution(PathDistribution(path)))