whl2conda.api.converter

Converter API

Attributes

pip_version_re `module-attribute`

# Matches one pip version specifier: a comparison operator followed by
# a version, with optional whitespace around both parts.
pip_version_re = compile(
    rf"^\s*(?P<operator>[=<>!~]+)\s*(?P<version>{PIP_VERSION_PATTERN})\s*$",
    flags=VERBOSE | IGNORECASE,
)

Regular expression matching pip version spec

Classes

CondaPackageFormat

Bases: str, Enum

Supported output package formats

V1: original conda format as .tar.bz2 file
V2: newer .conda format
TREE: dumps package out as a directory tree (for debugging)

Source code in src/whl2conda/impl/pyproject.py

class CondaPackageFormat(str, enum.Enum):
    """
    Output package formats that can be produced

    * V1: original conda format as .tar.bz2 file
    * V2: newer .conda format
    * TREE: dumps package out as a directory tree (for debugging)
    """

    V1 = ".tar.bz2"
    V2 = ".conda"
    TREE = ".tree"

    @classmethod
    def from_string(cls, name: str) -> CondaPackageFormat:
        """Look up a format by member name or by file extension

        The upper-cased input is tried as a member name first; if no
        member has that name, the lower-cased input is looked up as a
        member value.

        Arguments:
            name: either the enum name or a file extension, i.e.
                "V1"/".tar.bz2", "V2"/".conda", or "TREE"

        Raises:
            ValueError: if name matches neither a member name nor a value.
        """
        try:
            fmt = cls[name.upper()]
        except LookupError:
            fmt = cls(name.lower())
        return fmt

Functions

from_string `classmethod`

from_string(name: str) -> CondaPackageFormat

Convert string to CondaPackageFormat

PARAMETER	DESCRIPTION
`name`	either the enum name or a file extension, i.e. "V1"/".tar.bz2", "V2"/".conda", or "TREE" TYPE: `str`

Source code in src/whl2conda/impl/pyproject.py

@classmethod
def from_string(cls, name: str) -> CondaPackageFormat:
    """Look up a format by member name or by file extension

    The upper-cased input is tried as a member name first; if no
    member has that name, the lower-cased input is looked up as a
    member value.

    Arguments:
        name: either the enum name or a file extension, i.e.
            "V1"/".tar.bz2", "V2"/".conda", or "TREE"

    Raises:
        ValueError: if name matches neither a member name nor a value.
    """
    try:
        fmt = cls[name.upper()]
    except LookupError:
        fmt = cls(name.lower())
    return fmt

DependencyRename

Bases: NamedTuple

Defines a pypi to conda package renaming rule.

The pattern must fully match the input package name. The replacement string may contain group references, e.g. `r'\1'` or `r'\g<name>'`.

Source code in src/whl2conda/api/converter.py

class DependencyRename(NamedTuple):
    r"""
    Defines a pypi to conda package renaming rule.

    The pattern must fully match the input package name.
    The replacement string may contain group references,
    e.g. r'\1' or r'\g<name>'.
    """

    pattern: re.Pattern
    replacement: str

    @classmethod
    def from_strings(cls, pattern: str, replacement: str) -> DependencyRename:
        r"""Construct from strings

        This will also translate '$#' and '${name}' expressions
        in the replacement into r'\#' and r'\g<name>' respectively.

        Arguments:
            pattern: regular expression to match against pypi names
            replacement: replacement template for the conda name

        Raises:
            ValueError: if the pattern does not compile, or the
                replacement cannot be used with the pattern. The
                underlying error is attached as the cause.
        """
        try:
            pat = re.compile(pattern)
        except re.error as err:
            raise ValueError(
                f"Bad dependency rename pattern '{pattern}': {err}"
            ) from err
        repl = re.sub(r"\$(\d+)", r"\\\1", replacement)
        repl = re.sub(r"\$\{(\w+)}", r"\\g<\1>", repl)
        # TODO also verify replacement does not contain invalid package chars
        try:
            # Run a throwaway substitution so that a bad group reference
            # in the replacement is reported here, not at rename time.
            pat.sub(repl, "")
        except Exception as ex:
            msg = ex.msg if isinstance(ex, re.error) else str(ex)
            raise ValueError(
                f"Bad dependency replacement '{replacement}' for pattern '{pattern}': {msg}"
            ) from ex
        return cls(pat, repl)

    def rename(self, pypi_name: str) -> tuple[str, bool]:
        """Rename dependency package name

        Returns conda name and indicator of whether the
        pattern was applied. The name is returned unchanged
        when the pattern does not match all of it.
        """
        if m := self.pattern.fullmatch(pypi_name):
            return m.expand(self.replacement), True
        return pypi_name, False

Functions

from_strings `classmethod`

from_strings(
    pattern: str, replacement: str
) -> DependencyRename

Construct from strings

This will also translate '$#' and '${name}' expressions in the replacement into `r'\#'` and `r'\g<name>'` respectively.

Source code in src/whl2conda/api/converter.py

@classmethod
def from_strings(cls, pattern: str, replacement: str) -> DependencyRename:
    r"""Construct from strings

    This will also translate '$#' and '${name}' expressions
    in the replacement into r'\#' and r'\g<name>' respectively.

    Arguments:
        pattern: regular expression to match against pypi names
        replacement: replacement template for the conda name

    Raises:
        ValueError: if the pattern does not compile, or the
            replacement cannot be used with the pattern. The
            underlying error is attached as the cause.
    """
    try:
        pat = re.compile(pattern)
    except re.error as err:
        raise ValueError(
            f"Bad dependency rename pattern '{pattern}': {err}"
        ) from err
    repl = re.sub(r"\$(\d+)", r"\\\1", replacement)
    repl = re.sub(r"\$\{(\w+)}", r"\\g<\1>", repl)
    # TODO also verify replacement does not contain invalid package chars
    try:
        # Run a throwaway substitution so that a bad group reference
        # in the replacement is reported here, not at rename time.
        pat.sub(repl, "")
    except Exception as ex:
        msg = ex.msg if isinstance(ex, re.error) else str(ex)
        raise ValueError(
            f"Bad dependency replacement '{replacement}' for pattern '{pattern}': {msg}"
        ) from ex
    return cls(pat, repl)

rename

rename(pypi_name: str) -> tuple[str, bool]

Rename dependency package name

Returns conda name and indicator of whether the pattern was applied.

Source code in src/whl2conda/api/converter.py

def rename(self, pypi_name: str) -> tuple[str, bool]:
    """Apply this rule to a pypi package name

    Returns a pair of the resulting conda name and a flag telling
    whether the pattern matched. When the pattern does not match
    the whole name, the name is returned unchanged with False.
    """
    match = self.pattern.fullmatch(pypi_name)
    if match is None:
        return pypi_name, False
    return match.expand(self.replacement), True

MetadataFromWheel `dataclass`

Metadata parsed from wheel distribution

Source code in src/whl2conda/api/converter.py

@dataclass
class MetadataFromWheel:
    """Metadata parsed from wheel distribution"""

    # Headers read from the wheel's METADATA file, keyed by lower-cased
    # header name; multi-use headers hold a list of values.
    md: dict[str, Any]
    # Package name: the converter's override if set, else the "name" header.
    package_name: str
    # Value of the "version" header.
    version: str
    # "Build" header from the WHEEL file, or "" if there is none.
    wheel_build_number: str
    # "license-expression" header if present, else "license".
    license: Optional[str]
    # Parsed requirement entries, plus a "python" entry when the
    # metadata has a "requires-python" header.
    dependencies: list[RequiresDistEntry]
    # The *.dist-info directory inside the extracted wheel.
    wheel_info_dir: Path

RequiresDistEntry `dataclass`

Requires-Dist metadata entry parsed from wheel

Source code in src/whl2conda/api/converter.py

@dataclass
class RequiresDistEntry:
    """
    Requires-Dist metadata entry parsed from wheel
    """

    # see https://packaging.python.org/specifications/core-metadata/#requires-dist-multiple-use
    # and https://peps.python.org/pep-0508/
    name: str
    extras: Sequence[str] = ()
    version: str = ""
    marker: str = ""

    extra_marker_name: str = ""
    """Name from extra expression in marker, if any"""

    generic: bool = True
    """True if marker is empty or only contains an extra expression"""

    def set_marker(self, marker: str) -> None:
        """Set marker value and update extra_marker_name and generic values

        Both derived fields are recomputed from scratch, so values left
        over from a previous marker never survive. An empty marker
        yields generic=True and no extra_marker_name.
        """
        self.marker = marker
        self.extra_marker_name = ""
        self.generic = not marker
        if not marker:
            return
        for pat in _extra_marker_re:
            if m := pat.search(marker):
                self.extra_marker_name = m.group("name")
                # Generic only when the extra expression is the whole marker.
                self.generic = m.group(0) == marker
                return

    @classmethod
    def parse(cls, raw: str) -> RequiresDistEntry:
        """
        Parse entry from raw string read from "Requires-Dist" or related header.

        Raises:
            SyntaxError: if entry is not properly formatted.
        """
        m = requires_dist_re.fullmatch(raw)
        if not m:
            raise SyntaxError(f"Cannot parse Requires-Dist entry: {repr(raw)}")
        entry = RequiresDistEntry(name=m.group("name"))
        if extra := m.group("extra"):
            entry.extras = tuple(re.split(r"\s*,\s*", extra))
        if version := m.group("version"):
            entry.version = version
        if marker := m.group("marker"):
            entry.set_marker(marker)
        return entry

    def with_extra(self, name: str) -> RequiresDistEntry:
        """Returns copy of entry with an extra == '<name>' clause added to marker

        An existing marker is parenthesized and combined with the
        new clause using "and".
        """
        marker = f"extra == '{name}'"
        if self.marker:
            marker = f"({self.marker}) and {marker}"

        entry = dataclasses.replace(self)
        entry.set_marker(marker)
        return entry

    def __str__(self) -> str:
        # Space-separated: name, "[extras]", version, then "; marker",
        # leaving out whichever parts are empty.
        parts = [self.name]
        if self.extras:
            parts.append(f"[{','.join(self.extras)}]")
        if self.version:
            parts.append(self.version)
        if self.marker:
            parts.append(f"; {self.marker}")
        return " ".join(parts)

Attributes

extra_marker_name `class-attribute` `instance-attribute`

extra_marker_name: str = ''

Name from extra expression in marker, if any

generic `class-attribute` `instance-attribute`

generic: bool = True

True if marker is empty or only contains an extra expression

Functions

parse `classmethod`

parse(raw: str) -> RequiresDistEntry

Parse entry from raw string read from "Requires-Dist" or related header.

RAISES	DESCRIPTION
`SyntaxError`	if entry is not properly formatted.

Source code in src/whl2conda/api/converter.py

@classmethod
def parse(cls, raw: str) -> RequiresDistEntry:
    """
    Build an entry from the raw text of a "Requires-Dist" or related header.

    The name is always set; extras, version and marker are filled in
    only when the corresponding part of the entry is present.

    Raises:
        SyntaxError: if entry is not properly formatted.
    """
    match = requires_dist_re.fullmatch(raw)
    if match is None:
        raise SyntaxError(f"Cannot parse Requires-Dist entry: {raw!r}")

    parsed = RequiresDistEntry(name=match.group("name"))

    extra = match.group("extra")
    if extra:
        parsed.extras = tuple(re.split(r"\s*,\s*", extra))

    version = match.group("version")
    if version:
        parsed.version = version

    marker = match.group("marker")
    if marker:
        parsed.set_marker(marker)

    return parsed

set_marker

set_marker(marker: str) -> None

Set marker value and update extra_marker_name and generic values

Source code in src/whl2conda/api/converter.py

def set_marker(self, marker: str) -> None:
    """Set marker value and update extra_marker_name and generic values

    Both derived fields are recomputed from scratch, so values left
    over from a previous marker never survive. An empty marker
    yields generic=True and no extra_marker_name.
    """
    self.marker = marker
    self.extra_marker_name = ""
    self.generic = not marker
    if not marker:
        return
    for pat in _extra_marker_re:
        if m := pat.search(marker):
            self.extra_marker_name = m.group("name")
            # Generic only when the extra expression is the whole marker.
            self.generic = m.group(0) == marker
            return

with_extra

with_extra(name: str) -> RequiresDistEntry

Returns a copy of the entry with an `extra == '<name>'` clause added to its marker

Source code in src/whl2conda/api/converter.py

def with_extra(self, name: str) -> RequiresDistEntry:
    """Returns copy of entry with an extra == '<name>' clause added to marker

    An existing marker is parenthesized and joined to the new
    clause with "and"; the original entry is left untouched.
    """
    clause = f"extra == '{name}'"
    combined = f"({self.marker}) and {clause}" if self.marker else clause

    duplicate = dataclasses.replace(self)
    duplicate.set_marker(combined)
    return duplicate

Wheel2CondaConverter

Converter supports generation of conda package from a pure python wheel.

Source code in src/whl2conda/api/converter.py

class Wheel2CondaConverter:
    """
    Converter supports generation of conda package from a pure python wheel.

    """

    # "Wheel-Version" values from the WHEEL file that are accepted.
    SUPPORTED_WHEEL_VERSIONS = ("1.0",)
    # "Metadata-Version" values from the METADATA file that are accepted.
    SUPPORTED_METADATA_VERSIONS: tuple[str, ...] = (
        "1.0",
        "1.1",
        "1.2",
        "2.1",
        "2.2",
        "2.3",
        "2.4",
    )
    # METADATA headers that may occur more than once; their values
    # are collected into lists when the metadata is parsed.
    MULTI_USE_METADATA_KEYS = {
        "Classifier",
        "Dynamic",
        "License-File",
        "Obsoletes",
        "Obsoletes-Dist",
        "Platform",
        "Project-URL",
        "Provides",
        "Provides-Dist",
        "Provides-Extra",
        "Requires",
        "Requires-Dist",
        "Requires-External",
        "Supported-Platform",
    }

    # If non-empty, used instead of the name from the wheel metadata.
    package_name: str = ""
    logger: logging.Logger
    # Wheel to convert.
    wheel_path: Path
    # Directory in which the conda package is written.
    out_dir: Path
    # If True, log what would be removed/written without doing it.
    dry_run: bool = False
    # Format of the generated package.
    out_format: CondaPackageFormat = CondaPackageFormat.V2
    # If True, an existing output package is replaced without asking.
    overwrite: bool = False
    # If False, the wheel's requirements are rewritten in METADATA as
    # requirements of an "original" extra.
    keep_pip_dependencies: bool = False
    # Renaming rules tried in order, before the standard renames.
    dependency_rename: list[DependencyRename]
    # Dependencies appended verbatim to the computed conda dependencies.
    extra_dependencies: list[str]
    # If non-empty, overrides (or adds) the python version dependency.
    python_version: str = ""
    # If True, the user is asked before overwriting an existing package.
    interactive: bool = False
    # If set, used as the build number instead of the wheel's own.
    build_number: Optional[int] = None

    # Set when the wheel metadata has been parsed.
    wheel_md: Optional[MetadataFromWheel] = None
    # Set when the output package path has been computed.
    conda_pkg_path: Optional[Path] = None
    # Mapping from pypi name to conda name, loaded in __init__ and used
    # when no rule in dependency_rename applies.
    std_renames: dict[str, str]

    def __init__(
        self,
        wheel_path: Path,
        out_dir: Path,
        *,
        update_std_renames: bool = False,
    ):
        """
        Create a converter for a single wheel

        Args:
            wheel_path: path of the wheel to convert
            out_dir: directory in which the conda package is written
            update_std_renames: passed to load_std_renames as its
                ``update`` argument when loading the standard renames
        """
        self.wheel_path, self.out_dir = wheel_path, out_dir
        self.dependency_rename = []
        self.extra_dependencies = []
        self.logger = logging.getLogger(__name__)
        # TODO - option to ignore this
        self.std_renames = load_std_renames(update=update_std_renames)

    def convert(self) -> Path:
        """
        Convert wheel to conda package

        The wheel is extracted into a temporary directory, the conda
        package layout is assembled next to it, and the result is then
        packaged into the output directory.

        Does not write any non-temporary files if dry_run is True.

        Returns:
            Path of conda package
        """
        # pylint: disable=too-many-statements,too-many-branches,too-many-locals

        with tempfile.TemporaryDirectory(prefix="whl2conda-") as temp_dirname:
            temp_dir = Path(temp_dirname)
            extracted_wheel_dir = self._extract_wheel(temp_dir)

            wheel_md = self._parse_wheel_metadata(extracted_wheel_dir)

            conda_dir = temp_dir / "conda-files"
            conda_info_dir = conda_dir.joinpath("info")
            conda_dir.mkdir()

            # Copy files into conda package
            self._copy_wheel_files(extracted_wheel_dir, conda_dir)

            # collect relative paths before constructing info/ directory
            # Always use forward slashes so that the file lists written to
            # the package do not depend on the platform doing the conversion.
            rel_files = [
                f.relative_to(conda_dir).as_posix()
                for f in conda_dir.glob("**/*")
                if f.is_file()
            ]

            conda_dependencies = self._compute_conda_dependencies(wheel_md.dependencies)

            # Write conda info files
            # TODO - copy readme file into info
            #  must be one of README, README.md or README.rst
            self._copy_licenses(conda_info_dir, wheel_md)
            self._write_about(conda_info_dir, wheel_md.md)
            self._write_hash_input(conda_info_dir)
            self._write_files_list(conda_info_dir, rel_files)
            self._write_index(conda_info_dir, wheel_md, conda_dependencies)
            self._write_link_file(conda_info_dir, wheel_md.wheel_info_dir)
            self._write_paths_file(conda_dir, rel_files)
            self._write_git_file(conda_info_dir)

            conda_pkg_path = self._conda_package_path(
                wheel_md.package_name, wheel_md.version
            )
            self._write_conda_package(conda_dir, conda_pkg_path)

            return conda_pkg_path

    @classmethod
    def read_metadata_file(cls, file: Path) -> email.message.Message:
        """
        Read a wheel email-formatted metadata file (e.g. METADATA, WHEEL)

        Args:
            file: path to file

        Returns:
            Message object
        """
        return email.message_from_string(
            file.read_text(encoding="utf8"),
            policy=email.policy.EmailPolicy(utf8=True, refold_source="none"),  # type: ignore
        )

    def _conda_package_path(self, package_name: str, version: str) -> Path:
        """Construct conda package file path"""
        if self.out_format is CondaPackageFormat.TREE:
            suffix = ""
        else:
            suffix = str(self.out_format.value)
        conda_pkg_file = f"{package_name}-{version}-py_0{suffix}"
        self.conda_pkg_path = Path(self.out_dir).joinpath(conda_pkg_file)
        return self.conda_pkg_path

    # pylint: disable=too-many-branches
    def _write_conda_package(self, conda_dir: Path, conda_pkg_path: Path) -> Path:
        """Package the assembled conda directory at the given output path

        An existing package at that path is removed first, which requires
        either the overwrite option or, in interactive mode, the user's
        confirmation. In dry-run mode the steps are only logged.

        Raises:
            FileExistsError: if the output already exists and may not
                be overwritten.
        """
        dry_run_suffix = " (dry run)" if self.dry_run else ""

        if self.logger.getEffectiveLevel() <= logging.DEBUG:
            packaged = (f for f in conda_dir.glob("**/*") if f.is_file())
            for file in packaged:
                self._debug("Packaging %s", file.relative_to(conda_dir))

        if conda_pkg_path.exists():
            if not self.overwrite:
                msg = f"Output conda package already exists at '{conda_pkg_path}'"
                if self.interactive:
                    print(msg)
                    confirmed = bool_input("Overwrite? ")
                else:
                    confirmed = False
                if not confirmed:
                    raise FileExistsError(msg)
            self._info("Removing existing %s%s", conda_pkg_path, dry_run_suffix)
            if not self.dry_run:
                if conda_pkg_path.is_dir():
                    shutil.rmtree(conda_pkg_path)
                else:
                    conda_pkg_path.unlink()

        self._info("Writing %s%s", conda_pkg_path, dry_run_suffix)
        if self.dry_run:
            return conda_pkg_path

        if self.out_format is CondaPackageFormat.TREE:
            tree_target = Path(self.out_dir).joinpath(conda_pkg_path.name)
            shutil.copytree(conda_dir, tree_target)
        else:
            self.out_dir.mkdir(parents=True, exist_ok=True)
            create_conda_pkg(conda_dir, None, conda_pkg_path.name, self.out_dir)

        return conda_pkg_path

    def _write_git_file(self, conda_info_dir: Path) -> None:
        """Write empty git file"""
        # python wheels don't have this concept, but conda-build
        # will write an empty git file if there are no git sources,
        # so we follow suit:
        conda_info_dir.joinpath("git").write_bytes(b'')

    def _write_paths_file(self, conda_dir: Path, rel_files: Sequence[str]) -> None:
        # info/paths.json - paths with SHA256 do we really need this?
        conda_paths_file = conda_dir.joinpath("info", "paths.json")
        paths: list[dict[str, Any]] = []
        for rel_file in rel_files:
            abs_file = conda_dir.joinpath(rel_file)
            file_bytes = abs_file.read_bytes()
            paths.append(
                dict(
                    _path=rel_file,
                    path_type="hardlink",
                    sha256=sha256(file_bytes).hexdigest(),
                    size_in_bytes=len(file_bytes),
                )
            )
        conda_paths_file.write_text(
            json.dumps(dict(paths=paths, paths_version=1), indent=2)
        )

    def _write_link_file(self, conda_info_dir: Path, wheel_info_dir: Path) -> None:
        # info/link.json
        conda_link_file = conda_info_dir.joinpath("link.json")
        wheel_entry_points_file = wheel_info_dir.joinpath("entry_points.txt")
        console_scripts: list[str] = []
        if wheel_entry_points_file.is_file():
            wheel_entry_points = configparser.ConfigParser()
            wheel_entry_points.read(wheel_entry_points_file)
            for section_name in ["console_scripts", "gui_scripts"]:
                if section_name in wheel_entry_points:
                    section = wheel_entry_points[section_name]
                    console_scripts.extend(f"{k}={v}" for k, v in section.items())
        noarch_dict: dict[str, Any] = dict(type="python")
        if console_scripts:
            noarch_dict["entry_points"] = console_scripts
        conda_link_file.write_text(
            json.dumps(
                dict(
                    noarch=noarch_dict,
                    package_metadata_version=1,
                ),
                indent=2,
                sort_keys=True,
            )
        )

    # pylint: disable=too-many-arguments
    def _write_index(
        self,
        conda_info_dir: Path,
        wheel_md: MetadataFromWheel,
        conda_dependencies: Sequence[str],
    ) -> None:
        # info/index.json
        conda_index_file = conda_info_dir.joinpath("index.json")

        if self.build_number is not None:
            build_number = self.build_number
        else:
            try:
                build_number = int(wheel_md.wheel_build_number)
            except ValueError:
                build_number = 0

        conda_index_file.write_text(
            json.dumps(
                dict(
                    arch=None,
                    build="py_0",
                    build_number=build_number,
                    depends=conda_dependencies,
                    license=wheel_md.license,
                    name=wheel_md.package_name,
                    noarch="python",
                    platform=None,
                    subdir="noarch",
                    timestamp=int(time.time() + time.timezone),  # UTC timestamp
                    version=wheel_md.version,
                ),
                indent=2,
            )
        )

    def _write_files_list(self, conda_info_dir: Path, rel_files: Sequence[str]) -> None:
        # * info/files - list of relative paths of files not including info/
        conda_files_file = conda_info_dir.joinpath("files")
        with open(conda_files_file, "w") as f:
            for rel_file in rel_files:
                f.write(str(rel_file))
                f.write("\n")

    def _write_hash_input(self, conda_info_dir: Path) -> None:
        conda_hash_input_file = conda_info_dir.joinpath("hash_input.json")
        conda_hash_input_file.write_text(json.dumps({}, indent=2))

    # pylint: disable=too-many-locals
    def _write_about(self, conda_info_dir: Path, md: dict[str, Any]) -> None:
        """Write the info/about.json file

        Args:
            conda_info_dir: info directory of the conda package
            md: wheel metadata keyed by lower-cased header name
        """
        # * info/about.json
        #
        # Note that the supported fields in the about section are not
        # well documented, but conda-build will only copy fields from
        # its approved list, which can be found in the FIELDS datastructure
        # in the conda_build.metadata module. This currently includes:
        #
        #   URLS: home, dev_url, doc_url, doc_source_url
        #   Text: license, summary, description, license_family
        #   Lists: tags, keyword
        #   Paths in source tree: license-file, prelink_message, readme
        #
        # conda-build also adds conda-build-version and conda-version fields.

        # TODO description can come from METADATA message body
        #   then need to also use content type. It doesn't seem
        #   that conda-forge packages include this in the info/

        conda_about_file = conda_info_dir.joinpath("about.json")

        # Fields without a dedicated about.json key go into "extra".
        extra = non_none_dict(
            author=md.get("author"),
            classifiers=md.get("classifier"),
            maintainer=md.get("maintainer"),
            whl2conda_version=__version__,
        )

        # Project-URL entries have the form "<label>, <url>".
        proj_url_pat = re.compile(r"\s*(?P<key>\w+(\s+\w+)*)\s*,\s*(?P<url>\w.*)\s*")
        doc_url: Optional[str] = None
        dev_url: Optional[str] = None
        for urlline in md.get("project-url", ()):
            if m := proj_url_pat.match(urlline):  # pragma: no branch
                key = m.group("key")
                url = m.group("url")
                if re.match(r"(?i)doc(umentation)?\b", key):
                    doc_url = url
                elif re.match(r"(?i)(dev(elopment)?|repo(sitory)?)\b", key):
                    # Labels starting with dev/development/repo/repository.
                    dev_url = url
                extra[key] = url

        # "author-email" -> "authors", "maintainer-email" -> "maintainers"
        for key in ["author-email", "maintainer-email"]:
            val = md.get(key)
            if val:
                author_key = key.split("-", maxsplit=1)[0] + "s"
                extra[author_key] = val.split(",")

        license_text = md.get("license-expression") or md.get("license")
        if license_files := md.get("license-file"):
            extra["license_files"] = list(license_files)

        if keywords := md.get("keywords"):
            keyword_list = keywords.split(",")
        else:
            keyword_list = None

        conda_about_file.write_text(
            json.dumps(
                non_none_dict(
                    description=md.get("description"),
                    summary=md.get("summary"),
                    license=license_text or None,
                    keywords=keyword_list,
                    home=md.get("home-page"),
                    dev_url=dev_url,
                    doc_url=doc_url,
                    extra=extra,
                ),
                indent=2,
                sort_keys=True,
            )
        )

    # pylint: disable=too-many-locals
    def _compute_conda_dependencies(
        self,
        dependencies: Sequence[RequiresDistEntry],
    ) -> list[str]:
        """Translate wheel requirements into conda dependency specs

        Entries belonging to an extra, or carrying any other environment
        marker, are skipped. Names are renamed by the first matching rule
        in ``dependency_rename``, else through ``std_renames``; an entry
        whose conda name comes out empty is dropped. A python dependency
        is added when ``python_version`` is set and none was seen, and
        ``extra_dependencies`` are appended at the end.

        Args:
            dependencies: requirement entries parsed from the wheel

        Returns:
            list of conda dependency specs
        """
        conda_dependencies: list[str] = []

        saw_python = False

        for entry in dependencies:
            if entry.extra_marker_name:
                self._debug("Skipping extra dependency: %s", entry)
                continue
            if not entry.generic:
                # TODO - support non-generic packages
                self._warn("Skipping dependency with environment marker: %s", entry)
                continue

            conda_name = pip_name = entry.name
            version = self.translate_version_spec(entry.version)
            if pip_name == "python":
                # Only ever set the flag: it must stay set no matter
                # where the python entry occurs in the list.
                saw_python = True
                if self.python_version and version != self.python_version:
                    self._info(
                        "Overriding python version '%s' with '%s'",
                        version,
                        self.python_version,
                    )
                    version = self.python_version

            # TODO - do something with extras (#36)
            #   download target pip package and its extra dependencies
            # check manual renames first
            renamed = False
            for renamer in self.dependency_rename:
                conda_name, renamed = renamer.rename(pip_name)
                if renamed:
                    break
            if not renamed:
                conda_name = self.std_renames.get(pip_name, pip_name)

            if conda_name:
                conda_dep = f"{conda_name} {version}"
                if conda_name == pip_name:
                    self._debug("Dependency copied: '%s'", conda_dep)
                else:
                    self._debug("Dependency renamed: '%s' -> '%s'", entry, conda_dep)
                conda_dependencies.append(conda_dep)
            else:
                self._debug("Dependency dropped: %s", entry)

        if not saw_python and self.python_version:
            self._info("Added 'python %s' dependency", self.python_version)
            conda_dependencies.append(f"python {self.python_version}")

        for dep in self.extra_dependencies:
            self._debug("Dependency added:  '%s'", dep)
            conda_dependencies.append(dep)
        return conda_dependencies

    def _copy_wheel_files(self, wheel_dir: Path, conda_dir: Path) -> None:
        """
        Copies files from wheels to corresponding location in conda package:

        This copies files using the mapping:
        - <wheel-dir>/*.data/data/* -> <conda-dir>/*
        - <wheel-dir>/*.data/scripts/* -> <conda-dir>/python-scripts/*
        - <wheel-dir>/*.data/* -> ignored
        - <wheel-dir>/* -> <conda-dir>/site-packages
        """
        conda_site_packages = conda_dir.joinpath("site-packages")
        conda_site_packages.mkdir()
        conda_info_dir = conda_dir.joinpath("info")
        conda_info_dir.mkdir()
        for entry in wheel_dir.iterdir():
            if not entry.is_dir():
                shutil.copyfile(entry, conda_site_packages / entry.name)
            elif not entry.name.endswith(".data"):
                shutil.copytree(
                    entry, conda_site_packages / entry.name, dirs_exist_ok=True
                )
            else:
                for datapath in entry.iterdir():
                    if not datapath.is_dir():
                        self._warn(
                            "Do not support top level file '%s' in '%s' directory - ignored",
                            datapath.name,
                            entry.relative_to(wheel_dir),
                        )
                    if datapath.name == "data":
                        conda_target = conda_dir
                    elif datapath.name == "scripts":
                        conda_target = conda_dir / "python-scripts"
                    else:
                        self._warn(
                            "Do not support '%s' path in '%s' directory - ignored",
                            datapath.name,
                            entry.relative_to(wheel_dir),
                        )
                        continue
                    shutil.copytree(datapath, conda_target, dirs_exist_ok=True)

        assert self.wheel_md is not None
        dist_info_dir = conda_site_packages / self.wheel_md.wheel_info_dir.name
        installer_file = dist_info_dir / "INSTALLER"
        installer_file.write_text("whl2conda")
        requested_file = dist_info_dir / "REQUESTED"
        requested_file.write_text("")

    def _copy_licenses(self, conda_info_dir: Path, wheel_md: MetadataFromWheel) -> None:
        to_license_dir = conda_info_dir / "licenses"
        wheel_info_dir = wheel_md.wheel_info_dir
        wheel_license_dir = wheel_info_dir / "licenses"
        if wheel_license_dir.is_dir():
            # just copy directory
            shutil.copytree(
                wheel_license_dir,
                to_license_dir,
                dirs_exist_ok=True,
            )
        else:
            # Otherwise look for files in the dist-info dir
            # that match the license-file entries. The paths
            # of the license-file entries may be relative to
            # where the wheel was built and may not directly
            # point at the files.
            for license_file in wheel_md.md.get("license-file", ()):
                # copy license file if it exists
                license_path = Path(license_file)
                from_files = [wheel_info_dir / license_path.name]
                if not license_path.is_absolute():
                    from_files.insert(0, wheel_info_dir / license_path)
                for from_file in filter(  # pragma: no branch
                    lambda f: f.exists(), from_files
                ):
                    to_file = to_license_dir / from_file.relative_to(wheel_info_dir)
                    if not to_file.exists():  # pragma: no branch
                        to_file.parent.mkdir(parents=True, exist_ok=True)
                        shutil.copyfile(from_file, to_file)
                        break

    # pylint: disable=too-many-locals, too-many-statements
    def _parse_wheel_metadata(self, wheel_dir: Path) -> MetadataFromWheel:
        """
        Parse the WHEEL and METADATA files of an unpacked wheel.

        Unless `self.keep_pip_dependencies` is set, the METADATA file is
        rewritten in place so that every original requirement becomes a
        requirement of an extra named `original`.

        As a side effect, `self.package_name` is set (from the metadata
        `Name` if it was not already set) and the result is saved in
        `self.wheel_md`.

        Arguments:
            wheel_dir: directory containing the unpacked wheel files

        Returns:
            Metadata extracted from the wheel

        Raises:
            Wheel2CondaError: if the wheel has no `.dist-info` directory,
                has an unsupported wheel or metadata version, or is not
                a pure python wheel.
        """
        # Report a missing .dist-info directory as a converter error instead
        # of letting a bare StopIteration escape from next().
        wheel_info_dir = next(wheel_dir.glob("*.dist-info"), None)
        if wheel_info_dir is None:
            raise Wheel2CondaError(
                f"Wheel {self.wheel_path} has no .dist-info directory"
            )
        WHEEL_file = wheel_info_dir.joinpath("WHEEL")
        WHEEL_msg = self.read_metadata_file(WHEEL_file)
        # https://peps.python.org/pep-0427/#what-s-the-deal-with-purelib-vs-platlib

        is_pure_lib = WHEEL_msg.get("Root-Is-Purelib", "").lower() == "true"
        wheel_build_number = WHEEL_msg.get("Build", "")
        wheel_version = WHEEL_msg.get("Wheel-Version")

        if wheel_version not in self.SUPPORTED_WHEEL_VERSIONS:
            raise Wheel2CondaError(
                f"Wheel {self.wheel_path} has unsupported wheel version {wheel_version}"
            )

        if not is_pure_lib:
            raise Wheel2CondaError(f"Wheel {self.wheel_path} is not pure python")

        wheel_md_file = wheel_info_dir.joinpath("METADATA")
        md: dict[str, str | list[Any]] = {}
        # Metadata spec: https://packaging.python.org/en/latest/specifications/core-metadata/
        # Required keys: Metadata-Version, Name, Version
        md_msg = self.read_metadata_file(wheel_md_file)
        md_version_str = md_msg.get("Metadata-Version")
        if md_version_str not in self.SUPPORTED_METADATA_VERSIONS:
            msg = f"Wheel {self.wheel_path} has unsupported metadata version {md_version_str}"
            # TODO - perhaps just warn about this if not in "strict" mode
            raise Wheel2CondaError(msg)
        # md_version = tuple(int(x) for x in md_version_str.split("."))
        # Collect headers into a dict keyed by lower-cased header name;
        # multi-use headers accumulate their values in a list.
        for mdkey, mdval in md_msg.items():
            mdkey = mdkey.strip()
            if mdkey in self.MULTI_USE_METADATA_KEYS:
                # NOTE(review): this looks up the un-lowercased key although
                # values are stored under the lower-cased key - confirm intent.
                if curmdval := md.get(mdkey):
                    if isinstance(curmdval, str):
                        md[mdkey] = [curmdval]
                md.setdefault(mdkey.lower(), []).append(mdval)  # type: ignore
            else:
                md[mdkey.lower()] = mdval

        requires: list[RequiresDistEntry] = []
        raw_requires_entries = md.get("requires-dist", md.get("requires", ()))
        for raw_entry in raw_requires_entries:
            try:
                entry = RequiresDistEntry.parse(raw_entry)
                requires.append(entry)
            except SyntaxError as err:
                # TODO: error in strict mode?
                self._warn(str(err))

        if not self.keep_pip_dependencies:
            # Turn requirements into optional extra requirements
            del md_msg["Requires"]
            del md_msg["Requires-Dist"]
            for entry in requires:
                if not entry.extra_marker_name:
                    entry = entry.with_extra('original')
                md_msg.add_header("Requires-Dist", str(entry))
            md_msg.add_header("Provides-Extra", "original")
            # The file was read as utf8, so write it back the same way rather
            # than with the platform's default encoding.
            wheel_md_file.write_text(md_msg.as_string(), encoding="utf8")
        package_name = self.package_name or str(md.get("name"))
        self.package_name = package_name
        version = md.get("version")

        # RECORD_file = wheel_info_dir / "RECORD"
        # TODO: strip __pycache__ entries from RECORD
        # TODO: add INSTALLER and REQUESTED to RECORD
        # TODO: add direct_url to wheel and to RECORD
        # RECORD line format: <path>,sha256=<hash>,<len>

        # A Requires-Python constraint becomes a dependency on "python".
        python_version: str = str(md.get("requires-python", ""))
        if python_version:
            requires.append(RequiresDistEntry("python", version=python_version))
        self.wheel_md = MetadataFromWheel(
            md=md,
            package_name=package_name,
            version=str(version),
            wheel_build_number=wheel_build_number,
            license=md.get("license-expression") or md.get("license"),  # type: ignore
            dependencies=requires,
            wheel_info_dir=wheel_info_dir,
        )
        return self.wheel_md

    def translate_version_spec(self, pip_version: str) -> str:
        """
        Convert a pip version spec to a conda version spec.

        Compatible release specs using the `~=` operator will be turned
        into two clauses using ">=" and "==", for example
        `~=1.2.3` will become `>=1.2.3,==1.2.*`.

        Arbitrary equality clauses using the `===` operator will be
        converted to use `==`, but such clauses are likely to fail
        so a warning will be produced.

        Any leading "v" character in the version will be dropped,
        regardless of case (e.g. `v1.2.3` or `V1.2.3` changes to `1.2.3`).

        Clauses that cannot be parsed are passed through unchanged
        with a warning, and empty clauses are dropped.

        Arguments:
            pip_version: comma-separated pip version specifier clauses

        Returns:
            Comma-separated conda version spec
        """
        pip_version = pip_version.strip()
        version_specs = re.split(r"\s*,\s*", pip_version)
        for i, spec in enumerate(version_specs):
            if not spec:
                continue
            m = pip_version_re.match(spec)
            if m is None:
                # leave the clause as written
                self._warn("Cannot convert bad version spec: '%s'", spec)
                continue
            operator = m.group("operator")
            v = m.group("version")
            # The pattern is matched case-insensitively, so strip an
            # upper-case prefix as well, e.g. convert v1.2 or V1.2 to 1.2
            if v.startswith(("v", "V")):
                v = v[1:]
            if operator == "~=":
                # spec for '~= <version>'
                # https://packaging.python.org/en/latest/specifications/version-specifiers/#compatible-release
                # compatible operator, e.g. convert ~=1.2.3 to >=1.2.3,==1.2.*
                rv = m.group("release")
                rv_parts = rv.split(".")
                operator = ">="
                if len(rv_parts) > 1:
                    # technically ~=1 is not valid, but if we see it, turn it into >=1
                    v += f",=={'.'.join(rv_parts[:-1])}.*"
            elif operator == "===":
                operator = "=="
                # TODO perhaps treat as an error in "strict" mode
                self._warn(
                    "Converted arbitrary equality clause %s to ==%s - may not match!",
                    spec,
                    v,
                )
            version_specs[i] = f"{operator}{v}"

        return ",".join(filter(bool, version_specs))

    def _extract_wheel(self, temp_dir: Path) -> Path:
        """
        Unpack the wheel at `self.wheel_path` under `temp_dir`.

        Arguments:
            temp_dir: directory in which a `wheel-files` subdirectory
                is used as the unpack target

        Returns:
            Path of the `wheel-files` directory passed to `unpack_wheel`
        """
        log = self.logger
        log.info("Reading %s", self.wheel_path)
        unpacked_dir = temp_dir.joinpath("wheel-files")
        unpack_wheel(self.wheel_path, unpacked_dir, logger=log)
        return unpacked_dir

    def _warn(self, msg: str, *args: Any) -> None:
        """Log `msg` at warning level on `self.logger`, with `args` as its %-format arguments."""
        self.logger.warning(msg, *args)

    def _info(self, msg: str, *args: Any) -> None:
        """Log `msg` at info level on `self.logger`, with `args` as its %-format arguments."""
        self.logger.info(msg, *args)

    def _debug(self, msg: str, *args: Any) -> None:
        """Log `msg` at debug level on `self.logger`, with `args` as its %-format arguments."""
        self.logger.debug(msg, *args)

Functions

convert

convert() -> Path

Convert wheel to conda package

Does not write any non-temporary files if dry_run is True.

RETURNS	DESCRIPTION
`Path`	Path of conda package

Source code in src/whl2conda/api/converter.py

def convert(self) -> Path:
    """
    Build a conda package from the wheel.

    All intermediate files are staged in a temporary directory.
    Does not write any non-temporary files if dry_run is True.

    Returns:
        Path of conda package
    """
    # pylint: disable=too-many-statements,too-many-branches,too-many-locals

    with tempfile.TemporaryDirectory(prefix="whl2conda-") as tmp_name:
        work_dir = Path(tmp_name)
        wheel_root = self._extract_wheel(work_dir)

        metadata = self._parse_wheel_metadata(wheel_root)

        pkg_root = work_dir / "conda-files"
        info_dir = pkg_root / "info"
        pkg_root.mkdir()

        # Populate the package tree from the unpacked wheel
        self._copy_wheel_files(wheel_root, pkg_root)

        # Snapshot the payload paths now, before any info/ files exist
        payload_files = [
            str(path.relative_to(pkg_root))
            for path in pkg_root.glob("**/*")
            if path.is_file()
        ]

        conda_deps = self._compute_conda_dependencies(metadata.dependencies)

        # Emit the conda info files
        # TODO - copy readme file into info
        #  must be one of README, README.md or README.rst
        self._copy_licenses(info_dir, metadata)
        self._write_about(info_dir, metadata.md)
        self._write_hash_input(info_dir)
        self._write_files_list(info_dir, payload_files)
        self._write_index(info_dir, metadata, conda_deps)
        self._write_link_file(info_dir, metadata.wheel_info_dir)
        self._write_paths_file(pkg_root, payload_files)
        self._write_git_file(info_dir)

        package_path = self._conda_package_path(
            metadata.package_name, metadata.version
        )
        self._write_conda_package(pkg_root, package_path)

        return package_path

read_metadata_file `classmethod`

read_metadata_file(file: Path) -> email.message.Message

Read a wheel email-formatted metadata file (e.g. METADATA, WHEEL)

PARAMETER	DESCRIPTION
`file`	path to file TYPE: `Path`

RETURNS	DESCRIPTION
`Message`	Message object

Source code in src/whl2conda/api/converter.py

@classmethod
def read_metadata_file(cls, file: Path) -> email.message.Message:
    """
    Parse an email-formatted wheel metadata file (e.g. METADATA, WHEEL)

    The file is decoded as utf8.

    Args:
        file: path to file

    Returns:
        Message object
    """
    raw_text = file.read_text(encoding="utf8")
    parse_policy = email.policy.EmailPolicy(utf8=True, refold_source="none")  # type: ignore
    return email.message_from_string(raw_text, policy=parse_policy)

translate_version_spec

translate_version_spec(pip_version: str) -> str

Convert a pip version spec to a conda version spec.

Compatible release specs using the ~= operator will be turned into two clauses using ">=" and "==", for example ~=1.2.3 will become >=1.2.3,==1.2.*.

Arbitrary equality clauses using the === operator will be converted to use ==, but such clauses are likely to fail so a warning will be produced.

Any leading "v" character in the version will be dropped. (e.g. v1.2.3 changes to 1.2.3).

Source code in src/whl2conda/api/converter.py

def translate_version_spec(self, pip_version: str) -> str:
    """
    Convert a pip version spec to a conda version spec.

    Compatible release specs using the `~=` operator will be turned
    into two clauses using ">=" and "==", for example
    `~=1.2.3` will become `>=1.2.3,==1.2.*`.

    Arbitrary equality clauses using the `===` operator will be
    converted to use `==`, but such clauses are likely to fail
    so a warning will be produced.

    Any leading "v" character in the version will be dropped,
    regardless of case (e.g. `v1.2.3` or `V1.2.3` changes to `1.2.3`).

    Clauses that cannot be parsed are passed through unchanged
    with a warning, and empty clauses are dropped.

    Arguments:
        pip_version: comma-separated pip version specifier clauses

    Returns:
        Comma-separated conda version spec
    """
    pip_version = pip_version.strip()
    version_specs = re.split(r"\s*,\s*", pip_version)
    for i, spec in enumerate(version_specs):
        if not spec:
            continue
        m = pip_version_re.match(spec)
        if m is None:
            # leave the clause as written
            self._warn("Cannot convert bad version spec: '%s'", spec)
            continue
        operator = m.group("operator")
        v = m.group("version")
        # The pattern is matched case-insensitively, so strip an
        # upper-case prefix as well, e.g. convert v1.2 or V1.2 to 1.2
        if v.startswith(("v", "V")):
            v = v[1:]
        if operator == "~=":
            # spec for '~= <version>'
            # https://packaging.python.org/en/latest/specifications/version-specifiers/#compatible-release
            # compatible operator, e.g. convert ~=1.2.3 to >=1.2.3,==1.2.*
            rv = m.group("release")
            rv_parts = rv.split(".")
            operator = ">="
            if len(rv_parts) > 1:
                # technically ~=1 is not valid, but if we see it, turn it into >=1
                v += f",=={'.'.join(rv_parts[:-1])}.*"
        elif operator == "===":
            operator = "=="
            # TODO perhaps treat as an error in "strict" mode
            self._warn(
                "Converted arbitrary equality clause %s to ==%s - may not match!",
                spec,
                v,
            )
        version_specs[i] = f"{operator}{v}"

    return ",".join(filter(bool, version_specs))

Wheel2CondaError

Bases: RuntimeError

Errors from Wheel2CondaConverter

Source code in src/whl2conda/api/converter.py

class Wheel2CondaError(RuntimeError):
    """
    Errors from Wheel2CondaConverter

    Raised, for example, when a wheel is not pure python or declares
    an unsupported wheel or metadata version.
    """

Functions

non_none_dict

non_none_dict(**kwargs: Any) -> dict[str, Any]

dict that drops keys with None values

Source code in src/whl2conda/api/converter.py

def non_none_dict(**kwargs: Any) -> dict[str, Any]:
    """
    Build a dict from keyword arguments, omitting those whose value is None.

    Other falsy values (e.g. 0 or "") are kept, and keys keep the
    order in which they were passed.
    """
    return {key: value for key, value in kwargs.items() if value is not None}

whl2conda.api.converter

Attributes

pip_version_re module-attribute

Classes

CondaPackageFormat

Functions

from_string classmethod

DependencyRename

Functions

from_strings classmethod

rename

MetadataFromWheel dataclass

RequiresDistEntry dataclass

Attributes

extra_marker_name class-attribute instance-attribute

generic class-attribute instance-attribute

Functions

parse classmethod

set_marker

with_extra

Wheel2CondaConverter

Functions

convert

read_metadata_file classmethod

translate_version_spec

Wheel2CondaError

Functions

non_none_dict

pip_version_re `module-attribute`

from_string `classmethod`

from_strings `classmethod`

MetadataFromWheel `dataclass`

RequiresDistEntry `dataclass`

extra_marker_name `class-attribute` `instance-attribute`

generic `class-attribute` `instance-attribute`

parse `classmethod`

read_metadata_file `classmethod`