From f487b2e8c18f1667f2afd03b560b6e6eeb586b16 Mon Sep 17 00:00:00 2001
From: konsti <konstin@mailbox.org>
Date: Tue, 27 Feb 2024 13:49:49 +0100
Subject: [PATCH] Extend contributing instructions (#1983)

* Document good first issues
* Document `scripts` directory, as far as useful for contributors
* Remove the compare-with-pip script; we don't need it anymore

I think this closes #817.

---------

Co-authored-by: Jo <10510431+j178@users.noreply.github.com>
---
 CONTRIBUTING.md                              |  20 +-
 scripts/compare_with_pip/compare_with_pip.py | 228 -------------------
 2 files changed, 17 insertions(+), 231 deletions(-)
 delete mode 100755 scripts/compare_with_pip/compare_with_pip.py

diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index 78685be50..1e568d1c6 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -1,5 +1,7 @@
 # Contributing
 
+We have issues labeled as [Good First Issue](https://github.com/astral-sh/uv/issues?q=is%3Aopen+is%3Aissue+label%3A%22good+first+issue%22) and [Help Wanted](https://github.com/astral-sh/uv/issues?q=is%3Aopen+is%3Aissue+label%3A%22help+wanted%22), which are good opportunities for new contributors.
+
 ## Setup
 
 [Rust](https://rustup.rs/), a C compiler, and CMake are required to build uv.
@@ -76,10 +78,21 @@ docker run --rm -it -v $(pwd):/app uv-builder /app/target/x86_64-unknown-linux-m
 
 We recommend using this container if you don't trust the dependency tree of the package(s) you are trying to resolve or install.
 
-## Profiling
+## Profiling and Benchmarking
 
 Please refer to Ruff's [Profiling Guide](https://github.com/astral-sh/ruff/blob/main/CONTRIBUTING.md#profiling-projects), it applies to uv, too.
 
+We provide diverse sets of requirements for testing and benchmarking the resolver in `scripts/requirements` and for the installer in `scripts/requirements/compiled`.
+
+You can use `scripts/bench` to benchmark predefined workloads across uv versions and against other tools, e.g.:
+
+```
+python -m scripts.bench \
+    --uv-path ./target/release/before \
+    --uv-path ./target/release/after \
+    ./scripts/requirements/jupyter.in --benchmark resolve-cold --min-runs 20
+```
+
 ### Analysing concurrency
 
 You can use [tracing-durations-export](https://github.com/konstin/tracing-durations-export) to visualize parallel requests and find any spots where uv is CPU-bound. Example usage, with `uv` and `uv-dev` respectively:
@@ -114,7 +127,8 @@ Then, editorialize the `CHANGELOG.md` file to ensure entries are consistently st
 
 Then, open a pull request e.g. `Bump version to ...`.
 
-Binary builds will automatically be tested for the release. 
+Binary builds will automatically be tested for the release.
 
 After merging the pull request, run the [release workflow](https://github.com/astral-sh/uv/actions/workflows/release.yml)
-with the version tag. **Do not include a leading `v`**. The release will automatically be created on GitHub after everything else publishes.
+with the version tag. **Do not include a leading `v`**.
+The release will automatically be created on GitHub after everything else publishes.
diff --git a/scripts/compare_with_pip/compare_with_pip.py b/scripts/compare_with_pip/compare_with_pip.py
deleted file mode 100755
index 3a810b375..000000000
--- a/scripts/compare_with_pip/compare_with_pip.py
+++ /dev/null
@@ -1,228 +0,0 @@
-#!/usr/bin/env python3
-"""
-Compare uv's resolution with pip-compile on a number of requirement sets and python
-versions.
-
-If the first resolution diverged, we run a second "coerced" try in which uv gets the
-output of pip as additional input to check if it considers this resolution possible.
-"""
-import json
-import os
-import subprocess
-import time
-from argparse import ArgumentParser
-from hashlib import sha256
-from pathlib import Path
-from subprocess import check_output, check_call, CalledProcessError
-
-default_targets = [
-    "pandas",
-    "pandas==2.1",
-    "black[d,jupyter]",
-    "meine_stadt_transparent",
-    "jupyter",
-    "transformers[tensorboard]",
-    "transformers[accelerate,agents,audio,codecarbon,deepspeed,deepspeed-testing,dev,dev-tensorflow,dev-torch,flax,flax-speech,ftfy,integrations,ja,modelcreation,onnx,onnxruntime,optuna,quality,ray,retrieval,sagemaker,sentencepiece,sigopt,sklearn,speech,testing,tf,tf-cpu,tf-speech,timm,tokenizers,torch,torch-speech,torch-vision,torchhub,video,vision]",
-]
-
-data_root = Path(__file__).parent
-project_root = Path(
-    check_output(["git", "rev-parse", "--show-toplevel"], text=True).strip(),
-)
-
-
-def resolve_pip(targets: list[str], pip_compile: Path) -> list[str]:
-    output = check_output(
-        [
-            pip_compile,
-            "--allow-unsafe",
-            "--strip-extras",
-            "--upgrade",
-            "--output-file",
-            "-",
-            "--quiet",
-            "-",
-        ],
-        input=" ".join(targets),
-        stderr=subprocess.STDOUT,
-        text=True,
-    )
-    pip_deps = []
-    for line in output.splitlines():
-        if not line.strip() or line.lstrip().startswith("#"):
-            continue
-        pip_deps.append(line)
-    pip_deps.sort()
-    return pip_deps
-
-
-def resolve_uv(targets: list[str], venv: Path, profile: str = "dev") -> list[str]:
-    target_profile = profile if profile != "dev" else "debug"
-    output = check_output(
-        [
-            project_root.joinpath("target").joinpath(target_profile).joinpath("uv-dev"),
-            "resolve",
-            "--format",
-            "expanded",
-            *targets,
-        ],
-        text=True,
-        stderr=subprocess.STDOUT,
-        env={
-            **os.environ,
-            "VIRTUAL_ENV": venv,
-        },
-    )
-    uv_deps = []
-    for line in output.splitlines():
-        uv_deps.append(line.replace(" ", ""))
-    uv_deps.sort()
-    return uv_deps
-
-
-def compare_for_python_version(
-    python_major: int, python_minor: int, targets: list[str], profile: str = "dev"
-):
-    venvs = data_root.joinpath("venvs")
-    venvs.mkdir(exist_ok=True)
-    venvs.joinpath(".gitignore").write_text("*")
-    cache = data_root.joinpath("pip_compile_cache")
-    cache.mkdir(exist_ok=True)
-    cache.joinpath(".gitignore").write_text("*")
-    pip_compile_venv = venvs.joinpath(f"pip_compile_py{python_major}{python_minor}")
-    if not pip_compile_venv.is_dir():
-        check_call(
-            ["virtualenv", "-p", f"{python_major}.{python_minor}", pip_compile_venv]
-        )
-        check_call(
-            [pip_compile_venv.joinpath("bin").joinpath("pip"), "install", "pip-tools"]
-        )
-    pip_compile = pip_compile_venv.joinpath("bin").joinpath("pip-compile")
-    for target in targets:
-        digest = (
-            f"py{python_major}{python_minor}-"
-            + sha256(str(target).encode()).hexdigest()
-        )
-        cache_file = cache.joinpath(digest).with_suffix(".json")
-        if cache_file.is_file():
-            pip_result = json.loads(cache_file.read_text())
-            pip_time = 0.0
-        else:
-            start = time.time()
-            try:
-                pip_result = resolve_pip([target], pip_compile)
-                cache_file.write_text(json.dumps(pip_result))
-            except CalledProcessError as e:
-                pip_result = e
-            pip_time = time.time() - start
-
-        start = time.time()
-        try:
-            uv_result = resolve_uv([target], pip_compile_venv, profile=profile)
-        except CalledProcessError as e:
-            uv_result = e
-        uv_time = time.time() - start
-
-        if isinstance(pip_result, CalledProcessError) and isinstance(
-            uv_result, CalledProcessError
-        ):
-            print(f"Both failed {python_major}.{python_minor} {target}")
-            continue
-        elif isinstance(pip_result, CalledProcessError):
-            # Make the output a bit more readable
-            output = "\n".join(pip_result.output.splitlines()[:10])
-            print(
-                f"Only pip failed {python_major}.{python_minor} {target}: "
-                f"{pip_result}\n---\n{output}\n---"
-            )
-            continue
-        elif isinstance(uv_result, CalledProcessError):
-            # Make the output a bit more readable
-            output = "\n".join(uv_result.output.splitlines()[:10])
-            print(
-                f"Only uv failed {python_major}.{python_minor} {target}: "
-                f"{uv_result}\n---\n{output}\n---"
-            )
-            continue
-
-        if pip_result != uv_result and isinstance(pip_result, list):
-            # Maybe, both resolution are allowed? By adding all constraints from the pip
-            # resolution we check whether uv considers this resolution possible
-            # (vs. there is a bug in uv where we wouldn't pick those versions)
-            start = time.time()
-            try:
-                uv_result2 = resolve_uv(
-                    [target, *pip_result], pip_compile_venv, profile=profile
-                )
-            except CalledProcessError as e:
-                uv_result2 = e
-            uv_time2 = time.time() - start
-            if uv_result2 == pip_result:
-                print(
-                    f"Equal (coerced) {python_major}.{python_minor} "
-                    f"(pip: {pip_time:.3}s, uv: {uv_time2:.3}s) {target}"
-                )
-                continue
-
-        if pip_result == uv_result:
-            print(
-                f"Equal {python_major}.{python_minor} "
-                f"(pip: {pip_time:.3}s, uv: {uv_time:.3}s) {target}"
-            )
-        else:
-            print(
-                f"Different {python_major}.{python_minor} "
-                f"(pip: {pip_time:.3}s, uv: {uv_time:.3}s) {target}"
-            )
-            print(f"pip: {pip_result}")
-            print(f"uv: {uv_result}")
-            while True:
-                if pip_result and uv_result:
-                    if pip_result[0] == uv_result[0]:
-                        pip_result.pop(0)
-                        uv_result.pop(0)
-                    elif pip_result[0] < uv_result[0]:
-                        print(f"- {pip_result.pop(0)}")
-                    else:
-                        print(f"+ {uv_result.pop(0)}")
-                elif pip_result:
-                    print(f"- {pip_result.pop(0)}")
-                elif uv_result:
-                    print(f"+ {uv_result.pop(0)}")
-                else:
-                    break
-
-
-def main():
-    parser = ArgumentParser()
-    parser.add_argument("--target", help="A list of requirements")
-    parser.add_argument("-p", "--python")
-    parser.add_argument("--release", action="store_true")
-    args = parser.parse_args()
-
-    if args.target:
-        targets = [args.target]
-    else:
-        targets = default_targets
-
-    if args.release:
-        profile = "release"
-    else:
-        profile = "dev"
-
-    check_call(["cargo", "build", "--bin", "uv-dev", "--profile", profile])
-
-    if args.python:
-        python_major = int(args.python.split(".")[0])
-        python_minor = int(args.python.split(".")[1])
-
-        assert python_major == 3
-        assert python_minor >= 8
-        compare_for_python_version(python_major, python_minor, targets, profile=profile)
-    else:
-        for python_minor in range(8, 12):
-            compare_for_python_version(3, python_minor, targets, profile=profile)
-
-
-if __name__ == "__main__":
-    main()