scikit-learn
diff --git a/‎.git-blame-ignore-revs
Copy file name to clipboardExpand all lines: .git-blame-ignore-revs
+3Lines changed: 3 additions & 0 deletions b/‎.git-blame-ignore-revs
Copy file name to clipboardExpand all lines: .git-blame-ignore-revs
+3Lines changed: 3 additions & 0 deletions
diff --git a/‎.github/workflows/assign.yml
Copy file name to clipboardExpand all lines: .github/workflows/assign.yml
+3-3Lines changed: 3 additions & 3 deletions b/‎.github/workflows/assign.yml
Copy file name to clipboardExpand all lines: .github/workflows/assign.yml
+3-3Lines changed: 3 additions & 3 deletions
diff --git a/‎.github/workflows/check-changelog.yml
Copy file name to clipboardExpand all lines: .github/workflows/check-changelog.yml
+2-2Lines changed: 2 additions & 2 deletions b/‎.github/workflows/check-changelog.yml
Copy file name to clipboardExpand all lines: .github/workflows/check-changelog.yml
+2-2Lines changed: 2 additions & 2 deletions
diff --git a/‎.github/workflows/check-manifest.yml
Copy file name to clipboardExpand all lines: .github/workflows/check-manifest.yml
+3Lines changed: 3 additions & 0 deletions b/‎.github/workflows/check-manifest.yml
Copy file name to clipboardExpand all lines: .github/workflows/check-manifest.yml
+3Lines changed: 3 additions & 0 deletions
diff --git a/‎.github/workflows/wheels.yml
Copy file name to clipboardExpand all lines: .github/workflows/wheels.yml
+4-2Lines changed: 4 additions & 2 deletions b/‎.github/workflows/wheels.yml
Copy file name to clipboardExpand all lines: .github/workflows/wheels.yml
+4-2Lines changed: 4 additions & 2 deletions
diff --git a/‎.gitignore
Copy file name to clipboardExpand all lines: .gitignore
+3Lines changed: 3 additions & 0 deletions b/‎.gitignore
Copy file name to clipboardExpand all lines: .gitignore
+3Lines changed: 3 additions & 0 deletions
diff --git a/‎.pre-commit-config.yaml
Copy file name to clipboardExpand all lines: .pre-commit-config.yaml
+1-1Lines changed: 1 addition & 1 deletion b/‎.pre-commit-config.yaml
Copy file name to clipboardExpand all lines: .pre-commit-config.yaml
+1-1Lines changed: 1 addition & 1 deletion
diff --git a/‎README.rst
Copy file name to clipboardExpand all lines: README.rst
+5-2Lines changed: 5 additions & 2 deletions b/‎README.rst
Copy file name to clipboardExpand all lines: README.rst
+5-2Lines changed: 5 additions & 2 deletions
diff --git a/‎azure-pipelines.yml
Copy file name to clipboardExpand all lines: azure-pipelines.yml
+5-3Lines changed: 5 additions & 3 deletions b/‎azure-pipelines.yml
Copy file name to clipboardExpand all lines: azure-pipelines.yml
+5-3Lines changed: 5 additions & 3 deletions
diff --git a/‎benchmarks/bench_hist_gradient_boosting_threading.py
Copy file name to clipboardExpand all lines: benchmarks/bench_hist_gradient_boosting_threading.py
+1-1Lines changed: 1 addition & 1 deletion b/‎benchmarks/bench_hist_gradient_boosting_threading.py
Copy file name to clipboardExpand all lines: benchmarks/bench_hist_gradient_boosting_threading.py
+1-1Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/bench_isotonic.py
Copy file name to clipboardExpand all lines: benchmarks/bench_isotonic.py
+1-1Lines changed: 1 addition & 1 deletion b/‎benchmarks/bench_isotonic.py
Copy file name to clipboardExpand all lines: benchmarks/bench_isotonic.py
+1-1Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/bench_lasso.py
Copy file name to clipboardExpand all lines: benchmarks/bench_lasso.py
+1-1Lines changed: 1 addition & 1 deletion b/‎benchmarks/bench_lasso.py
Copy file name to clipboardExpand all lines: benchmarks/bench_lasso.py
+1-1Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/bench_plot_nmf.py
Copy file name to clipboardExpand all lines: benchmarks/bench_plot_nmf.py
+1-1Lines changed: 1 addition & 1 deletion b/‎benchmarks/bench_plot_nmf.py
Copy file name to clipboardExpand all lines: benchmarks/bench_plot_nmf.py
+1-1Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/bench_plot_randomized_svd.py
Copy file name to clipboardExpand all lines: benchmarks/bench_plot_randomized_svd.py
+4-3Lines changed: 4 additions & 3 deletions b/‎benchmarks/bench_plot_randomized_svd.py
Copy file name to clipboardExpand all lines: benchmarks/bench_plot_randomized_svd.py
+4-3Lines changed: 4 additions & 3 deletions
diff --git a/‎benchmarks/bench_random_projections.py
Copy file name to clipboardExpand all lines: benchmarks/bench_random_projections.py
+3-3Lines changed: 3 additions & 3 deletions b/‎benchmarks/bench_random_projections.py
Copy file name to clipboardExpand all lines: benchmarks/bench_random_projections.py
+3-3Lines changed: 3 additions & 3 deletions
diff --git a/‎benchmarks/bench_rcv1_logreg_convergence.py
Copy file name to clipboardExpand all lines: benchmarks/bench_rcv1_logreg_convergence.py
+1-1Lines changed: 1 addition & 1 deletion b/‎benchmarks/bench_rcv1_logreg_convergence.py
Copy file name to clipboardExpand all lines: benchmarks/bench_rcv1_logreg_convergence.py
+1-1Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/bench_saga.py
Copy file name to clipboardExpand all lines: benchmarks/bench_saga.py
+1-1Lines changed: 1 addition & 1 deletion b/‎benchmarks/bench_saga.py
Copy file name to clipboardExpand all lines: benchmarks/bench_saga.py
+1-1Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/bench_sample_without_replacement.py
Copy file name to clipboardExpand all lines: benchmarks/bench_sample_without_replacement.py
+1-1Lines changed: 1 addition & 1 deletion b/‎benchmarks/bench_sample_without_replacement.py
Copy file name to clipboardExpand all lines: benchmarks/bench_sample_without_replacement.py
+1-1Lines changed: 1 addition & 1 deletion
diff --git a/‎benchmarks/bench_tree.py
Copy file name to clipboardExpand all lines: benchmarks/bench_tree.py
+1-1Lines changed: 1 addition & 1 deletion b/‎benchmarks/bench_tree.py
Copy file name to clipboardExpand all lines: benchmarks/bench_tree.py
+1-1Lines changed: 1 addition & 1 deletion
diff --git a/‎build_tools/azure/install.sh
Copy file name to clipboardExpand all lines: build_tools/azure/install.sh
+2-12Lines changed: 2 additions & 12 deletions b/‎build_tools/azure/install.sh
Copy file name to clipboardExpand all lines: build_tools/azure/install.sh
+2-12Lines changed: 2 additions & 12 deletions
diff --git a/‎build_tools/azure/posix.yml
Copy file name to clipboardExpand all lines: build_tools/azure/posix.yml
+1-1Lines changed: 1 addition & 1 deletion b/‎build_tools/azure/posix.yml
Copy file name to clipboardExpand all lines: build_tools/azure/posix.yml
+1-1Lines changed: 1 addition & 1 deletion
diff --git a/‎build_tools/circle/build_test_arm.sh
Copy file name to clipboardExpand all lines: build_tools/circle/build_test_arm.sh
+1-1Lines changed: 1 addition & 1 deletion b/‎build_tools/circle/build_test_arm.sh
Copy file name to clipboardExpand all lines: build_tools/circle/build_test_arm.sh
+1-1Lines changed: 1 addition & 1 deletion
diff --git a/‎doc/about.rst
Copy file name to clipboardExpand all lines: doc/about.rst
+4-30Lines changed: 4 additions & 30 deletions b/‎doc/about.rst
Copy file name to clipboardExpand all lines: doc/about.rst
+4-30Lines changed: 4 additions & 30 deletions
diff --git a/‎doc/computing/parallelism.rst
Copy file name to clipboardExpand all lines: doc/computing/parallelism.rst
-15Lines changed: 0 additions & 15 deletions b/‎doc/computing/parallelism.rst
Copy file name to clipboardExpand all lines: doc/computing/parallelism.rst
-15Lines changed: 0 additions & 15 deletions
@@ -19,3 +19,6 @@
 
 # PR 20502: Runs Black on examples
 70a185ae59b4362633d18b0d0083abb1b6f7370c
+
+# PR 22474: Update to Black 22.1.0
+1fc86b6aacd89da44a3b4e8abf7c3e2ba4336ffe
@@ -7,10 +7,10 @@ on:
 jobs:
   one:
     runs-on: ubuntu-latest
+    # Note that string comparisons are not case sensitive.
     if: >-
-      (github.event.comment.body == 'take' ||
-       github.event.comment.body == 'Take')
-      && !github.event.issue.assignee
+       startsWith(github.event.comment.body, '/take')
+       && !github.event.issue.assignee
     steps:
       - run: |
           echo "Assigning issue ${{ github.event.issue.number }} to ${{ github.event.comment.user.login }}"
 
@@ -61,8 +61,8 @@ jobs:
             echo "If you see this error and there is already a changelog entry,"
             echo "check that the PR number is correct."
             echo ""
-            echo "If you believe that this PR does no warrant a changelog"
-            echo "entry, say so in a comment so that a maintainer will label "
+            echo "If you believe that this PR does not warrant a changelog"
+            echo "entry, say so in a comment so that a maintainer will label"
             echo "the PR with 'No Changelog Needed' to bypass this check."
             exit 1
           fi
@@ -6,6 +6,9 @@ on:
 
 jobs:
   check:
+    # Don't run on forks
+    if: github.repository == 'scikit-learn/scikit-learn'
+
     runs-on: ubuntu-latest
     steps:
       - uses: actions/checkout@v2
 
@@ -49,11 +49,13 @@ jobs:
       matrix:
         include:
           # Windows 64 bit
-          - os: windows-latest
+          # Note: windows-2019 is needed for older Python versions:
+          # https://github.com/scikit-learn/scikit-learn/issues/22530
+          - os: windows-2019
             python: 37
             bitness: 64
             platform_id: win_amd64
-          - os: windows-latest
+          - os: windows-2019
             python: 38
             bitness: 64
             platform_id: win_amd64
 
@@ -75,6 +75,9 @@ _configtest.o.d
 # Used by mypy
 .mypy_cache/
 
+# virtualenv from advanced installation guide
+sklearn-env/
+
 # files generated from a template
 sklearn/_loss/_loss.pyx
 sklearn/utils/_seq_dataset.pyx
 
@@ -6,7 +6,7 @@ repos:
     -   id: end-of-file-fixer
     -   id: trailing-whitespace
 -   repo: https://github.com/psf/black
-    rev: 21.6b0
+    rev: 22.1.0
     hooks:
     -   id: black
 -   repo: https://gitlab.com/pycqa/flake8
 
@@ -35,7 +35,7 @@
 .. |PythonMinVersion| replace:: 3.7
 .. |NumPyMinVersion| replace:: 1.14.6
 .. |SciPyMinVersion| replace:: 1.1.0
-.. |JoblibMinVersion| replace:: 0.11
+.. |JoblibMinVersion| replace:: 1.0.0
 .. |ThreadpoolctlMinVersion| replace:: 2.0.0
 .. |MatplotlibMinVersion| replace:: 2.2.3
 .. |Scikit-ImageMinVersion| replace:: 0.14.5
@@ -89,7 +89,7 @@ User installation
 ~~~~~~~~~~~~~~~~~
 
 If you already have a working installation of numpy and scipy,
-the easiest way to install scikit-learn is using ``pip``   ::
+the easiest way to install scikit-learn is using ``pip``::
 
     pip install -U scikit-learn
 
@@ -184,6 +184,8 @@ Communication
 
 - Mailing list: https://mail.python.org/mailman/listinfo/scikit-learn
 - Gitter: https://gitter.im/scikit-learn/scikit-learn
+- Blog: https://blog.scikit-learn.org
+- Calendar: https://blog.scikit-learn.org/calendar/
 - Twitter: https://twitter.com/scikit_learn
 - Twitter (commits): https://twitter.com/sklearn_commits
 - Stack Overflow: https://stackoverflow.com/questions/tagged/scikit-learn
@@ -193,6 +195,7 @@ Communication
 - YouTube: https://www.youtube.com/channel/UCJosFjYm0ZYVUARxuOZqnnw/playlists
 - Facebook: https://www.facebook.com/scikitlearnofficial/
 - Instagram: https://www.instagram.com/scikitlearnofficial/
+- TikTok: https://www.tiktok.com/@scikit.learn
 
 Citation
 ~~~~~~~~
 
@@ -45,7 +45,7 @@ jobs:
         versionSpec: '3.9'
     - bash: |
         # Include pytest compatibility with mypy
-        pip install pytest flake8 mypy==0.782 black==21.6b0
+        pip install pytest flake8 mypy==0.782 black==22.1.0
       displayName: Install linters
     - bash: |
         black --check --diff .
@@ -190,7 +190,7 @@ jobs:
         PANDAS_VERSION: 'none'
         THREADPOOLCTL_VERSION: 'min'
         COVERAGE: 'false'
-      # Linux + Python 3.7 build with OpenBLAS and without SITE_JOBLIB
+      # Linux + Python 3.7 build with OpenBLAS
       py37_conda_defaults_openblas:
         DISTRIB: 'conda'
         CONDA_CHANNEL: 'defaults'  # Anaconda main channel
@@ -206,6 +206,7 @@ jobs:
       pylatest_pip_openblas_pandas:
         DISTRIB: 'conda-pip-latest'
         PYTHON_VERSION: '3.9'
+        PYTEST_VERSION: '6.2.5'
         CHECK_PYTEST_SOFT_DEPENDENCY: 'true'
         TEST_DOCSTRINGS: 'true'
         CHECK_WARNINGS: 'true'
@@ -273,7 +274,8 @@ jobs:
         PYTHON_VERSION: '3.7'
         CHECK_WARNINGS: 'true'
         PYTHON_ARCH: '64'
-        PYTEST_VERSION: '*'
+        # Unpin when pytest stalling issue is fixed
+        PYTEST_VERSION: '6.2.5'
         COVERAGE: 'true'
         # Temporary fix for setuptools to use distutils from standard lib
         # https://github.com/numpy/numpy/issues/17216
 
@@ -239,7 +239,7 @@ def one_run(n_threads, n_samples):
 
 
 max_threads = os.cpu_count()
-n_threads_list = [2 ** i for i in range(8) if (2 ** i) < max_threads]
+n_threads_list = [2**i for i in range(8) if (2**i) < max_threads]
 n_threads_list.append(max_threads)
 
 sklearn_scores = []
 
@@ -86,7 +86,7 @@ def bench_isotonic_regression(Y):
 
     timings = []
     for exponent in range(args.log_min_problem_size, args.log_max_problem_size):
-        n = 10 ** exponent
+        n = 10**exponent
         Y = DATASET_GENERATORS[args.dataset](n)
         time_per_iteration = [
             bench_isotonic_regression(Y) for i in range(args.iterations)
 
@@ -39,7 +39,7 @@ def compute_bench(alpha, n_samples, n_features, precompute):
                 coef=True,
             )
 
-            X /= np.sqrt(np.sum(X ** 2, axis=0))  # Normalize data
+            X /= np.sqrt(np.sum(X**2, axis=0))  # Normalize data
 
             gc.collect()
             print("- benchmarking Lasso")
 
@@ -162,7 +162,7 @@ def _fit_projected_gradient(X, W, H, tol, max_iter, nls_max_iter, alpha, l1_rati
         proj_grad_W = squared_norm(gradW * np.logical_or(gradW < 0, W > 0))
         proj_grad_H = squared_norm(gradH * np.logical_or(gradH < 0, H > 0))
 
-        if (proj_grad_W + proj_grad_H) / init_grad < tol ** 2:
+        if (proj_grad_W + proj_grad_H) / init_grad < tol**2:
             break
 
         # update W
 
@@ -50,9 +50,10 @@
 
 References
 ----------
-(1) Finding structure with randomness: Stochastic algorithms for constructing
-    approximate matrix decompositions
-    Halko, et al., 2009 https://arxiv.org/abs/0909.4061
+(1) :arxiv:`"Finding structure with randomness:
+    Stochastic algorithms for constructing approximate matrix decompositions."
+    <0909.4061>`
+    Halko, et al., (2009)
 
 (2) A randomized algorithm for the decomposition of matrices
     Per-Gunnar Martinsson, Vladimir Rokhlin and Mark Tygert
 
@@ -38,7 +38,7 @@ def type_auto_or_int(val):
 
 
 def compute_time(t_start, delta):
-    mu_second = 0.0 + 10 ** 6  # number of microseconds in a second
+    mu_second = 0.0 + 10**6  # number of microseconds in a second
 
     return delta.seconds + delta.microseconds / mu_second
 
@@ -109,7 +109,7 @@ def print_row(clf_type, time_fit, time_transform):
     op.add_option(
         "--n-features",
         dest="n_features",
-        default=10 ** 4,
+        default=10**4,
         type=int,
         help="Number of features in the benchmarks",
     )
@@ -124,7 +124,7 @@ def print_row(clf_type, time_fit, time_transform):
     op.add_option(
         "--ratio-nonzeros",
         dest="ratio_nonzeros",
-        default=10 ** -3,
+        default=10**-3,
         type=float,
         help="Number of features in the benchmarks",
     )
 
@@ -149,7 +149,7 @@ def plot_dloss(clfs):
 
 def get_max_squared_sum(X):
     """Get the maximum row-wise sum of squares"""
-    return np.sum(X ** 2, axis=1).max()
+    return np.sum(X**2, axis=1).max()
 
 
 rcv1 = fetch_rcv1()
 
@@ -119,7 +119,7 @@ def fit_single(
                 # Lightning predict_proba is not implemented for n_classes > 2
                 y_pred = _predict_proba(lr, X)
             score = log_loss(y, y_pred, normalize=False) / n_samples
-            score += 0.5 * alpha * np.sum(lr.coef_ ** 2) + beta * np.sum(
+            score += 0.5 * alpha * np.sum(lr.coef_**2) + beta * np.sum(
                 np.abs(lr.coef_)
             )
             scores.append(score)
 
@@ -16,7 +16,7 @@
 
 
 def compute_time(t_start, delta):
-    mu_second = 0.0 + 10 ** 6  # number of microseconds in a second
+    mu_second = 0.0 + 10**6  # number of microseconds in a second
 
     return delta.seconds + delta.microseconds / mu_second
 
 
@@ -22,7 +22,7 @@
 scikit_classifier_results = []
 scikit_regressor_results = []
 
-mu_second = 0.0 + 10 ** 6  # number of microseconds in a second
+mu_second = 0.0 + 10**6  # number of microseconds in a second
 
 
 def bench_scikit_tree_classifier(X, Y):
 
@@ -63,11 +63,7 @@ if [[ "$DISTRIB" == "conda" || "$DISTRIB" == *"mamba"* ]]; then
 
     if [[ "$UNAMESTR" == "Darwin" ]]; then
         if [[ "$SKLEARN_TEST_NO_OPENMP" != "true" ]]; then
-            # on macOS, install an OpenMP-enabled clang/llvm from conda-forge.
-            # TODO: Remove !=1.1.0 when the following is fixed:
-            # sklearn/svm/_libsvm.cpython-38-darwin.so,
-            # 2): Symbol not found: _svm_check_parameter error
-            TO_INSTALL="$TO_INSTALL compilers>=1.0.4,!=1.1.0 llvm-openmp"
+            TO_INSTALL="$TO_INSTALL compilers llvm-openmp"
         else
             # Without openmp, we use the system clang. Here we use /usr/bin/ar
             # instead because llvm-ar errors
@@ -142,16 +138,10 @@ if [[ "$COVERAGE" == "true" ]]; then
     python -m pip install codecov pytest-cov coverage==6.2
 fi
 
-if [[ "$PYTEST_XDIST_VERSION" != "none" ]]; then
-    python -m pip install pytest-xdist
-fi
-
 if [[ "$TEST_DOCSTRINGS" == "true" ]]; then
     # numpydoc requires sphinx
     python -m pip install sphinx
-    # TODO: update the docstring checks to be compatible with new
-    # numpydoc versions
-    python -m pip install "numpydoc<1.2"
+    python -m pip install numpydoc
 fi
 
 python --version
 
@@ -30,7 +30,7 @@ jobs:
     PYAMG_VERSION: 'latest'
     PILLOW_VERSION: 'latest'
     MATPLOTLIB_VERSION: 'latest'
-    PYTEST_VERSION: 'latest'
+    PYTEST_VERSION: '6.2.5'
     # Disable pytest-xdist as it can stall builds
     PYTEST_XDIST_VERSION: 'latest'
     THREADPOOLCTL_VERSION: 'latest'
 
@@ -62,7 +62,7 @@ fi
 if [[ "$TEST_DOCSTRINGS" == "true" ]]; then
     # numpydoc requires sphinx
     mamba install --verbose -y sphinx
-    mamba install --verbose -y "numpydoc<1.2"
+    mamba install --verbose -y numpydoc
 fi
 
 python --version
 
@@ -244,19 +244,18 @@ July 2017.
    <div class="sk-sponsor-div">
    <div class="sk-sponsor-div-box">
 
-`Zalando SE <https://corporate.zalando.com/en>`_ funds Adrin Jalali since
-August 2020.
+`Hugging Face <https://huggingface.co/>`_ funds Adrin Jalali since 2022.
 
 .. raw:: html
 
    </div>
 
    <div class="sk-sponsor-div-box">
 
-.. image:: images/zalando_logo.png
-   :width: 100pt
+.. image:: images/huggingface_logo-noborder.png
+   :width: 55pt
    :align: center
-   :target: https://corporate.zalando.com/en
+   :target: https://huggingface.co/
 
 .. raw:: html
 
@@ -423,31 +422,6 @@ time of Joris van den Bossche (2017-2018).
    </div>
    </div>
 
-............
-
-.. raw:: html
-
-   <div class="sk-sponsor-div">
-   <div class="sk-sponsor-div-box">
-
-`Anaconda, Inc <https://www.anaconda.com/>`_ funded Adrin Jalali in 2019.
-
-.. raw:: html
-
-   </div>
-
-   <div class="sk-sponsor-div-box">
-
-.. image:: images/anaconda.png
-   :width: 100pt
-   :align: center
-   :target: https://www.anaconda.com/
-
-.. raw:: html
-
-   </div>
-   </div>
-
 ..........................
 
 .. raw:: html
 
@@ -179,21 +179,6 @@ Environment variables
 
 These environment variables should be set before importing scikit-learn.
 
-:SKLEARN_SITE_JOBLIB:
-
-    When this environment variable is set to a non zero value,
-    scikit-learn uses the site joblib rather than its vendored version.
-    Consequently, joblib must be installed for scikit-learn to run.
-    Note that using the site joblib is at your own risks: the versions of
-    scikit-learn and joblib need to be compatible. Currently, joblib 0.11+
-    is supported. In addition, dumps from joblib.Memory might be incompatible,
-    and you might loose some caches and have to redownload some datasets.
-
-    .. deprecated:: 0.21
-
-       As of version 0.21 this parameter has no effect, vendored joblib was
-       removed and site joblib is always used.
-
 :SKLEARN_ASSUME_FINITE:
 
     Sets the default value for the `assume_finite` argument of
Original file line number	Diff line number	Diff line change
`@@ -39,7 +39,7 @@ def compute_bench(alpha, n_samples, n_features, precompute):`
`39`	`39`	`coef=True,`
`40`	`40`	`)`
`41`	`41`
`42`		`- X /= np.sqrt(np.sum(X ** 2, axis=0)) # Normalize data`
	`42`	`+ X /= np.sqrt(np.sum(X**2, axis=0)) # Normalize data`
`43`	`43`
`44`	`44`	`gc.collect()`
`45`	`45`	`print("- benchmarking Lasso")`