Fix/handle categorical features #30798 #30799


Open · wants to merge 9 commits into main
6 changes: 5 additions & 1 deletion in sklearn/feature_selection/_sequential.py

@@ -8,6 +8,7 @@
from numbers import Integral, Real

import numpy as np
import pandas as pd

from ..base import BaseEstimator, MetaEstimatorMixin, _fit_context, clone, is_classifier
from ..metrics import check_scoring, get_scorer_names
@@ -310,7 +311,10 @@ def _get_best_new_feature_score(self, estimator, X, y, cv, current_mask, **param
        candidate_mask[feature_idx] = True
        if self.direction == "backward":
            candidate_mask = ~candidate_mask
-       X_new = X[:, candidate_mask]
+       if isinstance(X, pd.DataFrame):
+           X_new = X.iloc[:, candidate_mask]
+       else:
+           X_new = X[:, candidate_mask]
Comment on lines +314 to +317
Member


You should use the function _safe_indexing instead.

However, at this point it is already too late because X has already been converted. We should avoid the call to validate_data, or at least not validate X, so that it is not converted to a NumPy array.

We also need to use n_features = _num_features(X) to compute the number of features.
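For context on why the branch (or a helper like _safe_indexing) is needed at all: boolean-mask column selection works directly on a NumPy array but not via plain subscripting on a DataFrame. A minimal sketch using only NumPy and pandas (not the scikit-learn helper itself):

```python
import numpy as np
import pandas as pd

X_np = np.array([[1.0, 2.0, 3.0],
                 [4.0, 5.0, 6.0]])
X_df = pd.DataFrame(X_np, columns=["a", "b", "c"])
mask = np.array([True, False, True])

# NumPy: 2-D positional indexing accepts a boolean column mask directly.
X_np_new = X_np[:, mask]

# pandas: a DataFrame does not support NumPy-style 2-D subscripting,
# so the mask must go through .iloc; this also preserves per-column
# dtypes (e.g. categoricals), which is the point of this PR.
X_df_new = X_df.iloc[:, mask]
```

A container-agnostic helper hides exactly this dispatch, which is why the reviewer suggests it over an explicit isinstance check.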

Author

@glemaitre Should I modify the earlier validation step to prevent X from being converted to a NumPy array? If so, should I change how validate_data is called, or should we handle it differently?

Member

validate_data has a skip_check_array arg which would skip conversion to numpy.
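To illustrate the effect of such a flag, here is a toy stand-in (hypothetical, not the actual validate_data implementation): when the array check is skipped, a DataFrame passes through untouched; on the default path it is coerced to an ndarray and the categorical dtype is lost.

```python
import numpy as np
import pandas as pd

def toy_validate(X, skip_check_array=False):
    """Hypothetical stand-in for the conversion step inside validate_data."""
    if skip_check_array:
        return X              # leave the DataFrame (and its dtypes) intact
    return np.asarray(X)      # default path: coerce to a NumPy array

X = pd.DataFrame({"num": [1.0, 2.0],
                  "cat": pd.Categorical(["a", "b"])})

converted = toy_validate(X)                         # ndarray, dtypes lost
preserved = toy_validate(X, skip_check_array=True)  # still a DataFrame
```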

        scores[feature_idx] = cross_val_score(
            estimator,
            X_new,
7 changes: 7 additions & 0 deletions in sklearn/metrics/_ranking.py

@@ -220,7 +220,14 @@ def average_precision_score(

    def _binary_uninterpolated_average_precision(
        y_true, y_score, pos_label=1, sample_weight=None
    ):
+       if len(y_true) < 2:
+           raise ValueError(
+               f"Average precision requires at least 2 samples. Got {len(y_true)}."
+               " A single sample cannot form a precision-recall curve."
+           )

        precision, recall, _ = precision_recall_curve(
            y_true, y_score, pos_label=pos_label, sample_weight=sample_weight
        )
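The guard added in this hunk can be exercised in isolation. A standalone sketch mirroring the same check (not the scikit-learn function itself):

```python
def check_min_samples(y_true):
    """Mirror of the added guard: a single sample cannot form a
    precision-recall curve, so fail fast with a clear message."""
    if len(y_true) < 2:
        raise ValueError(
            f"Average precision requires at least 2 samples. Got {len(y_true)}."
            " A single sample cannot form a precision-recall curve."
        )

# A one-sample input triggers the error; two or more samples pass silently.
try:
    check_min_samples([1])
    msg = None
except ValueError as exc:
    msg = str(exc)
```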