
Commit f1f6a3c

Refactor sample_weights as generic scorer_params

1 parent 7612a1f · commit f1f6a3c

7 files changed, +110 −101 lines changed

sklearn/cross_validation.py (+32 −35)

```diff
@@ -1078,7 +1078,7 @@ def __len__(self):
 
 def cross_val_score(estimator, X, y=None, scoring=None, cv=None, n_jobs=1,
                     verbose=0, fit_params=None, pre_dispatch='2*n_jobs',
-                    sample_weight=None):
+                    scorer_params=None):
     """Evaluate a score by cross-validation
 
     Parameters
@@ -1093,9 +1093,6 @@ def cross_val_score(estimator, X, y=None, scoring=None, cv=None, n_jobs=1,
         The target variable to try to predict in the case of
         supervised learning.
 
-    sample_weight : array-like, optional, default: None
-        Sample weights.
-
     scoring : string, callable or None, optional, default: None
         A string (see model evaluation documentation) or
         a scorer callable object / function with signature
@@ -1134,12 +1131,16 @@ def cross_val_score(estimator, X, y=None, scoring=None, cv=None, n_jobs=1,
             - A string, giving an expression as a function of n_jobs,
               as in '2*n_jobs'
 
+    scorer_params : dict, optional
+        Parameters to pass to the scorer. Can be used for sample weights
+        and sample groups.
+
     Returns
     -------
     scores : array of float, shape=(len(list(cv)),)
         Array of scores of the estimator for each run of the cross validation.
     """
-    X, y, sample_weight = indexable(X, y, sample_weight)
+    X, y = indexable(X, y)
 
     cv = _check_cv(cv, X, y, classifier=is_classifier(estimator))
     scorer = check_scoring(estimator, scoring=scoring)
@@ -1148,16 +1149,14 @@ def cross_val_score(estimator, X, y=None, scoring=None, cv=None, n_jobs=1,
     parallel = Parallel(n_jobs=n_jobs, verbose=verbose,
                         pre_dispatch=pre_dispatch)
     scores = parallel(delayed(_fit_and_score)(clone(estimator), X, y,
-                                              sample_weight, scorer,
-                                              train, test, verbose, None,
-                                              fit_params)
+                                              scorer, train, test, verbose,
+                                              None, fit_params, scorer_params)
                       for train, test in cv)
     return np.array(scores)[:, 0]
 
 
-def _fit_and_score(estimator, X, y, sample_weight,
-                   scorer, train, test, verbose, parameters,
-                   fit_params, return_train_score=False,
+def _fit_and_score(estimator, X, y, scorer, train, test, verbose, parameters,
+                   fit_params, scorer_params, return_train_score=False,
                    return_parameters=False):
     """Fit estimator and compute scores for a given dataset split.
 
@@ -1173,9 +1172,6 @@ def _fit_and_score(estimator, X, y, sample_weight,
         The target variable to try to predict in the case of
         supervised learning.
 
-    sample_weight : array-like or None
-        Sample weights.
-
     scoring : callable
         A scorer callable object / function with signature
         ``scorer(estimator, X, y)``.
@@ -1195,6 +1191,9 @@ def _fit_and_score(estimator, X, y, sample_weight,
     fit_params : dict or None
         Parameters that will be passed to ``estimator.fit``.
 
+    scorer_params : dict or None
+        Parameters that will be passed to the scorer.
+
     return_train_score : boolean, optional, default: False
         Compute and return score on training set.
 
@@ -1233,33 +1232,36 @@ def _fit_and_score(estimator, X, y, sample_weight,
                        if hasattr(v, '__len__') and len(v) == n_samples else v)
                       for k, v in fit_params.items()])
 
+    # Same, but take both slices
+    scorer_params = scorer_params if scorer_params is not None else {}
+    train_scorer_params = dict([(k, np.asarray(v)[train]
+                                 if hasattr(v, '__len__')
+                                 and len(v) == n_samples
+                                 else v)
+                                for k, v in scorer_params.items()])
+    test_scorer_params = dict([(k, np.asarray(v)[test]
+                                if hasattr(v, '__len__')
+                                and len(v) == n_samples
+                                else v)
+                               for k, v in scorer_params.items()])
+
     if parameters is not None:
         estimator.set_params(**parameters)
 
     start_time = time.time()
 
-    X_train, y_train, sample_weight_train = _safe_split(
-        estimator, X, y, sample_weight, train)
-    X_test, y_test, sample_weight_test = _safe_split(
-        estimator, X, y, sample_weight, test, train)
-
-    test_score_params = {}
-    train_score_params = {}
-    if sample_weight is not None:
-        fit_params = fit_params.copy()
-        fit_params['sample_weight'] = sample_weight_train
-        test_score_params['sample_weight'] = sample_weight_test
-        train_score_params['sample_weight'] = sample_weight_train
+    X_train, y_train = _safe_split(estimator, X, y, train)
+    X_test, y_test = _safe_split(estimator, X, y, test, train)
 
     if y_train is None:
         estimator.fit(X_train, **fit_params)
     else:
         estimator.fit(X_train, y_train, **fit_params)
     test_score = _score(estimator, X_test, y_test, scorer,
-                        **test_score_params)
+                        **test_scorer_params)
     if return_train_score:
         train_score = _score(estimator, X_train, y_train, scorer,
-                             **train_score_params)
+                             **train_scorer_params)
 
     scoring_time = time.time() - start_time
 
@@ -1276,7 +1278,7 @@ def _fit_and_score(estimator, X, y, sample_weight,
     return ret
 
 
-def _safe_split(estimator, X, y, sample_weight, indices, train_indices=None):
+def _safe_split(estimator, X, y, indices, train_indices=None):
     """Create subset of dataset and properly handle kernels."""
     if hasattr(estimator, 'kernel') and callable(estimator.kernel):
         # cannot compute the kernel values with custom function
@@ -1305,12 +1307,7 @@ def _safe_split(estimator, X, y, sample_weight, indices, train_indices=None):
     else:
         y_subset = None
 
-    if sample_weight is not None:
-        sample_weight_subset = np.asarray(sample_weight)[indices]
-    else:
-        sample_weight_subset = None
-
-    return X_subset, y_subset, sample_weight_subset
+    return X_subset, y_subset
 
 
 def _score(estimator, X_test, y_test, scorer, **params):
```
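The caller-facing change: per-sample scoring arguments now travel in a single `scorer_params` dict, and `_fit_and_score` slices any value whose length equals `n_samples` down to each fold's indices. A minimal usage sketch against this commit's API (the estimator, data, and weights are illustrative, and it assumes the scorer in use accepts a `sample_weight` keyword):

```python
import numpy as np
from sklearn.cross_validation import cross_val_score
from sklearn.datasets import make_classification
from sklearn.svm import SVC

X, y = make_classification(n_samples=100, random_state=0)
w = np.random.RandomState(0).rand(100)  # illustrative per-sample weights

# fit_params entries are sliced to each fold's training indices,
# scorer_params entries to the test (or train) indices, so one
# full-length array can serve both fitting and scoring.
scores = cross_val_score(SVC(), X, y, scoring='accuracy',
                         fit_params={'sample_weight': w},
                         scorer_params={'sample_weight': w})
print(scores.mean())
```

Note that, unlike the removed `sample_weight` argument, nothing is copied into `fit_params` automatically anymore: fitting weights and scoring weights are passed independently.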

sklearn/feature_selection/rfe.py (+7 −6)

```diff
@@ -335,16 +335,17 @@ def fit(self, X, y, sample_weight=None):
 
         # Cross-validation
         for n, (train, test) in enumerate(cv):
-            X_train, y_train, sample_weight_train = _safe_split(
-                self.estimator, X, y, sample_weight, train)
-            X_test, y_test, sample_weight_test = _safe_split(
-                self.estimator, X, y, sample_weight, test, train)
+            X_train, y_train = _safe_split(
+                self.estimator, X, y, train)
+            X_test, y_test = _safe_split(
+                self.estimator, X, y, test, train)
 
             fit_params = dict()
             score_params = dict()
             if sample_weight is not None:
-                fit_params['sample_weight'] = sample_weight_train
-                score_params['sample_weight'] = sample_weight_test
+                sample_weight = np.asarray(sample_weight)
+                fit_params['sample_weight'] = sample_weight[train]
+                score_params['sample_weight'] = sample_weight[test]
 
             # Compute a full ranking of the features
             ranking_ = rfe.fit(X_train, y_train, **fit_params).ranking_
```
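The slicing idiom shared by this file and `_fit_and_score` is easy to miss inside the diff: values that have a `__len__` and match `n_samples` are treated as per-sample arrays and indexed by the fold, while everything else passes through unchanged. A standalone sketch of that behavior — `_slice_params` is a hypothetical helper for illustration, not part of this commit:

```python
import numpy as np

def _slice_params(params, indices, n_samples):
    # Mirror of the dict comprehensions in _fit_and_score: per-sample
    # values (length == n_samples) are indexed by the fold indices,
    # everything else (scalars, short sequences) is kept as-is.
    return dict((k, np.asarray(v)[indices]
                 if hasattr(v, '__len__') and len(v) == n_samples
                 else v)
                for k, v in params.items())

params = {'sample_weight': np.arange(6.0), 'some_scalar': 0.5}
train = np.array([0, 2, 4])
print(_slice_params(params, train, n_samples=6))
# {'sample_weight': array([0., 2., 4.]), 'some_scalar': 0.5}
```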

sklearn/grid_search.py (+20 −32)

```diff
@@ -281,7 +281,8 @@ class BaseSearchCV(six.with_metaclass(ABCMeta, BaseEstimator,
     @abstractmethod
     def __init__(self, estimator, scoring=None,
                  fit_params=None, n_jobs=1, iid=True,
-                 refit=True, cv=None, verbose=0, pre_dispatch='2*n_jobs'):
+                 refit=True, cv=None, verbose=0, pre_dispatch='2*n_jobs',
+                 scorer_params=None):
 
         self.scoring = scoring
         self.estimator = estimator
@@ -292,8 +293,9 @@ def __init__(self, estimator, scoring=None,
         self.cv = cv
         self.verbose = verbose
         self.pre_dispatch = pre_dispatch
+        self.scorer_params = scorer_params
 
-    def score(self, X, y=None, sample_weight=None):
+    def score(self, X, y=None, **scorer_params):
         """Returns the score on the given test data and labels, if the search
         estimator has been refit. The ``score`` function of the best estimator
         is used, or the ``scoring`` parameter where unavailable.
@@ -308,24 +310,18 @@ def score(self, X, y=None, sample_weight=None):
             Target relative to X for classification or regression;
             None for unsupervised learning.
 
-        sample_weight : array-like, shape = [n_samples], optional
-            Sample weights.
-
         Returns
         -------
         score : float
 
         """
-        kwargs = {}
-        if sample_weight is not None:
-            kwargs['sample_weight'] = sample_weight
         if hasattr(self.best_estimator_, 'score'):
-            return self.best_estimator_.score(X, y, **kwargs)
+            return self.best_estimator_.score(X, y, **scorer_params)
         if self.scorer_ is None:
             raise ValueError("No score function explicitly defined, "
                              "and the estimator doesn't provide one %s"
                              % self.best_estimator_)
-        return self.scorer_(self.best_estimator_, X, y, **kwargs)
+        return self.scorer_(self.best_estimator_, X, y, **scorer_params)
 
     @property
     def predict(self):
@@ -343,15 +339,15 @@ def decision_function(self):
     def transform(self):
         return self.best_estimator_.transform
 
-    def _fit(self, X, y, sample_weight, parameter_iterable):
+    def _fit(self, X, y, parameter_iterable):
         """Actual fitting, performing the search over parameters."""
 
         estimator = self.estimator
         cv = self.cv
         self.scorer_ = check_scoring(self.estimator, scoring=self.scoring)
 
         n_samples = _num_samples(X)
-        X, y, sample_weight = indexable(X, y, sample_weight)
+        X, y = indexable(X, y)
 
         if y is not None:
             if len(y) != n_samples:
@@ -376,10 +372,10 @@ def _fit(self, X, y, sample_weight, parameter_iterable):
                 n_jobs=self.n_jobs, verbose=self.verbose,
                 pre_dispatch=pre_dispatch
         )(
-            delayed(_fit_and_score)(clone(base_estimator), X, y, sample_weight,
+            delayed(_fit_and_score)(clone(base_estimator), X, y,
                                     self.scorer_, train, test,
                                     self.verbose, parameters, self.fit_params,
-                                    return_parameters=True)
+                                    self.scorer_params, return_parameters=True)
                 for parameters in parameter_iterable
                 for train, test in cv)
 
@@ -422,9 +418,6 @@ def _fit(self, X, y, sample_weight, parameter_iterable):
 
         if self.refit:
             fit_params = self.fit_params
-            if sample_weight is not None:
-                fit_params = fit_params.copy()
-                fit_params['sample_weight'] = sample_weight
             # fit the best estimator using the entire dataset
             # clone first to work around broken estimators
             best_estimator = clone(base_estimator).set_params(
@@ -580,14 +573,15 @@ class GridSearchCV(BaseSearchCV):
 
     def __init__(self, estimator, param_grid, scoring=None,
                  fit_params=None, n_jobs=1, iid=True,
-                 refit=True, cv=None, verbose=0, pre_dispatch='2*n_jobs'):
+                 refit=True, cv=None, verbose=0, pre_dispatch='2*n_jobs',
+                 scorer_params=None):
         super(GridSearchCV, self).__init__(
             estimator, scoring, fit_params, n_jobs, iid,
-            refit, cv, verbose, pre_dispatch)
+            refit, cv, verbose, pre_dispatch, scorer_params)
         self.param_grid = param_grid
         _check_param_grid(param_grid)
 
-    def fit(self, X, y=None, sample_weight=None):
+    def fit(self, X, y=None):
         """Run fit with all sets of parameters.
 
         Parameters
@@ -600,11 +594,8 @@ def fit(self, X, y=None, sample_weight=None):
         y : array-like, shape = [n_samples] or [n_samples, n_output], optional
             Target relative to X for classification or regression;
             None for unsupervised learning.
-
-        sample_weight : array-like, shape = [n_samples], optional
-            Sample weights.
         """
-        return self._fit(X, y, sample_weight, ParameterGrid(self.param_grid))
+        return self._fit(X, y, ParameterGrid(self.param_grid))
 
 
 class RandomizedSearchCV(BaseSearchCV):
@@ -730,17 +721,18 @@ class RandomizedSearchCV(BaseSearchCV):
 
     def __init__(self, estimator, param_distributions, n_iter=10, scoring=None,
                  fit_params=None, n_jobs=1, iid=True, refit=True, cv=None,
-                 verbose=0, pre_dispatch='2*n_jobs', random_state=None):
+                 verbose=0, pre_dispatch='2*n_jobs', random_state=None,
+                 scorer_params=None):
 
         self.param_distributions = param_distributions
         self.n_iter = n_iter
         self.random_state = random_state
         super(RandomizedSearchCV, self).__init__(
             estimator=estimator, scoring=scoring, fit_params=fit_params,
             n_jobs=n_jobs, iid=iid, refit=refit, cv=cv, verbose=verbose,
-            pre_dispatch=pre_dispatch)
+            pre_dispatch=pre_dispatch, scorer_params=scorer_params)
 
-    def fit(self, X, y=None, sample_weight=None):
+    def fit(self, X, y=None):
         """Run fit on the estimator with randomly drawn parameters.
 
         Parameters
@@ -752,12 +744,8 @@ def fit(self, X, y=None, sample_weight=None):
         y : array-like, shape = [n_samples] or [n_samples, n_output], optional
             Target relative to X for classification or regression;
             None for unsupervised learning.
-
-        sample_weight : array-like, shape = [n_samples], optional
-            Sample weights.
-
         """
         sampled_params = ParameterSampler(self.param_distributions,
                                           self.n_iter,
                                           random_state=self.random_state)
-        return self._fit(X, y, sample_weight, sampled_params)
+        return self._fit(X, y, sampled_params)
```
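On the search side, `scorer_params` becomes a constructor argument, stored as `self.scorer_params` and forwarded to every `_fit_and_score` call, while `score()` on a refit search now takes scorer parameters as keyword arguments instead. A hedged usage sketch under the same assumption as above (a scorer that accepts `sample_weight`; estimator and grid are illustrative):

```python
import numpy as np
from sklearn.datasets import make_classification
from sklearn.grid_search import GridSearchCV
from sklearn.svm import SVC

X, y = make_classification(n_samples=100, random_state=0)
w = np.random.RandomState(0).rand(100)

# The same full-length weights are sliced per fold for both fitting
# (via fit_params) and scoring (via scorer_params); on refit=True the
# unsliced fit_params are used to refit on the whole dataset.
search = GridSearchCV(SVC(), param_grid={'C': [0.1, 1.0, 10.0]},
                      scoring='accuracy',
                      fit_params={'sample_weight': w},
                      scorer_params={'sample_weight': w})
search.fit(X, y)
print(search.best_params_)
```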
