
    biA`                        d Z ddlZddlmZmZmZmZmZ ddlZ	ddl
mZ ddlmZmZ ddlmZmZ ddlmZ dd	lmZmZmZ d
dlmZmZmZ d
dlmZ dee   dee   ddfdZddZ G d de      Z  G d de      Z! ee e!        G d deee      Z" G d de      Z# ee"e#        G d de      Z$ G d de      Z% ee$e%       y)z8Xgboost pyspark integration submodule for estimator API.    N)AnyListOptionalTypeUnion)keyword_only)ParamParams)HasProbabilityColHasRawPredictionCol   )Config)XGBClassifier	XGBRankerXGBRegressor   )_ClassificationModel_SparkXGBEstimator_SparkXGBModel)get_class_name	estimatormodelreturnc                    	  j                         }dt        dt        f	fd	dt        dt        ddf 	fd}|j	                         D ]J  }dt         j                                d	| }t        t        j                         ||
      } |||       L  j                         }|j	                         D ]T  }dt         j                                d| }|dk(  r|dz  }t        t        j                         ||
      } |||       V  j                         }|j	                         D ]J  }dt         j                                d| }t        t        j                         ||
      } |||       L y)zyThis function automatically infer to xgboost parameters and set them
    into corresponding pyspark estimators and modelsvr   c                 X   t        | t        j                        r#t        j                  |       j	                         S t        | t
              r*| j                         D ci c]  \  }}| |       c}}S t        | t              r| D cg c]
  } |       c}S | S c c}}w c c}w N)
isinstancenpgenericarrayitemdictitemslist)r   knvparam_value_converters      R/home/cdr/jupyterlab/.venv/lib/python3.12/site-packages/xgboost/spark/estimator.pyr(   z?_set_pyspark_xgb_cls_param_attrs.<locals>.param_value_converter   s    a$88A;##%%a>?ggiHUQA,R00HHa89:")"-:: I:s   "B!B'	attr_nameparamNc                 H    |_         t        | |       t        | |       y r   )typeConvertersetattr)r*   r+   r   r   r(   s     r)   set_param_attrsz9_set_pyspark_xgb_cls_param_attrs.<locals>.set_param_attrs)   s#    3	9e,y%(    zRefer to XGBoost doc of z for this param )namedocz.fit() for this param 	callbackszThe callbacks can be arbitrary functions. It is saved using cloudpickle which is not a fully self-contained format. It may fail to load with different versions of dependencies.z.predict() for this param )_get_xgb_params_defaultr   strr	   keysr   _xgb_clsr
   _dummy_get_fit_params_default_get_predict_params_default)
r   r   params_dictr/   r1   r2   	param_objfit_params_dictpredict_params_dictr(   s
   ``       @r)    _set_pyspark_xgb_cls_param_attrsr?      s   
 335K  )3 )u ) )
   " )&i002344DTFL 	
 !tE	i()  779O$$& )&~i6H6H6J'K&L$TF, 	 ;6C
 &--/#>	i() $??A#((* )&~i6H6H6J'K&L(0 	 &--/#>	i()r0   c                  8    t        j                  dt               y )Nz9`use_gpu` is deprecated since 2.0.0, use `device` instead)warningswarnFutureWarning r0   r)   _deprecated_use_gpurE   P   s    MMC]r0   c            $           e Zd ZdZedddddddddddddddd	d
eeee   f   dededee   dee   dee   dee   de	dee
   dee   de
de
de
de
dee   deddf" fd       Zedee   fd       Zeded   fd       Zd  fdZ xZS )!SparkXGBRegressora  SparkXGBRegressor is a PySpark ML estimator. It implements the XGBoost regression
    algorithm based on XGBoost python library, and it can be used in PySpark Pipeline
    and PySpark ML meta algorithms like
    - :py:class:`~pyspark.ml.tuning.CrossValidator`/
    - :py:class:`~pyspark.ml.tuning.TrainValidationSplit`/
    - :py:class:`~pyspark.ml.classification.OneVsRest`

    SparkXGBRegressor automatically supports most of the parameters in
    :py:class:`xgboost.XGBRegressor` constructor and most of the parameters used in
    :py:meth:`xgboost.XGBRegressor.fit` and :py:meth:`xgboost.XGBRegressor.predict`
    method.

    To enable GPU support, set `device` to `cuda` or `gpu`.

    SparkXGBRegressor doesn't support setting `base_margin` explicitly as well, but
    support another param called `base_margin_col`. see doc below for more details.

    SparkXGBRegressor doesn't support `validate_features` and `output_margin` param.

    SparkXGBRegressor doesn't support setting `nthread` xgboost param, instead, the
    `nthread` param for each xgboost worker will be set equal to `spark.task.cpus`
    config value.


    Parameters
    ----------

    features_col:
        When the value is string, it requires the features column name to be vector type.
        When the value is a list of string, it requires all the feature columns to be numeric types.
    label_col:
        Label column name. Default to "label".
    prediction_col:
        Prediction column name. Default to "prediction"
    pred_contrib_col:
        Contribution prediction column name.
    validation_indicator_col:
        For params related to `xgboost.XGBRegressor` training with
        evaluation dataset's supervision,
        set :py:attr:`xgboost.spark.SparkXGBRegressor.validation_indicator_col`
        parameter instead of setting the `eval_set` parameter in `xgboost.XGBRegressor`
        fit method.
    weight_col:
        To specify the weight of the training and validation dataset, set
        :py:attr:`xgboost.spark.SparkXGBRegressor.weight_col` parameter instead of setting
        `sample_weight` and `sample_weight_eval_set` parameter in `xgboost.XGBRegressor`
        fit method.
    base_margin_col:
        To specify the base margins of the training and validation
        dataset, set :py:attr:`xgboost.spark.SparkXGBRegressor.base_margin_col` parameter
        instead of setting `base_margin` and `base_margin_eval_set` in the
        `xgboost.XGBRegressor` fit method.

    num_workers:
        How many XGBoost workers to be used to train.
        Each XGBoost worker corresponds to one spark task.
    use_gpu:
        .. deprecated:: 2.0.0

        Use `device` instead.

    device:

        .. versionadded:: 2.0.0

        Device for XGBoost workers, available options are `cpu`, `cuda`, and `gpu`.

    force_repartition:
        Boolean value to specify if forcing the input dataset to be repartitioned
        before XGBoost training.
    repartition_random_shuffle:
        Boolean value to specify if randomly shuffling the dataset when repartitioning is required.
    enable_sparse_data_optim:
        Boolean value to specify if enabling sparse data optimization, if True,
        Xgboost DMatrix object will be constructed from sparse matrix instead of
        dense matrix.
    launch_tracker_on_driver:
        Boolean value to indicate whether the tracker should be launched on the driver side or
        the executor side.
    coll_cfg:
        The collective configuration. See :py:class:`~xgboost.collective.Config`

    kwargs:
        A dictionary of xgboost parameters, please refer to
        https://xgboost.readthedocs.io/en/stable/parameter.html

    Note
    ----

    The Parameters chart above contains parameters that need special handling.
    For a full list of parameters, see entries with `Param(parent=...` below.

    This API is experimental.


    Examples
    --------

    >>> from xgboost.spark import SparkXGBRegressor
    >>> from pyspark.ml.linalg import Vectors
    >>> df_train = spark.createDataFrame([
    ...     (Vectors.dense(1.0, 2.0, 3.0), 0, False, 1.0),
    ...     (Vectors.sparse(3, {1: 1.0, 2: 5.5}), 1, False, 2.0),
    ...     (Vectors.dense(4.0, 5.0, 6.0), 2, True, 1.0),
    ...     (Vectors.sparse(3, {1: 6.0, 2: 7.5}), 3, True, 2.0),
    ... ], ["features", "label", "isVal", "weight"])
    >>> df_test = spark.createDataFrame([
    ...     (Vectors.dense(1.0, 2.0, 3.0), ),
    ...     (Vectors.sparse(3, {1: 1.0, 2: 5.5}), )
    ... ], ["features"])
    >>> xgb_regressor = SparkXGBRegressor(max_depth=5, missing=0.0,
    ... validation_indicator_col='isVal', weight_col='weight',
    ... early_stopping_rounds=1, eval_metric='rmse')
    >>> xgb_reg_model = xgb_regressor.fit(df_train)
    >>> xgb_reg_model.transform(df_test)

    featureslabel
predictionNr   FT)features_col	label_colprediction_colpred_contrib_colvalidation_indicator_col
weight_colbase_margin_colnum_workersuse_gpudeviceforce_repartitionrepartition_random_shuffleenable_sparse_data_optimlaunch_tracker_on_drivercoll_cfgrK   rL   rM   rN   rO   rP   rQ   rR   rS   rT   rU   rV   rW   rX   rY   kwargsr   c                v    t         |           | j                  }|	r
t                 | j                  di | y NrD   super__init___input_kwargsrE   	setParams)selfrK   rL   rM   rN   rO   rP   rQ   rR   rS   rT   rU   rV   rW   rX   rY   rZ   input_kwargs	__class__s                     r)   r_   zSparkXGBRegressor.__init__   s5    * 	))!&&r0   c                     t         S r   r   clss    r)   r7   zSparkXGBRegressor._xgb_cls       r0   SparkXGBRegressorModelc                     t         S r   )rj   rg   s    r)   _pyspark_model_clsz$SparkXGBRegressor._pyspark_model_cls   s    %%r0   c                 n    t         |           | j                  | j                        rt	        d      y )NzCSpark Xgboost regressor estimator does not support `qid_col` param.r^   _validate_params	isDefinedqid_col
ValueErrorrb   rd   s    r)   ro   z"SparkXGBRegressor._validate_params   s3     ">>$,,'U  (r0   r   N)__name__
__module____qualname____doc__r   r   r5   r   r   intboolr   r   r_   classmethodr   r   r7   rl   ro   __classcell__rd   s   @r)   rG   rG   V   sl   tl  /9 **.26$()-"& $"'+0).)-%)#' CcN+' 	'
 ' #3-' #+3-' SM' "#' ' $' '  ' %)' #''  #'!'" 6"#'$ %'& 
'' '4 l+   &4(@#A & & r0   rG   c                   ,    e Zd ZdZedee   fd       Zy)rj   zt
    The model returned by :func:`xgboost.spark.SparkXGBRegressor.fit`

    .. Note:: This API is experimental.
    r   c                     t         S r   rf   rg   s    r)   r7   zSparkXGBRegressorModel._xgb_cls   ri   r0   N)ru   rv   rw   rx   r{   r   r   r7   rD   r0   r)   rj   rj      s'     l+  r0   rj   c            (           e Zd ZdZeddddddddddddd	d	d	d
dddeeee   f   dededededee   dee   dee   dee   de	dee
   dee   de
de
de
de
dee   deddf& fd       Zedee   fd        Zeded!   fd"       Zd$ fd#Z xZS )%SparkXGBClassifiera  SparkXGBClassifier is a PySpark ML estimator. It implements the XGBoost
    classification algorithm based on XGBoost python library, and it can be used in
    PySpark Pipeline and PySpark ML meta algorithms like
    - :py:class:`~pyspark.ml.tuning.CrossValidator`/
    - :py:class:`~pyspark.ml.tuning.TrainValidationSplit`/
    - :py:class:`~pyspark.ml.classification.OneVsRest`

    SparkXGBClassifier automatically supports most of the parameters in
    :py:class:`xgboost.XGBClassifier` constructor and most of the parameters used in
    :py:meth:`xgboost.XGBClassifier.fit` and :py:meth:`xgboost.XGBClassifier.predict`
    method.

    To enable GPU support, set `device` to `cuda` or `gpu`.

    SparkXGBClassifier doesn't support setting `base_margin` explicitly as well, but
    support another param called `base_margin_col`. see doc below for more details.

    SparkXGBClassifier doesn't support setting `output_margin`, but we can get output
    margin from the raw prediction column. See `raw_prediction_col` param doc below for
    more details.

    SparkXGBClassifier doesn't support `validate_features` and `output_margin` param.

    SparkXGBClassifier doesn't support setting `nthread` xgboost param, instead, the
    `nthread` param for each xgboost worker will be set equal to `spark.task.cpus`
    config value.


    Parameters
    ----------

    features_col:
        When the value is string, it requires the features column name to be vector type.
        When the value is a list of string, it requires all the feature columns to be numeric types.
    label_col:
        Label column name. Default to "label".
    prediction_col:
        Prediction column name. Default to "prediction"
    probability_col:
        Column name for predicted class conditional probabilities. Default to probabilityCol
    raw_prediction_col:
        The `output_margin=True` is implicitly supported by the
        `rawPredictionCol` output column, which is always returned with the predicted margin
        values.
    pred_contrib_col:
        Contribution prediction column name.
    validation_indicator_col:
        For params related to `xgboost.XGBClassifier` training with
        evaluation dataset's supervision,
        set :py:attr:`xgboost.spark.SparkXGBClassifier.validation_indicator_col`
        parameter instead of setting the `eval_set` parameter in `xgboost.XGBClassifier`
        fit method.
    weight_col:
        To specify the weight of the training and validation dataset, set
        :py:attr:`xgboost.spark.SparkXGBClassifier.weight_col` parameter instead of setting
        `sample_weight` and `sample_weight_eval_set` parameter in `xgboost.XGBClassifier`
        fit method.
    base_margin_col:
        To specify the base margins of the training and validation
        dataset, set :py:attr:`xgboost.spark.SparkXGBClassifier.base_margin_col` parameter
        instead of setting `base_margin` and `base_margin_eval_set` in the
        `xgboost.XGBClassifier` fit method.

    num_workers:
        How many XGBoost workers to be used to train.
        Each XGBoost worker corresponds to one spark task.
    use_gpu:
        .. deprecated:: 2.0.0

        Use `device` instead.

    device:

        .. versionadded:: 2.0.0

        Device for XGBoost workers, available options are `cpu`, `cuda`, and `gpu`.

    force_repartition:
        Boolean value to specify if forcing the input dataset to be repartitioned
        before XGBoost training.
    repartition_random_shuffle:
        Boolean value to specify if randomly shuffling the dataset when repartitioning is required.
    enable_sparse_data_optim:
        Boolean value to specify if enabling sparse data optimization, if True,
        Xgboost DMatrix object will be constructed from sparse matrix instead of
        dense matrix.
    launch_tracker_on_driver:
        Boolean value to indicate whether the tracker should be launched on the driver side or
        the executor side.
    coll_cfg:
        The collective configuration. See :py:class:`~xgboost.collective.Config`

    kwargs:
        A dictionary of xgboost parameters, please refer to
        https://xgboost.readthedocs.io/en/stable/parameter.html

    Note
    ----

    The Parameters chart above contains parameters that need special handling.
    For a full list of parameters, see entries with `Param(parent=...` below.

    This API is experimental.

    Examples
    --------

    >>> from xgboost.spark import SparkXGBClassifier
    >>> from pyspark.ml.linalg import Vectors
    >>> df_train = spark.createDataFrame([
    ...     (Vectors.dense(1.0, 2.0, 3.0), 0, False, 1.0),
    ...     (Vectors.sparse(3, {1: 1.0, 2: 5.5}), 1, False, 2.0),
    ...     (Vectors.dense(4.0, 5.0, 6.0), 0, True, 1.0),
    ...     (Vectors.sparse(3, {1: 6.0, 2: 7.5}), 1, True, 2.0),
    ... ], ["features", "label", "isVal", "weight"])
    >>> df_test = spark.createDataFrame([
    ...     (Vectors.dense(1.0, 2.0, 3.0), ),
    ... ], ["features"])
    >>> xgb_classifier = SparkXGBClassifier(max_depth=5, missing=0.0,
    ...     validation_indicator_col='isVal', weight_col='weight',
    ...     early_stopping_rounds=1, eval_metric='logloss')
    >>> xgb_clf_model = xgb_classifier.fit(df_train)
    >>> xgb_clf_model.transform(df_test).show()

    rH   rI   rJ   probabilityrawPredictionNr   FT)rK   rL   rM   probability_colraw_prediction_colrN   rO   rP   rQ   rR   rS   rT   rU   rV   rW   rX   rY   rK   rL   rM   r   r   rN   rO   rP   rQ   rR   rS   rT   rU   rV   rW   rX   rY   rZ   r   c                    t         |           | j                  }|r
t                 | j                  di | | j                  d        y )N)	objectiverD   )r^   r_   r`   rE   ra   _setDefault)rb   rK   rL   rM   r   r   rN   rO   rP   rQ   rR   rS   rT   rU   rV   rW   rX   rY   rZ   rc   rd   s                       r)   r_   zSparkXGBClassifier.__init__  sH    . 	
 ))!&&4(r0   c                     t         S r   r   rg   s    r)   r7   zSparkXGBClassifier._xgb_cls      r0   SparkXGBClassifierModelc                     t         S r   )r   rg   s    r)   rl   z%SparkXGBClassifier._pyspark_model_cls  s    &&r0   c                     t         |           | j                  | j                        rt	        d      | j                  d      rt	        d      y )NzDSpark Xgboost classifier estimator does not support `qid_col` param.r   zHSetting custom 'objective' param is not allowed in 'SparkXGBClassifier'.)r^   ro   rp   rq   rr   getOrDefaultrs   s    r)   ro   z#SparkXGBClassifier._validate_params  sS     ">>$,,'V  [)Z  *r0   rt   )ru   rv   rw   rx   r   r   r5   r   r   ry   rz   r   r   r_   r{   r   r   r7   rl   ro   r|   r}   s   @r)   r   r     s   ||  /9 *,"1*.26$()-"& $"'+0).)-%)') CcN+) 	)
 ) )  ) #3-) #+3-) SM) "#) ) $) )  )  %)!)" #'#)$ #'%)& 6"')( ))* 
+) )B m,   '4(A#B ' '	 	r0   r   c                   ,    e Zd ZdZedee   fd       Zy)r   zu
    The model returned by :func:`xgboost.spark.SparkXGBClassifier.fit`

    .. Note:: This API is experimental.
    r   c                     t         S r   r   rg   s    r)   r7   z SparkXGBClassifierModel._xgb_cls  r   r0   N)ru   rv   rw   rx   r{   r   r   r7   rD   r0   r)   r   r     s'     m,  r0   r   c            &           e Zd ZdZeddddddddddddddddd	d
eeee   f   dededee   dee   dee   dee   dee   de	dee
   dee   de
de
de
de
dee   deddf$ fd       Zedee   fd       Zeded   fd       Zd! fd Z xZS )"SparkXGBRankera  SparkXGBRanker is a PySpark ML estimator. It implements the XGBoost
    ranking algorithm based on XGBoost python library, and it can be used in
    PySpark Pipeline and PySpark ML meta algorithms like
    :py:class:`~pyspark.ml.tuning.CrossValidator`/
    :py:class:`~pyspark.ml.tuning.TrainValidationSplit`/
    :py:class:`~pyspark.ml.classification.OneVsRest`

    SparkXGBRanker automatically supports most of the parameters in
    :py:class:`xgboost.XGBRanker` constructor and most of the parameters used in
    :py:meth:`xgboost.XGBRanker.fit` and :py:meth:`xgboost.XGBRanker.predict` method.

    To enable GPU support, set `device` to `cuda` or `gpu`.

    SparkXGBRanker doesn't support setting `base_margin` explicitly as well, but support
    another param called `base_margin_col`. see doc below for more details.

    SparkXGBRanker doesn't support setting `output_margin`, but we can get output margin
    from the raw prediction column. See `raw_prediction_col` param doc below for more
    details.

    SparkXGBRanker doesn't support `validate_features` and `output_margin` param.

    SparkXGBRanker doesn't support setting `nthread` xgboost param, instead, the
    `nthread` param for each xgboost worker will be set equal to `spark.task.cpus`
    config value.


    Parameters
    ----------

    features_col:
        When the value is string, it requires the features column name to be vector type.
        When the value is a list of string, it requires all the feature columns to be numeric types.
    label_col:
        Label column name. Default to "label".
    prediction_col:
        Prediction column name. Default to "prediction"
    pred_contrib_col:
        Contribution prediction column name.
    validation_indicator_col:
        For params related to `xgboost.XGBRanker` training with
        evaluation dataset's supervision,
        set :py:attr:`xgboost.spark.SparkXGBRanker.validation_indicator_col`
        parameter instead of setting the `eval_set` parameter in :py:class:`xgboost.XGBRanker`
        fit method.
    weight_col:
        To specify the weight of the training and validation dataset, set
        :py:attr:`xgboost.spark.SparkXGBRanker.weight_col` parameter instead of setting
        `sample_weight` and `sample_weight_eval_set` parameter in :py:class:`xgboost.XGBRanker`
        fit method.
    base_margin_col:
        To specify the base margins of the training and validation
        dataset, set :py:attr:`xgboost.spark.SparkXGBRanker.base_margin_col` parameter
        instead of setting `base_margin` and `base_margin_eval_set` in the
        :py:class:`xgboost.XGBRanker` fit method.
    qid_col:
        Query id column name.
    num_workers:
        How many XGBoost workers to be used to train.
        Each XGBoost worker corresponds to one spark task.
    use_gpu:
        .. deprecated:: 2.0.0

        Use `device` instead.

    device:

        .. versionadded:: 2.0.0

        Device for XGBoost workers, available options are `cpu`, `cuda`, and `gpu`.

    force_repartition:
        Boolean value to specify if forcing the input dataset to be repartitioned
        before XGBoost training.
    repartition_random_shuffle:
        Boolean value to specify if randomly shuffling the dataset when repartitioning is required.
    enable_sparse_data_optim:
        Boolean value to specify if enabling sparse data optimization, if True,
        Xgboost DMatrix object will be constructed from sparse matrix instead of
        dense matrix.
    launch_tracker_on_driver:
        Boolean value to indicate whether the tracker should be launched on the driver side or
        the executor side.
    coll_cfg:
        The collective configuration. See :py:class:`~xgboost.collective.Config`

    kwargs:
        A dictionary of xgboost parameters, please refer to
        https://xgboost.readthedocs.io/en/stable/parameter.html

    .. Note:: The Parameters chart above contains parameters that need special handling.
        For a full list of parameters, see entries with `Param(parent=...` below.

    .. Note:: This API is experimental.

    Examples
    --------

    >>> from xgboost.spark import SparkXGBRanker
    >>> from pyspark.ml.linalg import Vectors
    >>> ranker = SparkXGBRanker(qid_col="qid")
    >>> df_train = spark.createDataFrame(
    ...     [
    ...         (Vectors.dense(1.0, 2.0, 3.0), 0, 0),
    ...         (Vectors.dense(4.0, 5.0, 6.0), 1, 0),
    ...         (Vectors.dense(9.0, 4.0, 8.0), 2, 0),
    ...         (Vectors.sparse(3, {1: 1.0, 2: 5.5}), 0, 1),
    ...         (Vectors.sparse(3, {1: 6.0, 2: 7.5}), 1, 1),
    ...         (Vectors.sparse(3, {1: 8.0, 2: 9.5}), 2, 1),
    ...     ],
    ...     ["features", "label", "qid"],
    ... )
    >>> df_test = spark.createDataFrame(
    ...     [
    ...         (Vectors.dense(1.5, 2.0, 3.0), 0),
    ...         (Vectors.dense(4.5, 5.0, 6.0), 0),
    ...         (Vectors.dense(9.0, 4.5, 8.0), 0),
    ...         (Vectors.sparse(3, {1: 1.0, 2: 6.0}), 1),
    ...         (Vectors.sparse(3, {1: 6.0, 2: 7.0}), 1),
    ...         (Vectors.sparse(3, {1: 8.0, 2: 10.5}), 1),
    ...     ],
    ...     ["features", "qid"],
    ... )
    >>> model = ranker.fit(df_train)
    >>> model.transform(df_test).show()
    rH   rI   rJ   Nr   FT)rK   rL   rM   rN   rO   rP   rQ   rq   rR   rS   rT   rU   rV   rW   rX   rY   rK   rL   rM   rN   rO   rP   rQ   rq   rR   rS   rT   rU   rV   rW   rX   rY   rZ   r   c                v    t         |           | j                  }|
r
t                 | j                  di | y r\   r]   )rb   rK   rL   rM   rN   rO   rP   rQ   rq   rR   rS   rT   rU   rV   rW   rX   rY   rZ   rc   rd   s                      r)   r_   zSparkXGBRanker.__init__K  s5    , 	))!&&r0   c                     t         S r   r   rg   s    r)   r7   zSparkXGBRanker._xgb_clsg      r0   SparkXGBRankerModelc                     t         S r   )r   rg   s    r)   rl   z!SparkXGBRanker._pyspark_model_clsk  s    ""r0   c                 n    t         |           | j                  | j                        st	        d      y )Nz@Spark Xgboost ranker estimator requires setting `qid_col` param.rn   rs   s    r)   ro   zSparkXGBRanker._validate_paramso  s3     "~~dll+R  ,r0   rt   )ru   rv   rw   rx   r   r   r5   r   r   ry   rz   r   r   r_   r{   r   r   r7   rl   ro   r|   r}   s   @r)   r   r     s|   }~  /9 **.26$()-!%"& $"'+0).)-%)%' CcN+' 	'
 ' #3-' #+3-' SM' "#' #' ' $' '  ' %)'  #'!'" #'#'$ 6"%'& ''( 
)' '6 i   #4(=#> # # r0   r   c                   ,    e Zd ZdZedee   fd       Zy)r   zq
    The model returned by :func:`xgboost.spark.SparkXGBRanker.fit`

    .. Note:: This API is experimental.
    r   c                     t         S r   r   rg   s    r)   r7   zSparkXGBRankerModel._xgb_cls~  r   r0   N)ru   rv   rw   rx   r{   r   r   r7   rD   r0   r)   r   r   w  s&     i  r0   r   rt   )&rx   rA   typingr   r   r   r   r   numpyr   pysparkr   pyspark.ml.paramr	   r
   pyspark.ml.param.sharedr   r   
collectiver   sklearnr   r   r   corer   r   r   utilsr   r?   rE   rG   rj   r   r   r   r   rD   r0   r)   <module>r      s    >
  3 3    * J  < < 
 "5)&'5)04^0D5)	5)p_* _D	^ 	 !!24J Kr+->@S rj	2 	 !!35L Mi' iX	. 	 !1D Er0   