Ë
    {‰Kg­h  ã                   ó<   — d Z ddlZddlmZ ddlmZ  G d„ d«      Zy)zA
Loss functions for linear models with raw_prediction = X @ coef
é    N)Úsparseé   )Úsquared_normc                   ó~   — e Zd ZdZd„ Zdd„Zd„ Zd„ Zd„ Z	 	 	 	 dd„Z		 	 	 	 dd	„Z
	 	 	 	 dd
„Z	 	 	 	 	 	 dd„Z	 dd„Zy)ÚLinearModelLossaÓ  General class for loss functions with raw_prediction = X @ coef + intercept.

    Note that raw_prediction is also known as linear predictor.

    The loss is the average of per sample losses and includes a term for L2
    regularization::

        loss = 1 / s_sum * sum_i s_i loss(y_i, X_i @ coef + intercept)
               + 1/2 * l2_reg_strength * ||coef||_2^2

    with sample weights s_i=1 if sample_weight=None and s_sum=sum_i s_i.

    Gradient and hessian, for simplicity without intercept, are::

        gradient = 1 / s_sum * X.T @ loss.gradient + l2_reg_strength * coef
        hessian = 1 / s_sum * X.T @ diag(loss.hessian) @ X
                  + l2_reg_strength * identity

    Conventions:
        if fit_intercept:
            n_dof =  n_features + 1
        else:
            n_dof = n_features

        if base_loss.is_multiclass:
            coef.shape = (n_classes, n_dof) or ravelled (n_classes * n_dof,)
        else:
            coef.shape = (n_dof,)

        The intercept term is at the end of the coef array:
        if base_loss.is_multiclass:
            if coef.shape (n_classes, n_dof):
                intercept = coef[:, -1]
            if coef.shape (n_classes * n_dof,)
                intercept = coef[n_features::n_dof] = coef[(n_dof-1)::n_dof]
            intercept.shape = (n_classes,)
        else:
            intercept = coef[-1]

    Note: If coef has shape (n_classes * n_dof,), the 2d-array can be reconstructed as

        coef.reshape((n_classes, -1), order="F")

    The option order="F" makes coef[:, i] contiguous. This, in turn, makes the
    coefficients without intercept, coef[:, :-1], contiguous and speeds up
    matrix-vector computations.

    Note: If the average loss per sample is wanted instead of the sum of the loss per
    sample, one can simply use a rescaled sample_weight such that
    sum(sample_weight) = 1.

    Parameters
    ----------
    base_loss : instance of class BaseLoss from sklearn._loss.
    fit_intercept : bool
    c                 ó    — || _         || _        y ©N)Ú	base_lossÚfit_intercept)Úselfr
   r   s      úe/home/alanp/www/video.onchill/myenv/lib/python3.12/site-packages/sklearn/linear_model/_linear_loss.pyÚ__init__zLinearModelLoss.__init__E   s   € Ø"ˆŒØ*ˆÕó    Nc                 ó  — |j                   d   }| j                  j                  }| j                  r|dz   }n|}| j                  j                  rt        j                  |||f|d¬«      }|S t        j                  |||¬«      }|S )aâ  Allocate coef of correct shape with zeros.

        Parameters:
        -----------
        X : {array-like, sparse matrix} of shape (n_samples, n_features)
            Training data.
        dtype : data-type, default=None
            Overrides the data type of coef. With dtype=None, coef will have the same
            dtype as X.

        Returns
        -------
        coef : ndarray of shape (n_dof,) or (n_classes, n_dof)
            Coefficients of a linear model.
        é   ÚF)ÚshapeÚdtypeÚorder©r   r   )r   r
   Ú	n_classesr   Úis_multiclassÚnpÚ
zeros_like)r   ÚXr   Ú
n_featuresr   Ún_dofÚcoefs          r   Úinit_zero_coefzLinearModelLoss.init_zero_coefI   s~   € ð  —W‘W˜Q‘Zˆ
Ø—N‘N×,Ñ,ˆ	Ø×ÒØ ‘N‰EàˆEØ>‰>×'Ò'Ü—=‘= ¨9°eÐ*<ÀEÐQTÔUˆDð ˆô —=‘= ¨%°uÔ=ˆDØˆr   c                 ó<  — | j                   j                  s"| j                  r|d   }|dd }||fS d}|}||fS |j                  dk(  r*|j	                  | j                   j
                  dfd¬«      }n|}| j                  r|dd…df   }|dd…dd…f   }||fS d}||fS )a˜  Helper function to get coefficients and intercept.

        Parameters
        ----------
        coef : ndarray of shape (n_dof,), (n_classes, n_dof) or (n_classes * n_dof,)
            Coefficients of a linear model.
            If shape (n_classes * n_dof,), the classes of one feature are contiguous,
            i.e. one reconstructs the 2d-array via
            coef.reshape((n_classes, -1), order="F").

        Returns
        -------
        weights : ndarray of shape (n_features,) or (n_classes, n_features)
            Coefficients without intercept term.
        intercept : float or ndarray of shape (n_classes,)
            Intercept terms.
        éÿÿÿÿNç        r   r   ©r   )r
   r   r   ÚndimÚreshaper   )r   r   Ú	interceptÚweightss       r   Úweight_interceptz LinearModelLoss.weight_intercepte   sÍ   € ð$ ~‰~×+Ò+Ø×!Ò!Ø  ™H	Ø˜s ˜)ð  ˜	Ð!Ð!ð  	Øð ˜	Ð!Ð!ð y‰y˜AŠ~ØŸ,™,¨¯©×(@Ñ(@À"Ð'EÈS˜,ÓQ‘àØ×!Ò!Ø#¢A r E™N	Ø!¢! S b S &™/ð ˜	Ð!Ð!ð  	à˜	Ð!Ð!r   c                 ó–   — | j                  |«      \  }}| j                  j                  s	||z  |z   }n||j                  z  |z   }|||fS )ai  Helper function to get coefficients, intercept and raw_prediction.

        Parameters
        ----------
        coef : ndarray of shape (n_dof,), (n_classes, n_dof) or (n_classes * n_dof,)
            Coefficients of a linear model.
            If shape (n_classes * n_dof,), the classes of one feature are contiguous,
            i.e. one reconstructs the 2d-array via
            coef.reshape((n_classes, -1), order="F").
        X : {array-like, sparse matrix} of shape (n_samples, n_features)
            Training data.

        Returns
        -------
        weights : ndarray of shape (n_features,) or (n_classes, n_features)
            Coefficients without intercept term.
        intercept : float or ndarray of shape (n_classes,)
            Intercept terms.
        raw_prediction : ndarray of shape (n_samples,) or             (n_samples, n_classes)
        )r(   r
   r   ÚT)r   r   r   r'   r&   Úraw_predictions         r   Úweight_intercept_rawz$LinearModelLoss.weight_intercept_rawŒ   sU   € ð, "×2Ñ2°4Ó8Ñˆà~‰~×+Ò+Ø ™[¨9Ñ4‰Nð  §¡™]¨YÑ6ˆNà˜	 >Ð1Ð1r   c                 óP   — |j                   dk(  r||z  n
t        |«      }d|z  |z  S )z5Compute L2 penalty term l2_reg_strength/2 *||w||_2^2.r   g      à?)r$   r   )r   r'   Úl2_reg_strengthÚnorm2_ws       r   Ú
l2_penaltyzLinearModelLoss.l2_penalty¬   s.   € à'.§|¡|°qÒ'8'˜GÒ#¼lÈ7Ó>SˆØ_Ñ$ wÑ.Ð.r   c                 óò   — |€| j                  ||«      \  }}	}n| j                  |«      \  }}	| j                  j                  ||d|¬«      }
t	        j
                  |
|¬«      }
|
| j                  ||«      z   S )a  Compute the loss as weighted average over point-wise losses.

        Parameters
        ----------
        coef : ndarray of shape (n_dof,), (n_classes, n_dof) or (n_classes * n_dof,)
            Coefficients of a linear model.
            If shape (n_classes * n_dof,), the classes of one feature are contiguous,
            i.e. one reconstructs the 2d-array via
            coef.reshape((n_classes, -1), order="F").
        X : {array-like, sparse matrix} of shape (n_samples, n_features)
            Training data.
        y : contiguous array of shape (n_samples,)
            Observed, true target values.
        sample_weight : None or contiguous array of shape (n_samples,), default=None
            Sample weights.
        l2_reg_strength : float, default=0.0
            L2 regularization strength
        n_threads : int, default=1
            Number of OpenMP threads to use.
        raw_prediction : C-contiguous array of shape (n_samples,) or array of             shape (n_samples, n_classes)
            Raw prediction values (in link space). If provided, these are used. If
            None, then raw_prediction = X @ coef + intercept is calculated.

        Returns
        -------
        loss : float
            Weighted average of losses per sample, plus penalty.
        N©Úy_truer+   Úsample_weightÚ	n_threads)r'   )r,   r(   r
   Úlossr   Úaverager0   )r   r   r   Úyr4   r.   r5   r+   r'   r&   r6   s              r   r6   zLinearModelLoss.loss±   s‡   € ðN Ð!Ø15×1JÑ1JÈ4ÐQRÓ1SÑ.ˆGY¡à!%×!6Ñ!6°tÓ!<ÑˆGYà~‰~×"Ñ"ØØ)ØØð	 #ó 
ˆô z‰z˜$¨Ô6ˆàd—o‘o g¨Ó?Ñ?Ð?r   c                 ó¤  — |j                   | j                  j                  c\  }}	}
|	t        | j                  «      z   }|€| j                  ||«      \  }}}n| j                  |«      \  }}| j                  j                  ||||¬«      \  }}|€|nt        j                  |«      }|j                  «       |z  }|| j                  ||«      z  }||z  }| j                  j                  s\t        j                  ||j                  ¬«      }|j                  |z  ||z  z   |d|	 | j                  r|j                  «       |d<   ||fS t        j                  |
|f|j                  d¬«      }|j                  |z  ||z  z   |dd…d|	…f<   | j                  r|j                  d¬«      |dd…df<   |j                   d	k(  r|j#                  d¬
«      }||fS )a\  Computes the sum of loss and gradient w.r.t. coef.

        Parameters
        ----------
        coef : ndarray of shape (n_dof,), (n_classes, n_dof) or (n_classes * n_dof,)
            Coefficients of a linear model.
            If shape (n_classes * n_dof,), the classes of one feature are contiguous,
            i.e. one reconstructs the 2d-array via
            coef.reshape((n_classes, -1), order="F").
        X : {array-like, sparse matrix} of shape (n_samples, n_features)
            Training data.
        y : contiguous array of shape (n_samples,)
            Observed, true target values.
        sample_weight : None or contiguous array of shape (n_samples,), default=None
            Sample weights.
        l2_reg_strength : float, default=0.0
            L2 regularization strength
        n_threads : int, default=1
            Number of OpenMP threads to use.
        raw_prediction : C-contiguous array of shape (n_samples,) or array of             shape (n_samples, n_classes)
            Raw prediction values (in link space). If provided, these are used. If
            None, then raw_prediction = X @ coef + intercept is calculated.

        Returns
        -------
        loss : float
            Weighted average of losses per sample, plus penalty.

        gradient : ndarray of shape coef.shape
             The gradient of the loss.
        Nr2   ©r   r!   r   ©r   r   r   ©Úaxisr   r#   )r   r
   r   Úintr   r,   r(   Úloss_gradientr   Úsumr0   r   Ú
empty_liker   r*   Úemptyr$   Úravel)r   r   r   r8   r4   r.   r5   r+   Ú	n_samplesr   r   r   r'   r&   r6   Úgrad_pointwiseÚsw_sumÚgrads                     r   r?   zLinearModelLoss.loss_gradientç   sÒ  € ðT ./¯W©W°d·n±n×6NÑ6NÐ*ÑˆJ ØœS ×!3Ñ!3Ó4Ñ4ˆàÐ!Ø15×1JÑ1JÈ4ÐQRÓ1SÑ.ˆGY¡à!%×!6Ñ!6°tÓ!<ÑˆGYà#Ÿ~™~×;Ñ;ØØ)Ø'Øð	  <ó  
Ñˆˆnð ,Ð3‘¼¿¹ÀÓ9NˆØx‰x‹z˜FÑ"ˆØ—‘ ¨Ó9Ñ9ˆà˜&Ñ ˆà~‰~×+Ò+Ü—=‘= ¨W¯]©]Ô;ˆDØ !§¡ nÑ 4°ÈÑ7PÑ PˆD*ÐØ×!Ò!Ø)×-Ñ-Ó/R‘ð TˆzÐô —8‘8˜Y¨Ð.°g·m±mÈ3ÔOˆDà#1×#3Ñ#3°aÑ#7¸/ÈGÑ:SÑ#SˆD’KZKÑ Ø×!Ò!Ø,×0Ñ0°aÐ0Ó8’Q˜U‘Øy‰y˜AŠ~Ø—z‘z¨zÓ,àTˆzÐr   c                 óF  — |j                   | j                  j                  c\  }}	}
|	t        | j                  «      z   }|€| j                  ||«      \  }}}n| j                  |«      \  }}| j                  j                  ||||¬«      }|€|nt        j                  |«      }||z  }| j                  j                  sZt        j                  ||j                  ¬«      }|j                  |z  ||z  z   |d|	 | j                  r|j                  «       |d<   |S t        j                  |
|f|j                  d¬«      }|j                  |z  ||z  z   |dd…d|	…f<   | j                  r|j                  d¬«      |dd…df<   |j                  d	k(  r|j!                  d¬
«      S |S )aõ  Computes the gradient w.r.t. coef.

        Parameters
        ----------
        coef : ndarray of shape (n_dof,), (n_classes, n_dof) or (n_classes * n_dof,)
            Coefficients of a linear model.
            If shape (n_classes * n_dof,), the classes of one feature are contiguous,
            i.e. one reconstructs the 2d-array via
            coef.reshape((n_classes, -1), order="F").
        X : {array-like, sparse matrix} of shape (n_samples, n_features)
            Training data.
        y : contiguous array of shape (n_samples,)
            Observed, true target values.
        sample_weight : None or contiguous array of shape (n_samples,), default=None
            Sample weights.
        l2_reg_strength : float, default=0.0
            L2 regularization strength
        n_threads : int, default=1
            Number of OpenMP threads to use.
        raw_prediction : C-contiguous array of shape (n_samples,) or array of             shape (n_samples, n_classes)
            Raw prediction values (in link space). If provided, these are used. If
            None, then raw_prediction = X @ coef + intercept is calculated.

        Returns
        -------
        gradient : ndarray of shape coef.shape
             The gradient of the loss.
        Nr2   r:   r!   r   r;   r   r<   r   r#   )r   r
   r   r>   r   r,   r(   Úgradientr   r@   r   rA   r   r*   rB   r$   rC   )r   r   r   r8   r4   r.   r5   r+   rD   r   r   r   r'   r&   rE   rF   rG   s                    r   rI   zLinearModelLoss.gradient5  s›  € ðN ./¯W©W°d·n±n×6NÑ6NÐ*ÑˆJ ØœS ×!3Ñ!3Ó4Ñ4ˆàÐ!Ø15×1JÑ1JÈ4ÐQRÓ1SÑ.ˆGY¡à!%×!6Ñ!6°tÓ!<ÑˆGYàŸ™×0Ñ0ØØ)Ø'Øð	 1ó 
ˆð ,Ð3‘¼¿¹ÀÓ9NˆØ˜&Ñ ˆà~‰~×+Ò+Ü—=‘= ¨W¯]©]Ô;ˆDØ !§¡ nÑ 4°ÈÑ7PÑ PˆD*ÐØ×!Ò!Ø)×-Ñ-Ó/R‘ØˆKä—8‘8˜Y¨Ð.°g·m±mÈ3ÔOˆDà#1×#3Ñ#3°aÑ#7¸/ÈGÑ:SÑ#SˆD’KZKÑ Ø×!Ò!Ø,×0Ñ0°aÐ0Ó8’Q˜U‘Øy‰y˜AŠ~Ø—z‘z¨zÓ,Ð,àr   c
                 óà  — |j                   \  }
}|t        | j                  «      z   }|	€| j                  ||«      \  }}}	n| j	                  |«      \  }}| j
                  j                  ||	||¬«      \  }}|€|
nt        j                  |«      }||z  }||z  }t        j                  |dk  «      dkD  }t        j                  |«      }| j
                  j                  s„|€"t        j                  ||j                  ¬«      }n|}|j                  |z  ||z  z   |d| | j                  r|j                  «       |d<   |€$t        j                  ||f|j                  ¬«      }n|}|r|||fS t!        j"                  |«      rC|j                  t!        j$                  |df|
|
f¬«      z  |z  j'                  «       |d|…d|…f<   n5|dd…df   |z  }t        j(                  |j                  |«      |d|…d|…f<   |dkD  r%|j+                  d«      d||z  |d	z   …xx   |z  cc<   | j                  r;|j                  |z  }||dd…df<   ||ddd…f<   |j                  «       |d
<   nt,        ‚|||fS )aå  Computes gradient and hessian w.r.t. coef.

        Parameters
        ----------
        coef : ndarray of shape (n_dof,), (n_classes, n_dof) or (n_classes * n_dof,)
            Coefficients of a linear model.
            If shape (n_classes * n_dof,), the classes of one feature are contiguous,
            i.e. one reconstructs the 2d-array via
            coef.reshape((n_classes, -1), order="F").
        X : {array-like, sparse matrix} of shape (n_samples, n_features)
            Training data.
        y : contiguous array of shape (n_samples,)
            Observed, true target values.
        sample_weight : None or contiguous array of shape (n_samples,), default=None
            Sample weights.
        l2_reg_strength : float, default=0.0
            L2 regularization strength
        n_threads : int, default=1
            Number of OpenMP threads to use.
        gradient_out : None or ndarray of shape coef.shape
            A location into which the gradient is stored. If None, a new array
            might be created.
        hessian_out : None or ndarray
            A location into which the hessian is stored. If None, a new array
            might be created.
        raw_prediction : C-contiguous array of shape (n_samples,) or array of             shape (n_samples, n_classes)
            Raw prediction values (in link space). If provided, these are used. If
            None, then raw_prediction = X @ coef + intercept is calculated.

        Returns
        -------
        gradient : ndarray of shape coef.shape
             The gradient of the loss.

        hessian : ndarray
            Hessian matrix.

        hessian_warning : bool
            True if pointwise hessian has more than half of its elements non-positive.
        Nr2   r   g      Ð?r:   r!   r   ©r   r   )r!   r!   )r   r>   r   r,   r(   r
   Úgradient_hessianr   r@   ÚmeanÚabsr   rA   r   r*   rB   r   ÚissparseÚ
dia_matrixÚtoarrayÚdotr%   ÚNotImplementedError)r   r   r   r8   r4   r.   r5   Úgradient_outÚhessian_outr+   rD   r   r   r'   r&   rE   Úhess_pointwiserF   Úhessian_warningrG   ÚhessÚWXÚXhs                          r   rL   z LinearModelLoss.gradient_hessian~  s°  € ðj !"§¡Ñˆ	:ØœS ×!3Ñ!3Ó4Ñ4ˆàÐ!Ø15×1JÑ1JÈ4ÐQRÓ1SÑ.ˆGY¡à!%×!6Ñ!6°tÓ!<ÑˆGYà)-¯©×)HÑ)HØØ)Ø'Øð	 *Ió *
Ñ&ˆ˜ð ,Ð3‘¼¿¹ÀÓ9NˆØ˜&Ñ ˆØ˜&Ñ ˆô
 Ÿ'™' .°AÑ"5Ó6¸Ñ=ˆÜŸ™ Ó/ˆà~‰~×+Ó+àÐ#Ü—}‘} T°·±Ô?‘à#Ø !§¡ nÑ 4°ÈÑ7PÑ PˆD*ÐØ×!Ò!Ø)×-Ñ-Ó/R‘ð Ð"Ü—x‘x u¨e n¸G¿M¹MÔJ‘à"áà˜T ?Ð2Ð2ô
 ‰˜qÔ!à—C‘CÜ×'Ñ'Ø'¨Ð+°I¸yÐ3Iôñð ñ	÷
 ‘'“)ð [j[ + : +Ð-Ò.ð $¢A t GÑ,¨qÑ0Ü13·±¸¿¹¸R³[j[ + : +Ð-Ñ.à Ò"ð —‘˜RÓ Ø8z EÑ)¨e°a©iÐ8óà$ñ%ó ð ×!Ò!ð —S‘S˜>Ñ)Ø "SbS˜"W‘Ø "R˜˜"˜W‘Ø-×1Ñ1Ó3V’ô &Ð%àT˜?Ð*Ð*r   c                 óB  ‡ ‡‡‡‡‡‡‡‡‡‡‡‡‡— ‰j                   ‰ j                  j                  c\  }ŠŠ‰t        ‰ j                  «      z   Š‰ j                  ‰‰«      \  Š}}	‰€|nt        j                  ‰«      Š‰ j                  j                  sJ‰ j                  j                  ||	‰|¬«      \  }
}|
‰z  }
|‰z  }t        j                  ‰‰j                  ¬«      }‰j                  |
z  ‰‰z  z   |d‰ ‰ j                  r|
j                  «       |d<   |j                  «       Št        j                  ‰«      rt        j                  |df||f¬«      ‰z  Šn|dd…t        j                   f   ‰z  Š‰ j                  rMt        j"                  t        j$                  ‰j                  d¬«      «      «      Št        j&                  ‰«      Šˆˆˆˆˆˆˆ fd„}||fS ‰ j                  j)                  ||	‰|¬«      \  }
Š|
‰z  }
t        j*                  ‰‰f‰j                  d	¬
«      }|
j                  ‰z  ‰‰z  z   |dd…d‰…f<   ‰ j                  r|
j                  d¬«      |dd…df<   ˆˆˆˆˆˆˆˆˆ ˆˆfd„}‰j,                  dk(  r|j/                  d	¬«      |fS ||fS )a¡  Computes gradient and hessp (hessian product function) w.r.t. coef.

        Parameters
        ----------
        coef : ndarray of shape (n_dof,), (n_classes, n_dof) or (n_classes * n_dof,)
            Coefficients of a linear model.
            If shape (n_classes * n_dof,), the classes of one feature are contiguous,
            i.e. one reconstructs the 2d-array via
            coef.reshape((n_classes, -1), order="F").
        X : {array-like, sparse matrix} of shape (n_samples, n_features)
            Training data.
        y : contiguous array of shape (n_samples,)
            Observed, true target values.
        sample_weight : None or contiguous array of shape (n_samples,), default=None
            Sample weights.
        l2_reg_strength : float, default=0.0
            L2 regularization strength
        n_threads : int, default=1
            Number of OpenMP threads to use.

        Returns
        -------
        gradient : ndarray of shape coef.shape
             The gradient of the loss.

        hessp : callable
            Function that takes in a vector input of shape of gradient and
            and returns matrix-vector product with hessian.
        Nr2   r:   r!   r   rK   r<   c                 ó‚  •— t        j                  | «      }t        j                  ‰«      r‰j                  ‰| d ‰ z  z  |d ‰ n2t         j
                  j                  ‰j                  ‰| d ‰ g«      |d ‰ |d ‰xxx ‰| d ‰ z  z  ccc ‰j                  r(|d ‰xxx | d   ‰z  z  ccc ‰| d ‰ z  ‰| d   z  z   |d<   |S )Nr!   )r   rA   r   rO   r*   ÚlinalgÚ	multi_dotr   )	ÚsÚretr   ÚhXÚhX_sumÚhessian_sumr.   r   r   s	     €€€€€€€r   Úhesspz7LinearModelLoss.gradient_hessian_product.<locals>.hesspR  sÐ   ø€ Ü—m‘m AÓ&Ü—?‘? 1Ô%Ø'(§s¡s¨b°1°[°j°>Ñ.AÑ'BC˜˜Ñ$ä')§y¡y×':Ñ':¸A¿C¹CÀÀQÀ{È
À^Ð;TÓ'UC˜˜Ð$ØKZÓ  O°a¸¸°nÑ$DÑDÓ à×%Ò%Ø˜˜Ó$¨¨"©°©Ñ6Ó$Ø$ q¨¨* ~Ñ5¸ÀaÈÁeÑ8KÑKC˜‘GØ
r   r   r;   c                 óV  •— | j                  ‰dfd¬«      } ‰j                  r| d d …df   }| d d …d d…f   } nd}‰| j                  z  |z   }|‰
 |z  j                  d¬«      d d …t        j
                  f   z  }|‰
z  }‰|‰d d …t        j
                  f   z  }t	        j                  ‰‰f‰j                  d¬«      }|j                  ‰z  ‰z  ‰| z  z   |d d …d ‰	…f<   ‰j                  r|j                  d¬«      ‰z  |d d …df<   ‰j                  dk(  r|j                  d¬«      S |S )Nr!   r   r#   r   r   r<   r;   )
r%   r   r*   r@   r   ÚnewaxisrB   r   r$   rC   )r_   Ús_interceptÚtmpÚ	hess_prodr   r   r.   r   r   r   Úprobar4   r   rF   r'   s       €€€€€€€€€€€r   rd   z7LinearModelLoss.gradient_hessian_product.<locals>.hessp†  s8  ø€ Ø—I‘I˜y¨"˜o°SIÓ9Ø×%Ò%Ø"#¢A r E¡(KØš!˜S˜b˜S˜&™	‘Aà"#KØ˜!Ÿ#™#‘g Ñ+Ø˜˜ ™×)Ñ)¨qÐ)Ó1²!´R·Z±Z°-Ñ@Ñ@Øu‘Ø Ð,Ø˜=ª¬B¯J©J¨Ñ7Ñ7Cô ŸH™H i°Ð%7¸w¿}¹}ÐTWÔX	Ø-0¯U©U°Q©Y¸&Ñ,@À?ÐUVÑCVÑ,V	š!˜[˜j˜[˜.Ñ)Ø×%Ò%Ø'*§w¡w°A w£¸Ñ'?Iša ˜eÑ$Ø—9‘9 ’>Ø$Ÿ?™?°˜?Ó5Ð5à$Ð$r   r   r#   )r   r
   r   r>   r   r,   r   r@   r   rL   rA   r   r*   r   rO   rP   rf   ÚsqueezeÚasarrayÚ
atleast_1dÚgradient_probarB   r$   rC   )r   r   r   r8   r4   r.   r5   rD   r&   r+   rE   rV   rG   rd   ra   rb   rc   r   r   r   rj   rF   r'   s   ``` ``        @@@@@@@@@r   Úgradient_hessian_productz(LinearModelLoss.gradient_hessian_product	  s‰  ÿý€ ð@ ./¯W©W°d·n±n×6NÑ6NÐ*ÑˆJ ØœS ×!3Ñ!3Ó4Ñ4ˆØ-1×-FÑ-FÀtÈQÓ-OÑ*ˆ˜NØ+Ð3‘¼¿¹ÀÓ9Nˆà~‰~×+Ó+Ø-1¯^©^×-LÑ-LØØ-Ø+Ø#ð	 .Mó .Ñ*ˆN˜Nð ˜fÑ$ˆNØ˜fÑ$ˆNÜ—=‘= ¨W¯]©]Ô;ˆDØ !§¡ nÑ 4°ÈÑ7PÑ PˆD*ÐØ×!Ò!Ø)×-Ñ-Ó/R‘ð )×,Ñ,Ó.ˆKÜ‰˜qÔ!ä×%Ñ% ~°qÐ&9À)ÈYÐAWÔXØññ ð
 $¢A¤r§z¡z MÑ2°QÑ6à×!Ò!ô Ÿ™¤B§J¡J¨r¯v©v¸1¨v«~Ó$>Ó?äŸ™ vÓ.÷ò ð\ Uˆ{Ððw %)§N¡N×$AÑ$AØØ-Ø+Ø#ð	 %Bó %Ñ!ˆN˜Eð ˜fÑ$ˆNÜ—8‘8˜Y¨Ð.°g·m±mÈ3ÔOˆDØ#1×#3Ñ#3°aÑ#7¸/ÈGÑ:SÑ#SˆD’KZKÑ Ø×!Ò!Ø,×0Ñ0°aÐ0Ó8’Q˜U‘÷.%ö %ð. y‰y˜AŠ~Ø—z‘z¨zÓ,¨eÐ3Ð3àUˆ{Ðr   r	   )Nr"   r   N)Nr"   r   NNN)Nr"   r   )Ú__name__Ú
__module__Ú__qualname__Ú__doc__r   r   r(   r,   r0   r6   r?   rI   rL   ro   © r   r   r   r      sŠ   „ ñ7òr+óò8%"òN2ò@/ð ØØØó4@ðv ØØØóLðf ØØØóGð\ ØØØØØóI+ðX NOôWr   r   )rs   Únumpyr   Úscipyr   Úutils.extmathr   r   rt   r   r   Ú<module>rx      s!   ðñó Ý å (÷U
ò U
r   