
    =[gH              
       ^   d dl Z d dlZd dlZd dlmZmZmZ d dlm	Z	 d dl
mZmZmZmZmZmZmZmZmZmZmZmZmZmZ d dlmZmZ d dlmZ d dlmZ d dl m!Z!m"Z" eeeeeeegZ#d	 Z$d
 Z%d Z&d Z'd Z(d Z)d Z*d Z+d2dZ,d Z-d Z.d Z/d Z0d Z1ejd                  jg                  d e             d        Z4d Z5d Z6d Z7d3dZ8d Z9d Z:ejd                  jg                  dd gd!z  g d"fd#gd!z  g d"fg d"d gd!z  fg d"d#gd!z  fd gd!z  d gd!z  fg      d$        Z;d% Z<d& Z=d' Z>d( Z?ejd                  jg                  d) e@ eAd*             e@ eAd*            f ej                  d+       ej                  d+      fg      d,        ZCd- ZDd. ZEejd                  jg                  d/g d0      d1        ZFy)4    N)assert_allcloseassert_array_almost_equalassert_array_equal)config_context)adjusted_mutual_info_scoreadjusted_rand_scorecompleteness_scorecontingency_matrixentropyexpected_mutual_informationfowlkes_mallows_score"homogeneity_completeness_v_measurehomogeneity_scoremutual_info_scorenormalized_mutual_info_scorepair_confusion_matrix
rand_scorev_measure_score)_generalized_averagecheck_clusterings)assert_all_finite))yield_namespace_device_dtype_combinations)_array_api_for_testsassert_almost_equalc                     t         D ]  } d}t        j                  t        |      5   | ddgg d       d d d        d}t        j                  t        |      5   | ddgddggg d       d d d        d}t        j                  t        |      5   | g dddgddgg       d d d         y # 1 sw Y   zxY w# 1 sw Y   OxY w# 1 sw Y   xY w)	NzDFound input variables with inconsistent numbers of samples: \[2, 3\]matchr      )r   r   r   z$labels_true must be 1D: shape is \(2z$labels_pred must be 1D: shape is \(2r   r   r   )score_funcspytestraises
ValueError)
score_funcexpecteds     h/var/www/html/bid-api/venv/lib/python3.12/site-packages/sklearn/metrics/cluster/tests/test_supervised.py"test_error_messages_on_wrong_inputr'   (   s    !
W 	 ]]:X61vy) 7 ;]]:X6AA'3 7 ;]]:X6yAq6Aq6"23 76 " 76 76 76s#   B.B:C.B7	:C	C	c                  $   d\  } }g d}|D cg c]  }t        | ||       }}|d   |d   cxk  r|d   cxk  r	|d   k  sJ  J d\  }}|D cg c]  }t        |||       }}|d   |d   cxk(  r|d   cxk(  r	|d   k(  sJ  J y c c}w c c}w )N)r      min	geometric
arithmeticmaxr   r   r)      )   r0   )r   )abmethodsmethodmeanscds          r&   test_generalized_averager8   9   s    DAq7G>EFgF!!Q/gEF8uQx7587uQx77777DAq>EFgF!!Q/gEF8uQx7587uQx77777	 G Gs   BBc                  n   t         D ]  }  | g g       t        j                  d      k(  sJ  | dgdg      t        j                  d      k(  sJ  | g dg d      t        j                  d      k(  sJ  | g dg d      t        j                  d      k(  sJ  | g dg d      t        j                  d      k(  sJ  | g d	g d
      t        j                  d      k(  sJ  | g dg d      t        j                  d      k(  rJ  t        t        g}h d}|D ]  } |D ]  } | g g |      t        j                  d      k(  sJ  | dgdg|      t        j                  d      k(  sJ  | g dg d|      t        j                  d      k(  sJ  | g dg d|      t        j                  d      k(  sJ  | g dg d|      t        j                  d      k(  sJ  | g d	g d
|      t        j                  d      k(  sJ  | g dg d|      t        j                  d      k(  rJ   y )N      ?r   r   )r   r   r   r   )*      r;   )        r:   r=   )      E@      @r>   )r=   r:          @)r>   r?   r@   )r   r   r)   )r;   r<   r)   >   r.   r+   r,   r-   average_method)r    r!   approxr   r   )r$   score_funcs_with_changing_meansr5   means       r&   test_perfect_matchesrF   C   s/   !
"b!V]]3%77771#s#v}}S'9999)Y/6==3EEEE)[1V]]35GGGG/+<=sASSSS/+;<c@RRRR)Z0FMM#4FFFF " 	%"'# 6E5
Db"T:fmmC>PPPPqcA3t<c@RRRR9Ts#$ $ $ ;ts#$ $ $ !24s#$ $ $ !1$s#$ $ $ :ds#$ $ $  6    c                  z    t        g dg d      \  } }}t        | dd       t        |dd       t        |dd       y )Nr   r   r   r   r   r   )r   r   r   r   r)   r)   r:   r)   gGz?gQ?r   r   hr6   vs      r&   *test_homogeneous_but_not_complete_labelingrN   f   :    01CEWXGAq!4#4#4#rG   c                  z    t        g dg d      \  } }}t        | dd       t        |dd       t        |dd       y )Nr   r   r   r   r)   r)   )r   r   r   r   r   r   g(\?r)   r:   g\(\?rJ   rK   s      r&   *test_complete_but_not_homogeneous_labelingrR   n   rO   rG   c                  z    t        g dg d      \  } }}t        | dd       t        |dd       t        |dd       y )NrI   r   r   r   r   r)   r)   q=
ףp?r)   zG?p=
ף?rJ   rK   s      r&   .test_not_complete_and_not_homogeneous_labelingrX   v   rO   rG   c                      d} d}d}d| z   |z  |z  | |z  |z   z  }t        g dg d|       \  }}}t        ||d       t        ||d       t        ||d       t        g dg d|       }t        ||d       y )	Ng?rU   rV   r   rI   rT   )betar)   )r   r   r   )	beta_testh_testc_testv_testrL   r6   rM   s          r&   test_beta_parameterr_   ~   s     IFF)mv%.)f2Dv2MNF0.YGAq! 61%61%61%*,>YOA61%rG   c                     t        g dg d      \  } }}t        | dd       t        |dd       t        |dd       t        g dg d      \  } }}t        | dd       t        |dd       t        |dd       t        g dg d      }t        g dg d      }t        |d	d       t        |d	d       t        g dg d      }t        g dg d      }t        |d
d       t        |d
d       y )N)r   r   r   r)   r)   r)   rT   rU   r)   rV   rW   rI   )r      r   ra   r)   r)   gQ?gQ?)r   r   r   r   )rL   r6   rM   ari_1ari_2ri_1ri_2s          r&   test_non_consecutive_labelsrf      s    01CEWXGAq!4#4#4#01CEWXGAq!4#4#4# 24FGE 24FGEtQ'tQ'(*<=D(*<=DdA&dA&rG   c                 &   t         j                  j                  |      j                  }t        j                  t        |      |f      }t        |      D ]9  \  }}t        |      D ]&  }	 |d||      }
 |d||      } | |
|      |||	f<   ( ; |S )Nr   )lowhighsize)nprandomRandomStaterandintzeroslen	enumeraterange)r$   	n_samplesk_rangen_runsseedrandom_labelsscoresikjlabels_alabels_bs               r&   uniform_labelings_scoresr~      s    II))$/77MXXs7|V,-F'"1vA$CH$CH%h9F1a4L  #
 MrG   c                      g d} d}d}t        t        || |      }t        j                  |      j	                  d      }t        |g dd       y )N)r)   
   2   Z   d   r   r   )axis){Gz?Q?r   r   r)   )r~   r   rk   absr.   r   )n_clusters_rangers   ru   rx   max_abs_scoress        r&   test_adjustment_for_chancer      sP    &IF%Y(8&F VVF^''Q'/Nn.FJrG   c                     t        j                  g d      } t        j                  g d      }t        | |      }t        |dd       t	        | |d      }t        | ||      }t        |dd       t	        | |      }t        | ||      }t        |dd       |j                         }t        ||      }t        |dd       t        | |      }t        |d	d       t        g d
g d      }|t        j                  d      k(  sJ t        j                  t        |       dz  g      j                         }t        j                  t        |      dz  g      j                         }t        ||      }t        |dd       y )Nr   r   r   r   r   r   r)   r)   r)   r)   r)   r)   r/   r/   r/   r/   r/   r   r   r   r   r)   r   r)   r)   r)   r)   r/   r   r/   r/   r/   r)   r)   gS
cA?   Tsparse)contingencygpUj@?gP1?)r   r   r)   r)   )r)   r)   r/   r/   r:   n   gRQ?r)   )rk   arrayr   r   r
   sumr   r   r!   rC   listflatten)	r|   r}   miCrs   emiamia110b110s	            r&   test_adjusted_mutual_info_scorer      sB   xxKLHxxKLH	8X	.BGQ'8Xd;A	8X1	=BGQ'8X.A	8X1	=BGQ'I
%a
3CWa(
$Xx
8CWa(
$\<
@C&--$$$$88T(^c)*+335D88T(^c)*+335D
$T4
0CT1%rG   c                  P    t        t        j                  dgg      d      dk  sJ y )Nip r   )r   rk   r    rG   r&   "test_expected_mutual_info_overflowr      s&     'rxx%	':EBaGGGrG   c                  r   t        j                  dgdz  dgdz  z   dgdz  z   dgdz  z   d	gd
z  z         } t        j                  dgdz  dgdz  z   dgdz  z   dgdz  z   dgdz  z   dgdz  z   dgdz  z   dgdz  z   dgdz  z   dgdz  z         }t        t        | |             t        t	        | |             y )Nr   iy  r)   i]<  r/   i  ra   iU  r   iP  r   i  i	  iD9  i  i     i.  '   i<     )rk   r   r   r   r   )xys     r&   3test_int_overflow_mutual_info_fowlkes_mallows_scorer      s!   
	
|#
	#
	 #
	 #
			A 		
e#*	#+	 #)	 #*		
 #)	 #)	 #(	 #)	 #(			A '1-.+Aq12rG   c                      t        t        g d      dd       t        t        g       d       t        g d      dk(  sJ y )Nr   r   r>   ,^R^?r   r   r   r   r   r   r   )r   r   r   rG   r&   test_entropyr     s4    -y!<Q'< A%%%rG   z#array_namespace, device, dtype_namec                    t        | |      }|j                  t        j                  g d|      |      }|j                  g |j                  |      }|j                  g d|      }t	        d      5  t        |      t        j                  dd	
      k(  sJ t        |      dk(  sJ t        |      dk(  sJ 	 d d d        y # 1 sw Y   y xY w)Nr   dtype)device)r   r   r   T)array_api_dispatchr   gh㈵>)r   r   r   )r   asarrayrk   int32r   r   r!   rC   )array_namespacer   
dtype_namexpfloat_labelsempty_int32_labels
int_labelss          r&   test_entropy_array_apir     s     
ov	6B::bjjZHQW:XLBbhhvFL8J	4	0|$iT(JJJJ)*a///z"a''' 
1	0	0s   6ACCc            	      T   t        j                  g d      } t        j                  g d      }t        | |      }t        j                  | |t        j                  dd      t        j                  dd      f      d   }t        ||       t        | |d      }t        ||dz          y )	Nr   r   r   r   )binsr   g?)eps)rk   r   r
   histogram2daranger   )r|   r}   r   C2s       r&   test_contingency_matrixr     s    xxKLHxxKLH8X.A	("))Aq/299QPQ?1S	TUV	WBa$8X37Aac*rG   c                  F   t        j                  g d      } t        j                  g d      }t        | |      }t        | |d      j                         }t	        ||       t        j                  t        d      5  t        | |dd       d d d        y # 1 sw Y   y xY w)	Nr   r   Tr   z!Cannot set 'eps' when sparse=Truer   g|=)r   r   )rk   r   r
   toarrayr   r!   r"   r#   )r|   r}   r   C_sparses       r&   test_contingency_matrix_sparser      sw    xxKLHxxKLH8X.A!(HTBJJLHa*	z)L	M8X5F 
N	M	Ms   >BB c                     t        j                  ddd      j                  t              D ]  } t        j                  | t              t        j
                  | t              }}t        ||      t        j                  d      k(  sJ t        ||      t        j                  d      k(  sJ t        ||      t        j                  d      k(  sJ t        ||      t        j                  d      k(  sJ dD ]N  }t        |||      t        j                  d      k(  sJ t        |||      t        j                  d      k(  rNJ   y )Nr   ra   r   r=   r*   rA   )rk   logspaceastypeintonesr   r   r!   rC   r   r   )ry   r|   r}   r4   s       r&   test_exactly_zero_info_scorer   *  s   [[Aq!((- ggas3RYYq5L(+Hh?6==QTCUUUUx2fmmC6HHHH)(H=sASSSS+Hh?6==QTCUUUU?F-(6s#$ $ $ 0(6s#$ $ $	 @ .rG   c           	         t        j                  ddd      j                  t              D ]  }t         j                  j                  |       }|j                  dd|      |j                  dd|      }}t        t        ||      dt        ||      z  t        |      t        |      z   z  d       d}t        t        ||      t        |||              y )Nr   ra   r   r   r@   r-   rA   )rk   r   r   r   rl   rm   rn   r   r   r   r   r   )rv   ry   random_stater|   r}   avgs         r&   %test_v_measure_and_mutual_informationr   ;  s    [[Aq!((-yy,,T2  B*  B*  	Hh/(34x 78#446 	
 Hh/(8CP	
 .rG   c                      t        g dg d      } t        | dt        j                  d      z         t        g dg d      }t        |d       t        g dg d      }t        |d	       y )
NrI   rQ   g      @g      R@)r   r   r   r   r   r   r:   )r   r   r   r   r   r   )r   r   r)   r/   ra   r   r=   )r   r   rk   sqrt)scoreperfect_scoreworst_scores      r&   test_fowlkes_mallows_scorer   Q  s\    !"46HIEsRWWZ%889 **<>PQMs+ ((:<NOKS)rG   c                  h   t        j                  g d      } t        j                  g d      }dt        j                  d      z  }t        | |      }t	        ||       t        ||       }t	        ||       t        | dz   dz  |      }t	        ||       t        || dz   dz        }t	        ||       y )N)r   r   r   r   r   r)   )r   r   r)   r)   r   r   r:   g      (@r   r/   r)   )rk   r   r   r   r   )r|   r}   r%   score_originalscore_symmetricscore_permuted
score_boths          r&   %test_fowlkes_mallows_score_propertiesr   _  s    xx*+Hxx*+HRWW677H +8X>N1 ,Hh?O2 +HqLA+=xHN1 'x(Q,!1CDJ
H-rG   zlabels_true, labels_predr1      )r   r   r   r   r   r   r   c                 &    t        | |      dk(  sJ y )Nr   )r   )labels_truelabels_preds     r&   .test_mutual_info_score_positive_constant_labelr   v  s     [+6!;;;rG   c                     t         j                  j                  d      } | j                  d      }t        j                  ddd      dz  }d}t        j                  t        |      5  t        ||       d d d        y # 1 sw Y   y xY w)Nr;   i  g{Gz?r   gư>zuClustering metrics expects discrete values but received continuous values for label, and continuous values for targetr   )	rk   rl   rm   randlinspacer!   warnsUserWarningr   )rngnoise
wavelengthmsgs       r&   test_check_clustering_errorr     sj    
))


#CHHSMET1c*T1J	  
k	-*e, 
.	-	-s   (A>>Bc                      d} t        t        |             }|}t        j                  | | dz
  z  dgddgg      }t	        t        ||      |       y )Nr   r   r   )r   rr   rk   r   r   r   Nclustering1clustering2r%   s       r&   *test_pair_confusion_matrix_fully_dispersedr     sO    AuQx.KKxx!q1u+q)Aq623H,[+FQrG   c                      d} t        j                  | f      }|}t        j                  ddgd| | dz
  z  gg      }t        t	        ||      |       y )Nr   r   r   )rk   ro   r   r   r   r   s       r&   )test_pair_confusion_matrix_single_clusterr     sQ    A((A4.KKxx!Q!Q!a%[!123H,[+FQrG   c                  R   d} | dz  }t        j                  t        |       D cg c]  }|dz   g| z   c}      }t        j                  t        |       D cg c]  }|dz   g| dz   z   c}      d | }t        j                  dt         j                        }t        t        |            D ]X  }t        t        |            D ]?  }||k7  s	t        ||   ||   k(        }t        ||   ||   k(        }|||fxx   dz  cc<   A Z t        t        ||      |       y c c}w c c}w )Nr   r)   r   )r)   r)   )shaper   )	rk   hstackrr   ro   int64rp   r   r   r   )	nr   ry   r   r   r%   r{   same_cluster_1same_cluster_2s	            r&   test_pair_confusion_matrixr     s   
A	1A))%(;(Qa!eWq[(;<K))aA1a!eWA.AB2AFKxxfBHH5H3{#$s;'(AAv!$[^{1~%E!F!$[^{1~%E!F78A=8	 ) % ,[+FQ <As   DD$zclustering1, clustering2r   )r   c                 0    t        t        | |      d       y )Nr:   r   r   )r   r   s     r&   test_rand_score_edge_casesr     s     J{K8#>rG   c                      g d} g d}d}d}d}d|z
  |z
  |z
  }||z   }||z   |z   |z   }||z  }t        t        | |      |       y )NrI   rT   ra      r)      r   )	r   r   D11D10D01D00expected_numeratorexpected_denominatorr%   s	            r&   test_rand_scorer    sg    $K$K
C
C
C
#+
c
!Cs9s?S0!$88HJ{K8(CrG   c                  l   t         j                  j                  d      } | j                  dddt         j                        }| j                  dddt         j                        }t        j                         5  t        j                  dt               t        ||       ddd       y# 1 sw Y   yxY w)zCheck that large amount of data will not lead to overflow in
    `adjusted_rand_score`.
    Non-regression test for:
    https://github.com/scikit-learn/scikit-learn/issues/20305
    r   r)   i r   errorN)
rk   rl   rm   rn   int8warningscatch_warningssimplefilterRuntimeWarningr   )r   y_truey_preds      r&   !test_adjusted_rand_score_overflowr    s~     ))


"C[[Awbgg[6F[[Awbgg[6F		 	 	"g~6FF+ 
#	"	"s   :'B**B3rB   )r+   r-   r,   r.   c                     dgdz  }dg|dd z   }ddg|dd z   }t        |||       }|dk(  sJ t        |||       }d|cxk  rdk  sJ  J y)zCheck that nmi returns a score between 0 (included) and 1 (excluded
    for non-perfect match)

    Non-regression test for issue #13836
    r   i  r   Nr)   rA   )r   )rB   labels1labels2labels3nmis        r&   )test_normalized_mutual_info_score_boundedr    su     cCiGcGABKG!fwqr{"G 'w
WC!8O8 'w
WC<a<<<rG   )r   r;   )$   )Gr  numpyrk   r!   numpy.testingr   r   r   sklearn.baser   sklearn.metrics.clusterr   r   r	   r
   r   r   r   r   r   r   r   r   r   r   #sklearn.metrics.cluster._supervisedr   r   sklearn.utilsr   sklearn.utils._array_apir   sklearn.utils._testingr   r   r    r'   r8   rF   rN   rR   rX   r_   rf   r~   r   r   r   r   r   markparametrizer   r   r   r   r   r   r   r   r   r   r   r   r   rr   ro   r   r  r  r  r   rG   r&   <module>r#     s      X X '     X + N L  4"8 $F$$$&('.	K&>H34& )+T+V((+G$"
,*.. 
&'
q$%	cUQY'	aS1W%
SEAI	<	<-RRR" 
5:U3Z()HBHHV,<hbhhv>N+OP?	?D , )+TU VrG   