U
    3d!                     @   s   d Z ddlmZ ddlZddlZddlmZ ddlm	Z	 ddlm
Z
 ddlmZ ddlmZ dd	lmZmZ dd
lmZ ddlmZ dd Zdd Zdd Zdd Zdd Zdd Zdd Zdd Zdd Zdd Zd d! Zd"d# Z d$d% Z!d&d' Z"d(d) Z#dS )*z+
Tests for the birch clustering algorithm.
    )sparseN)generate_clustered_data)Birch)AgglomerativeClustering)
make_blobs)ConvergenceWarning)pairwise_distances_argminv_measure_score)assert_array_equal)assert_allclosec                 C   s   t d| d\}}|j|dd}t }|| tdd |jjD }tdd | D }||jd kslt	||jd ks~t	d S )	N
   	n_samplesrandom_stateFcopyc                 S   s   g | ]
}|j qS  )
n_samples_).0scr   r   D/tmp/pip-unpacked-wheel-zrfo1fqw/sklearn/cluster/tests/test_birch.py
<listcomp>   s     z/test_n_samples_leaves_roots.<locals>.<listcomp>c                 S   s   g | ]}|j D ]
}|jqqS r   )subclusters_r   )r   Zleafr   r   r   r   r      s       r   )
r   astyper   fitsumroot_r   Z_get_leavesshapeAssertionError)global_random_seedglobal_dtypeXybrcZn_samples_rootZn_samples_leavesr   r   r   test_n_samples_leaves_roots   s    
r$   c                 C   s   t d| d\}}|j|dd}tdd}|| td d}||d d  ||dd   t|j|j |jdd |d  t|j	|j	 d S )Nd   r   Fr      
n_clusters2   )
r   r   r   r   partial_fitr   subcluster_centers_Z
set_paramsr
   subcluster_labels_)r   r    r!   r"   r#   Zbrc_partialr   r   r   test_partial_fit"   s    



r-   c           	      C   s   t j| }tdddd}|j|dd}t d}|| ||d d f }tddd	}|| |j	j
|ksrtt|j|| |j	}|jt|| }tt||jd d S )
Nr&   r   )r(   
n_featuresZn_samples_per_clusterFr         g      ?r(   	threshold)nprandomZRandomStater   r   Zarangeshuffler   r   r+   dtyper   r
   labels_Zpredictr,   r   r   r	   )	r   r    rngr!   Zshuffle_indicesZ	X_shuffler#   Z	centroidsZnearest_centroidr   r   r   test_birch_predict4   s    


r9   c              	   C   s   t dd| d\}}|j|dd}tdd}|| t|jdksFttt|j	dks^tt
dd}t|d}|| t|j|j t|j	|j	 tdd}tt || W 5 Q R X d S )	Nr%   r   r   Zcentersr   Fr   r'   g     @)r2   )r   r   r   r   lenr+   r   r3   uniquer7   r   r
   r,   pytestZwarnsr   )r   r    r!   r"   Zbrc1gcZbrc2Zbrc4r   r   r   test_n_clustersL   s    





r?   c                 C   s   t dd| d\}}|j|dd}tdd}|| t|}tdd}|| |jj|ksbtt	|j
|j
 t|j|j d S )Nr%   r   r:   Fr   r'   )r   r   r   r   r   Z
csr_matrixr+   r6   r   r
   r7   r   )r   r    r!   r"   r#   ZcsrZ
brc_sparser   r   r   test_sparse_Xc   s    




r@   c               	   C   s`   t dd\} }tdd}|| | d}tjt|d  || d d dgf | W 5 Q R X d S )Nr%   )r   r&   r'   z3X has 1 features, but Birch is expecting 2 features)matchr   )r   r   r*   r=   Zraises
ValueError)r!   r"   r#   msgr   r   r   )test_partial_fit_second_call_error_checksu   s    
rD   c                 C   s6   | j }|t|kst|D ]}|jrt|j| qd S )N)r   r;   r   Zchild_check_branching_factor)nodebranching_factorsubclustersZclusterr   r   r   rE      s
    rE   c                 C   sl   t | d\}}|j|dd}d}td |dd}|| t|j| td|dd}|| t|j| d S )Nr   Fr   	   g{Gz?)r(   rG   r2   r&   )r   r   r   r   rE   r   )r   r    r!   r"   rG   r#   r   r   r   test_branching_factor   s    

rK   c                 C   s6   | j j}|r2|j}|D ]}||jkstq|j}qdS )z&Use the leaf linked list for traversalN)Zdummy_leaf_Z
next_leaf_r   Zradiusr   )Zbirch_instancer2   Zcurrent_leafrH   r   r   r   r   check_threshold   s    rL   c                 C   sd   t dd| d\}}|j|dd}tdd d}|| t|d tdd d}|| t|d d S )	NP   r0   r:   Fr   g      ?)r2   r(   g      @)r   r   r   r   rL   )r   r    r!   r"   r#   r   r   r   test_threshold   s    


rN   c                  C   s,   t dd\} }td}t|d|  d S )Nr   rI      r'   )r   r3   Zint64r   r   )r!   _r(   r   r   r   test_birch_n_clusters_long_int   s    
rQ   c                  C   sV   t dddd\} }tdd}||  |jjd }| }tdd t|D | dS )	z*Check `get_feature_names_out` for `Birch`.rM   r0   r   r   r.   r   r'   c                 S   s   g | ]}d | qS )Zbirchr   )r   ir   r   r   r      s     z*test_feature_names_out.<locals>.<listcomp>N)r   r   r   r+   r   Zget_feature_names_outr
   range)r!   rP   r#   r(   Z	names_outr   r   r   test_feature_names_out   s    

rU   c                 C   sL   t dd| d\}}tddd}||}||tj}t||dd d S )NrM   r0   rR   g?r1   gư>)Zatol)r   r   Zfit_transformr   r3   float32r   )r   r!   rP   r#   ZY_64ZY_32r   r   r   "test_transform_match_across_dtypes   s
    
rW   c                 C   s@   t ddddd j| dd}tdd}||jj| ks<td S )NrM   r0   r   rR   Fr   r'   )r   r   r   r   r+   r6   r   )r    r!   r#   r   r   r   test_subcluster_dtype   s     
rX   c                  C   s   t jddgddgddgddgd	d
gddgddgddgddgddgddgddgddgd	d
gddgd	d
gddgddgddgddgddggt jd} tdddd|  dS )zCheck that both subclusters are updated when a node a split, even when there are
    duplicated data points. Non-regression test for #23269.
    g@̙Hg\sGg%g44Tg}Thg\Fgzog/IwgY+ctEgBlCg}
gr'g_ guXgaeR^g	AX7g.^g|SAgkg^#g@cgi8K)r6   rO   gh㈵>N)rG   r2   r(   )r3   arrayrV   r   r   )r!   r   r   r   test_both_subclusters_updated   s4    rZ   )$__doc__Zscipyr   Znumpyr3   r=   Zsklearn.cluster.tests.commonr   Zsklearn.clusterr   r   Zsklearn.datasetsr   Zsklearn.exceptionsr   Zsklearn.metricsr   r	   Zsklearn.utils._testingr
   r   r$   r-   r9   r?   r@   rD   rE   rK   rL   rN   rQ   rU   rW   rX   rZ   r   r   r   r   <module>   s4   
	