U
    f/eH/                     @   sn   d dl Zd dlZd dlmZ d dlmZmZmZ d dl	m
Z d dlm  mZ G dd dZG dd dZdS )    N)np_version_under1p18)	DataFrameIndexSeriesc                   @   s   e Zd Zejeegddd Zej	de
eddd Zdd	 Zd
d Zdd Zdd Zdd Zdd Zdd Zdd Zdd Zdd Zdd Zej	ddd d!d"d#gfejd$d!ejjed%d&d'ejd(d)ejjed%d&d'gd*d+ Zd,d- Zd.S )/
TestSample)paramsc                 C   s6   |j }|tkrtjd}ntjdd}||d dS )N
   )Zdtype)paramr   nprandomrandn)selfrequestklassZarr r   J/tmp/pip-unpacked-wheel-tiezk1ph/pandas/tests/frame/methods/test_sample.pyobj   s
    zTestSample.objtestr   c              	   C   sB  t jdd}t|jd|d|jd|d t|jd|d|jd|d t|jdt j|d|jdt j|d t|jdt j|d|jdt j|d t|jddt j|d	|jddt j|d	 g g  }}tdD ]4}t j| |	|jdd
 |	|jdd qtj|  tj|  d S )Nr   d      nrandom_stategffffff?)fracr      T)r   replacer   r   r   )
r
   r   randinttmassert_equalsampleZRandomStaterangeseedappend)r   r   r   r#   Zos1Zos2_r   r   r   test_sample   s8     

zTestSample.test_samplec                 C   sL   t |jdddkstt |jdddks0tt |jdddksHtd S )Nr   r   g(\?r      g
ףp=
?)lenr!   AssertionErrorr   r   r   r   r   test_sample_lengthsA   s    zTestSample.test_sample_lengthsc              	   C   s.   d}t jt|d |jdd W 5 Q R X d S )NzYrandom_state must be an integer, array-like, a BitGenerator, a numpy RandomState, or NonematchZa_string)r   pytestraises
ValueErrorr!   r   r   msgr   r   r    test_sample_invalid_random_stateG   s    z+TestSample.test_sample_invalid_random_statec              	   C   s0   d}t jt|d |jddd W 5 Q R X d S )Nz0Please enter a value for `frac` OR `n`, not bothr,   r'   g333333?)r   r   r.   r2   r   r   r   "test_sample_wont_accept_n_and_fracP   s    z-TestSample.test_sample_wont_accept_n_and_fracc              	   C   sT   d}t jt|d |jdd W 5 Q R X t jt|d |jdd W 5 Q R X d S )NzCA negative number of rows requested. Please provide positive value.r,   r   g333333ӿr   r.   r2   r   r   r   $test_sample_requires_positive_n_fracV   s
    z/TestSample.test_sample_requires_positive_n_fracc              	   C   s*   t jtdd |jdd W 5 Q R X d S )Nz$Only integers accepted as `n` valuesr,   g	@r   r.   r*   r   r   r   test_sample_requires_integer_n]   s    z)TestSample.test_sample_requires_integer_nc              	   C   s   d}t jt|d |jdddgd W 5 Q R X t jt|d dgd }|jd|d W 5 Q R X t jtd	d" tddd
g}|jd|d W 5 Q R X d S )N5Weights and axis to be sampled must be of same lengthr,   r'   r      r   weights      ?   z%Fewer non-zero entries in p than sizeg?r   )r/   r0   r1   r!   r   )r   r   r3   bad_weightsZbad_weight_seriesr   r   r   "test_sample_invalid_weight_lengthsb   s    
z-TestSample.test_sample_invalid_weight_lengthsc              	   C   s:   dgd }d}t jt|d |jd|d W 5 Q R X d S )Ngr   z.weight vector many not include negative valuesr,   r'   r;   r.   )r   r   r?   r3   r   r   r   test_sample_negative_weightsp   s    
z'TestSample.test_sample_negative_weightsc              	   C   s   dgd }t j|d< d}tjt|d |jd|d W 5 Q R X dgd }t j |d< tjt|d |jd|d W 5 Q R X d S )Ng?r   r   z*weight vector may not include `inf` valuesr,   r'   r;   )r
   infr/   r0   r1   r!   )r   r   Zweights_with_infr3   Zweights_with_ninfr   r   r   test_sample_inf_weightsw   s    


z"TestSample.test_sample_inf_weightsc              	   C   s6   dgd }t jtdd |jd|d W 5 Q R X d S )Nr   r   $Invalid weights: weights sum to zeror,   r'   r;   r.   )r   r   Zzero_weightsr   r   r   test_sample_zero_weights   s    
z#TestSample.test_sample_zero_weightsc              	   C   s8   t jgd }tjtdd |jd|d W 5 Q R X d S )Nr   rD   r,   r'   r;   )r
   nanr/   r0   r1   r!   )r   r   Znan_weightsr   r   r   test_sample_missing_weights   s    z&TestSample.test_sample_missing_weightsc                 C   s8   d gd }d|d< t |jdd|d|jdd  d S )Nr   r=      r:   r   r   axisr<      )r   r    r!   iloc)r   r   Zweights_with_Noner   r   r   test_sample_none_weights   s    
 z#TestSample.test_sample_none_weightszfunc_str,argznp.arrayr   r'   r:   r   znp.random.MT19937z
NumPy<1.18)reason)Zmarksznp.random.PCG64r>   c                 C   sl   t tddtddd}|tkr*|d }|jdt||d}|jdtt||d}t|| d S )Nr         col1col2rR   r'   r   )	r   r"   r   r!   evalcomr   r   r    )r   Zfunc_strargframe_or_seriesr   resultexpectedr   r   r   test_sample_random_state   s    z#TestSample.test_sample_random_statec              	   C   sP   t dtdi}|tkr |d }d}tjt|d |jddd W 5 Q R X d S )NAabczJReplace has to be set to `True` when upsampling the population `frac` > 1.r,   r   F)r   r   )r   listr   r/   r0   r1   r!   )r   rW   r   r3   r   r   r   *test_sample_upsampling_without_replacement   s    z5TestSample.test_sample_upsampling_without_replacementN)__name__
__module____qualname__r/   Zfixturer   r   r   markZparametrizer]   r"   r&   r+   r4   r5   r7   r8   r@   rA   rC   rE   rG   rM   r	   Zskipifr   rZ   r^   r   r   r   r   r      s@   

'	
	r   c                   @   s4   e Zd Zdd Zdd Zdd Zdd Zd	d
 ZdS )TestSampleDataFramec           	   	   C   s  dgd }d|d< t tddtdddgd |d}|jdd	d
}t||jdd  ttd}d}tjt	|d |jddd
 W 5 Q R X d}tjt	|d |jdddd W 5 Q R X tjt
dd |jddd
 W 5 Q R X dgd }d|d< t|jd|d
|jd d  t tddgd d}ddg}t|jdd|d|dg  t|jdd|d|dg  dgd }d|d< t|jdd|d|jdd  t|jdd|d|jdd  d}tjt	|d |jddd W 5 Q R X d}tjt	|d |jddd W 5 Q R X ttd}tjt	d d |jddd W 5 Q R X d!}tjt	|d |jdddgd d W 5 Q R X d S )"Nr   r   r:   rH   rO   rP   a)rR   rS   	colStringeasyweightsrf   r;   rK   z@Strings cannot be passed as weights when sampling from a Series.r,   r'   Zweight_columnzLStrings can only be passed to weights when sampling from rows on a DataFrame)r   r<   rJ   z-'String passed to weights not a valid column'Znot_a_real_column_namer=   rQ   rI   rS   columnsZrowsindexz)No axis named 2 for object type DataFramer   )r   rJ   z2No axis named not_a_name for object type DataFrameZ
not_a_namez&No axis named 1 for object type Seriesr9   )r   r"   r!   r   assert_frame_equalrL   r   r/   r0   r1   KeyError)	r   easy_weight_listdfsample1serr3   Zweights_less_than_1Zsecond_column_weightZweightr   r   r   r&      sp    
 
   
" zTestSampleDataFrame.test_samplec                 C   s|   dgd }d|d< t tddtdddgd d	}|jdd|d
}t||dg  t|jddd|jdddd d S )Nr   r'   r:   r   r   rO   rP   rd   rR   rS   re   rI   re   *   r   )r   rJ   r   )r   r"   r!   r   ri   )r   rk   rl   rm   r   r   r   test_sample_axis1  s    
 z%TestSampleDataFrame.test_sample_axis1c              	   C   s  t dddgdddgdddd	gd
}tdddgd	ddgd
}t|jd	g |jd|d tdddgd	ddgd
}t|jd	g |jd|d tddgd	dgd
}t|jd	g |jd|d tddgddgd
}tjtdd |jd|d W 5 Q R X d S )NrH   rK      rd   bcrQ   	   r'   )rh   r:   r   )r<   gMbP?i'  r   g{Gz?r   rD   r,   )	r   r   r   ri   locr!   r/   r0   r1   )r   rl   rn   Zser2Zser3Zser4r   r   r   %test_sample_aligns_weights_with_frame,  s    $z9TestSampleDataFrame.test_sample_aligns_weights_with_framec              	   C   sH   t tjdddddgd}|d}td  d|d< W 5 Q R X d S )	Nr   r'   rd   rs   rt   )rg   r:   d)r   r
   r   r   r!   r   Zassert_produces_warning)r   rl   Zdf2r   r   r   test_sample_is_copyB  s    
z'TestSampleDataFrame.test_sample_is_copyc                 C   sP   t tddtdddgd d}|jddd}td	d
dg}t|j| d S )Nr   rO   rP   rd   ro   r'   T)Zignore_indexr   r:   r   )r   r"   r!   r   r   Zassert_index_equalrh   )r   rl   rX   Zexpected_indexr   r   r   test_sample_ignore_indexK  s    z,TestSampleDataFrame.test_sample_ignore_indexN)r_   r`   ra   r&   rq   rw   ry   rz   r   r   r   r   rc      s
   U	rc   )Znumpyr
   r/   Zpandas.compatr   Zpandasr   r   r   Zpandas._testingZ_testingr   Zpandas.core.commoncorecommonrU   r   rc   r   r   r   r   <module>   s    5