o
    թZhsD                     @   s  d dl m Z  d dlZd dlZd dlmZ d dlZd dlmZm	Z	m
Z
mZmZ d dlmZ d dlmZ ejdd Zejdd	 Zejd
d Zejdd Zejdd Zejdd Zejdd Zejdddeddgddgdddgdfddeddgddgdddgdfd	deg d ddejgdg d!dfd	deg d"ejddgdg d#dfddeejddgg d$dg d%dfddeddejgg d&dg d'dfd(ded ddejgejddd)gdg d*dfd(ded ddejgejddd)gdg d*dfgd+d, Zd-d. Zd/d0 Zejd1d2d3gd4d5 Z d6d7 Z!d8d9 Z"d:d; Z#d<d= Z$d>d? Z%d@dA Z&dBdC Z'dDdE Z(dFdG Z)dHdI Z*ejdJddgdKdL Z+G dMdN dNZ,dS )O    )datetimeN)
MergeError)	DataFrameIndex
MultiIndex
date_rangeperiod_range)concatc                   C   s*   t tdddtdtdddddS )	N         Zabcde2000Y)startfreqperiodsdatacolumnsindex)r   npZarangeZreshapelistr    r   r   [/var/www/html/lang_env/lib/python3.10/site-packages/pandas/tests/frame/methods/test_join.pyframe_with_period_index   s
   r   c                   C      t dg dig ddS )Nar
   
   r         r   r   r   r   r   r   r   left      r$   c                   C   r   )Nb,  d         r!   r    r"   r#   r   r   r   r   right"   r%   r-   c                   C   s   t g dg ddtddS )Nr   r&   cdcatdogweaselhorser   r&   r   r"   )r   ranger   r   r   r   left_no_dup'   s   r8   c                   C   s$   t g dg ddtdddS )N)r   r&   r/   r0   e)meowbarkum... weasel noise?ZnayZchirpr   r/   r   r"   r   )r   r7   	set_indexr   r   r   r   right_no_dup/   s   r?   c                 C   s$   t | tdgdgddgdgddS )Nr   cowr6   r,   r"   T)sort)r	   r   )r8   r   r   r   left_w_dups:   s   rB   c                 C   s&   t | tdgdgddgdgdS )Nr9   moor=   r,   r"   r   )r	   r   r>   )r?   r   r   r   right_w_dupsA   s
   rD   zhow, sort, expectedinnerFr
   r   r*   r)   r6   r    r!   r"   Tr   r   r   r   r
   )r   r!   r    r'   r+   r)   r*   r(   r!   r    r,   outerr(   )r   r!   r    r,   c                 C   s"   | j |||dd}t|| d S )N1:1)howrA   validate)jointmassert_frame_equal)r$   r-   rK   rA   expectedresultr   r   r   	test_joinH   s   ,rR   c                  C   sb  t dg di} t g dg dd}t g dg dd}d}tjt|d | j|gd	d
 W d    n1 s:w   Y  tjt|d | j||gdd W d    n1 sZw   Y  tjt|d | j||gd	dd W d    n1 s{w   Y  tjtdd | ||g W d    n1 sw   Y  | |g}| |}t|| d S )Nkey)r!   r    r,   r   r   )r!      r,   r    r   )rS   v1)r   r    r,   r   r!   )keysv2z7Suffixes not supported when joining multiple DataFramesmatchy)lsuffixx)rsuffixr[   r]   zIndexes have overlapping values)r   pytestraises
ValueErrorrM   rN   rO   )firstsecondthirdmsgZ
arr_joinedZnorm_joinedr   r   r   test_suffix_on_list_joinx   s&   
rf   c                 C   sH   d}t jt|d | j|ddd W d    d S 1 sw   Y  d S )Nz"invalid" is not a valid argument. Valid arguments are:
- "1:1"
- "1:m"
- "m:1"
- "m:m"
- "one_to_one"
- "one_to_many"
- "many_to_one"
- "many_to_many"rX   r   invalidonrL   )r_   r`   ra   merge)r8   r?   re   r   r   r   test_join_invalid_validate   s
   "rk   dtypeobjectstring[pyarrow]c                 C   s   |dkr	t d | |} |j||_| j|ddd d}t jt|d | j|ddd W d    d S 1 s:w   Y  d S )	Nrn   Zpyarrowr   one_to_manyrh   zBMerge keys are not unique in right dataset; not a one-to-one mergerX   
one_to_one)r_   ZimportorskipZastyper   rM   r`   r   )r8   rD   rl   re   r   r   r   $test_join_on_single_col_dup_on_right   s"   

"rq   c                 C   sX   | j |ddd d}tjt|d | j |ddd W d    d S 1 s%w   Y  d S )Nr   many_to_onerh   zAMerge keys are not unique in left dataset; not a one-to-one mergerX   rp   rM   r_   r`   r   )rB   r?   re   r   r   r   #test_join_on_single_col_dup_on_left   s   "rt   c                 C   s   | j |ddd d}tjt|d | j |ddd W d    n1 s$w   Y  d}tjt|d | j |ddd W d    d S 1 sFw   Y  d S )	Nr   Zmany_to_manyrh   zCMerge keys are not unique in right dataset; not a many-to-one mergerX   rr   zBMerge keys are not unique in left dataset; not a one-to-many mergero   rs   )rB   rD   re   r   r   r   #test_join_on_single_col_dup_on_both   s"   "ru   c                  C   s   t g dg dg ddtddddg} t g d	g d
g ddtddddg}t g d	g d
g dg ddtddddg}| j|ddd}t|| d S )N)r   r   r&   r&   )r   r!   r   r!   r1   r   r&   r/   r   r"   r   r&   )r   r   r&   )r   r!   r   )r:   r;   r<   )r   r&   r0   r,   )r2   r3   r4   r.   rE   rJ   )rK   rL   )r   r7   r>   rM   rN   rO   )r$   r-   Zexpected_multirQ   r   r   r    test_join_on_multi_col_check_dup   s<   
	
	
rw   c              	   C   s  | j | jd d ddgf }| j | jdd  ddgf jd d d }||}t|j|j tg d}t|j| |j|d	d
}t|j|j t|j| |j|dd
}t|j|j t|j| |j|dd
}t|j|jdd  t|j| |j|dd
}t|j| j  t|j| t	j
tdd |j|dd
 W d    n1 sw   Y  d}dD ] }t	j
t|d | j| |d
 W d    n1 sw   Y  qd S )Nr   ABr   CD)rx   ry   rz   r{   r$   rK   r-   rE   rI   zjoin methodrX   Zfoozcolumns overlap but no suffix)rI   r$   rE   )locr   ZilocrM   rN   assert_index_equalr   r   Zsort_valuesr_   r`   ra   )float_frameff2joinedZexpected_columnsre   rK   r   r   r   test_join_index  s8   (
r   c                 C   s   | j d d ddgf }| j d d dddgf }| }| d d d d |d< | d d d d |d< ||}t|| |j|dd}t||d d d  |j|dd}t||j d d |jf  d S )Nrx   ry   r    rz   r{   r-   r}   )r~   copyrM   rN   rO   r   )r   afbfrP   rQ   r   r   r   test_join_index_more1  s   
 r   c                 C   sr   |   }|| jd }||}t||  d |_tjt	dd || W d    d S 1 s2w   Y  d S )Nr|   zmust have a namerX   )
r   popr   rM   rN   rO   namer_   r`   ra   )r   dfZserr   r   r   r   test_join_index_seriesC  s   
"r   c                 C   s   | j d d g df }| j d d g df }|j|ddd}|j d d ddgf d}|j d d ddgf d}| j d d dd	gf }|||}t||j d d |jf  d S )
N)rx   ry   rz   )ry   rz   r{   Z_df1Z_df2r^   ry   rz   rx   r{   )r~   rM   Z
add_suffixrN   rO   r   )r   df1df2r   Zdf1_sufZdf2_sufZ
no_overlaprP   r   r   r   test_join_overlapO  s    r   c                 C   s^   | j dd d}tj| jgd dd}| j|j}| |}t||| jd}t	
|| d S )Nc                 S   s   |  |  S )Nr   )rS   r   r   r   <lambda>_  s    z(test_join_period_index.<locals>.<lambda>r   r    r!   )Zaxisr   )renamer   Zconcatenatevaluesr   appendrM   r   r   rN   rO   )r   otherZjoined_valuesZjoined_colsr   rP   r   r   r   test_join_period_index^  s   
r   c                  C   s   t dg dig dd} t dg dig dd}t dg d	ig d
d}| j||gdd}t g dtjdddgtjddtjgdg dd}t|| d S )Nr   rF   rH   r"   r&   rG   )r   r,   r    r/   )    iX  )r    r    r   r$   r}   )r   r   r   r
   r(   r*   r   r   rv   )r!   r    r    r,   )r   rM   r   nanrN   rO   )r   r   df3r   rP   r   r   r   (test_join_left_sequence_non_unique_indexm  s   	r   c                 C   s6   | j  }| j| ddg g}||}t||  d S )Nrz   r{   )rx   Zto_framery   rM   rN   rO   )r   r$   r-   rQ   r   r   r   test_join_list_series  s   

r   sort_kwc                 C   s   t dddgiddgd}t ddd	gid
dgd}t dddgidd
gd}t dtdddddtddddtddd}| du rJ|jg dd}td  |j||gd| d}W d    n1 sdw   Y  t|| d S )Ncol1r!   r    r/   r   r"   col2r   r   r&   col3   rT          @r         ?rv   g      @g      @g      @g       @r   r   r   F)r/   r   r&   rI   )rK   rA   )r   floatreindexrN   Zassert_produces_warningrM   rO   )r   r   r&   r/   rP   rQ   r   r   r   )test_suppress_future_warning_with_sort_kw  s   r   c                   @   sD   e Zd Zdd Zdd Zdd Zdd Zd	d
 Zdd Zdd Z	dS )TestDataFrameJoinc                 C   s   |}|j |jd d dgf }|j |jdd  ddgf }|j|dd|j}| j }tj|t|j< t	||j|j
d}t|j rKJ t|| d S )	Nr   rx   r    ry   rz   rI   r}   r   r   )r~   r   rM   r   r   r   r   r   isnanr   r   allrN   rO   )selfZ multiindex_dataframe_random_dataframer   r&   r   rP   r   r   r   rR     s   zTestDataFrameJoin.test_joinc                 C   sp   t ddgddgddgd}t ddgddgddgd}|ddg}|ddg}dD ]	}|j||d q,d S )	Nr!   r    )r   r&   r\   )r   r&   rZ   r   r&   )r$   r-   rI   r}   )r   r>   rM   )r   r   r   rK   r   r   r   test_join_segfault  s   z$TestDataFrameJoin.test_join_segfaultc                 C   sr   ddg}t dddt dddg}t|tddgd}td	dgd
dgg||d}|j|dd}t|jd
ks7J d S )NZ20120209Z20120222i  r    	      Zaar   r!   r,   r   ri   )r   r   r7   rM   lenr   )r   Z	str_datesZdt_datesrx   rz   Ztstr   r   r   test_join_str_datetime  s   z(TestDataFrameJoin.test_join_str_datetimec                 C   s  t g dg dg dg dg dg dg dg dg d	g	g d
dddg}t ddgddggddgddg}t ddgddgddgddgddgddgdtjgdtjgdtjgg	|jddgd}t|j|dd| t|j|d d|ddg  tj	ddgg d!gddgd"}t ddgddgddgddgddgddgg|ddgd}t|j|d d| t|j|dd|ddg  d S )#N)r   r\   R
1?)r   rZ   ?)r   z<+J	?)r&   r\   4ֿ)r&   rZ   ^9S?)r&   r   ?)r/   r\   r!   )r/   rZ   r    )r/   r   r,   )rb   rc   value1r   rb   rc   r   r   r&   r
   Zvalue2r   r   r   r   r   r   r   r   g      @r   r   r$   r}   r-   )r\   rZ   r   names)
r   r>   r   r   r   rN   rO   rM   r   Zfrom_product)r   r   r   expZexp_idxr   r   r   test_join_multiindex_leftright  sd   
"z0TestDataFrameJoin.test_join_multiindex_leftrightc                 C   s   t ddd }tjd|fgddgd}tddgi|d}tjd|fgddgd}td	dgi|d}tjd|fgddgd}td
dgi|d}|||g}tjd|fgddgd}	tdgdgdgd|	d}
t||
 d S )Ni  r!   r   Zindex_0dater   r   r"   r   r   r   )	pd	Timestampr   r   from_tuplesr   rM   rN   Zassert_equal)r   r   Z	df1_indexr   Z	df2_indexr   Z	df3_indexr   rQ   Zexpected_indexrP   r   r   r   test_join_multiindex_dates  s   z,TestDataFrameJoin.test_join_multiindex_datesc                 C   s   t ddgddgddggd}tdd	g}t |dd
gddggd}tjtdd tj||dd W d    n1 s;w   Y  tjtdd |j|dd W d    d S 1 sZw   Y  d S )Nr   r&   r!      r   r   )r   r   )r    )r/   c1!   ,   z-Not allowed to merge between different levelsrX   r   )	r   r   r   r_   r`   r   r   rj   rM   )r   r   r   r   r   r   r   'test_merge_join_different_levels_raises  s   "z9TestDataFrameJoin.test_merge_join_different_levels_raisesc                 C   s   t tdtdddddd}t tdtdd	d
ddtd	dd}|j|dd}|j|j}t	|j| |jj
jdks@J d S )N)   r,   z2012-11-15 00:00:00r   Z100msz
US/Central)r   r   tzr"   )r,   r,   r,   Z250msr   rI   r}   )r   r   Zzerosr   r7   rM   r   unionrN   r   r   zone)r   Ztest1Ztest2rQ   rP   r   r   r   test_frame_join_tzaware-  s"   z)TestDataFrameJoin.test_frame_join_tzawareN)
__name__
__module____qualname__rR   r   r   r   r   r   r   r   r   r   r   r     s    
<r   )-r   numpyr   r_   Zpandas.errorsr   Zpandasr   r   r   r   r   r   Zpandas._testingZ_testingrN   Zpandas.core.reshape.concatr	   Zfixturer   r$   r-   r8   r?   rB   rD   markZparametrizer   rR   rf   rk   rq   rt   ru   rw   r   r   r   r   r   r   r   r   r   r   r   r   r   <module>   s    







""    	
+
$)	
