a
    PfsD                     @   s  d dl m Z  d dlZd dlZd dlmZ d dlZd dlmZm	Z	m
Z
mZmZ d dlmZ d dlmZ ejdd Zejdd	 Zejd
d Zejdd Zejdd Zejdd Zejdd Zejdddeddgddgdddgdfddeddgddgdddgdfd	deg d ddejgdg d!dfd	deg d"ejddgdg d#dfddeejddgg d$dg d%dfddeddejgg d&dg d'dfd(ded ddejgejddd)gdg d*dfd(ded ddejgejddd)gdg d*dfgd+d, Zd-d. Zd/d0 Zejd1d2d3gd4d5 Z d6d7 Z!d8d9 Z"d:d; Z#d<d= Z$d>d? Z%d@dA Z&dBdC Z'dDdE Z(dFdG Z)dHdI Z*ejdJddgdKdL Z+G dMdN dNZ,dS )O    )datetimeN)
MergeError)	DataFrameIndex
MultiIndex
date_rangeperiod_range)concatc                   C   s*   t tdddtdtdddddS )	N         Zabcde2000Y)startfreqperiodsdatacolumnsindex)r   npZarangeZreshapelistr    r   r   ]/var/www/ai-form-bot/venv/lib/python3.9/site-packages/pandas/tests/frame/methods/test_join.pyframe_with_period_index   s
    r   c                   C   s   t dg dig ddS )Nar
   
   r         r   r   r   r   r   r   r   left   s    r#   c                   C   s   t dg dig ddS )Nb,  d         r    r   r!   r"   r   r   r   r   right"   s    r+   c                   C   s   t g dg ddtddS )Nr   r$   cdcatdogweaselhorser   r$   r   r!   )r   ranger   r   r   r   left_no_dup'   s    r6   c                   C   s$   t g dg ddtdddS )N)r   r$   r-   r.   e)meowbarkum... weasel noise?ZnayZchirpr   r-   r   r!   r   )r   r5   	set_indexr   r   r   r   right_no_dup/   s    r=   c                 C   s$   t | tdgdgddgdgddS )Nr   cowr4   r*   r!   T)sort)r	   r   )r6   r   r   r   left_w_dups:   s    r@   c                 C   s&   t | tdgdgddgdgdS )Nr7   moor;   r*   r!   r   )r	   r   r<   )r=   r   r   r   right_w_dupsA   s
    rB   zhow, sort, expectedinnerFr
   r   r(   r'   r4   r   r    r!   Tr   r   r   r   r
   )r   r    r   r%   r)   r'   r(   r&   r    r   r*   outerr&   )r   r    r   r*   c                 C   s"   | j |||dd}t|| d S )N1:1)howr?   validate)jointmassert_frame_equal)r#   r+   rI   r?   expectedresultr   r   r   	test_joinH   s    ,rP   c                  C   sd  t dg di} t g dg dd}t g dg dd}d}tjt|d  | j|gd	d
 W d    n1 st0    Y  tjt|d" | j||gdd W d    n1 s0    Y  tjt|d$ | j||gd	dd W d    n1 s0    Y  tjtdd | ||g W d    n1 s40    Y  | |g}| |}t|| d S )Nkey)r    r   r*   r   r   )r       r*   r   r   )rQ   Zv1)r   r   r*   r   r    )keysZv2z7Suffixes not supported when joining multiple DataFramesmatchy)lsuffixx)rsuffixrW   rY   zIndexes have overlapping values)r   pytestraises
ValueErrorrK   rL   rM   )firstsecondthirdmsgZ
arr_joinedZnorm_joinedr   r   r   test_suffix_on_list_joinx   s    .02.
rb   c                 C   sF   d}t jt|d  | j|ddd W d    n1 s80    Y  d S )Nz"invalid" is not a valid argument. Valid arguments are:
- "1:1"
- "1:m"
- "m:1"
- "m:m"
- "one_to_one"
- "one_to_many"
- "many_to_one"
- "many_to_many"rT   r   invalidonrJ   )r[   r\   r]   merge)r6   r=   ra   r   r   r   test_join_invalid_validate   s    rg   dtypeobjectstring[pyarrow]c                 C   s   |dkrt d | |} |j||_| j|ddd d}t jt|d  | j|ddd W d    n1 sr0    Y  d S )	Nrj   Zpyarrowr   one_to_manyrd   zBMerge keys are not unique in right dataset; not a one-to-one mergerT   
one_to_one)r[   ZimportorskipZastyper   rK   r\   r   )r6   rB   rh   ra   r   r   r   $test_join_on_single_col_dup_on_right   s     

rm   c                 C   sV   | j |ddd d}tjt|d  | j |ddd W d    n1 sH0    Y  d S )Nr   many_to_onerd   zAMerge keys are not unique in left dataset; not a one-to-one mergerT   rl   rK   r[   r\   r   )r@   r=   ra   r   r   r   #test_join_on_single_col_dup_on_left   s    rp   c                 C   s   | j |ddd d}tjt|d  | j |ddd W d    n1 sH0    Y  d}tjt|d  | j |ddd W d    n1 s0    Y  d S )	Nr   Zmany_to_manyrd   zCMerge keys are not unique in right dataset; not a many-to-one mergerT   rn   zBMerge keys are not unique in left dataset; not a one-to-many mergerk   ro   )r@   rB   ra   r   r   r   #test_join_on_single_col_dup_on_both   s    $rq   c                  C   s   t g dg dg ddtddddg} t g d	g d
g ddtddddg}t g d	g d
g dg ddtddddg}| j|ddd}t|| d S )N)r   r   r$   r$   )r   r    r   r    r/   r   r$   r-   r   r!   r   r$   )r   r   r$   )r   r    r   )r8   r9   r:   )r   r$   r.   r*   )r0   r1   r2   r,   rC   rH   )rI   rJ   )r   r5   r<   rK   rL   rM   )r#   r+   Zexpected_multirO   r   r   r    test_join_on_multi_col_check_dup   s<    		rs   c              	   C   s  | j | jd d ddgf }| j | jdd  ddgf jd d d }||}t|j|j tg d}t|j| |j|d	d
}t|j|j t|j| |j|dd
}t|j|j t|j| |j|dd
}t|j|jdd  t|j| |j|dd
}t|j| j  t|j| t	j
tdd |j|dd
 W d    n1 sh0    Y  d}dD ]D}t	j
t|d | j| |d
 W d    n1 s0    Y  qzd S )Nr   ABr   CD)rt   ru   rv   rw   r#   rI   r+   rC   rG   zjoin methodrT   Zfoozcolumns overlap but no suffix)rG   r#   rC   )locr   ZilocrK   rL   assert_index_equalr   r   Zsort_valuesr[   r\   r]   )float_frameff2joinedZexpected_columnsra   rI   r   r   r   test_join_index  s0    (
.r   c                 C   s   | j d d ddgf }| j d d dddgf }| }| d d d d |d< | d d d d |d< ||}t|| |j|dd}t||d d d  |j|dd}t||j d d |jf  d S )Nrt   ru   r   rv   rw   r+   ry   )rz   copyrK   rL   rM   r   )r|   afbfrN   rO   r   r   r   test_join_index_more1  s    
r   c                 C   sp   |   }|| jd }||}t||  d |_tjt	dd || W d    n1 sb0    Y  d S )Nrx   zmust have a namerT   )
r   popr   rK   rL   rM   namer[   r\   r]   )r|   ZdfZserr   r   r   r   test_join_index_seriesC  s    
r   c                 C   s   | j d d g df }| j d d g df }|j|ddd}|j d d ddgf d}|j d d ddgf d}| j d d dd	gf }|||}t||j d d |jf  d S )
N)rt   ru   rv   )ru   rv   rw   Z_df1Z_df2rZ   ru   rv   rt   rw   )rz   rK   Z
add_suffixrL   rM   r   )r|   df1df2r   Zdf1_sufZdf2_sufZ
no_overlaprN   r   r   r   test_join_overlapO  s    r   c                 C   s^   | j dd d}tj| jgd dd}| j|j}| |}t||| jd}t	
|| d S )Nc                 S   s   |  |  S )Nr   )rQ   r   r   r   <lambda>_      z(test_join_period_index.<locals>.<lambda>r   r   r    )Zaxisr   )renamer   Zconcatenatevaluesr   appendrK   r   r   rL   rM   )r   otherZjoined_valuesZjoined_colsr   rN   r   r   r   test_join_period_index^  s    
r   c                  C   s   t dg dig dd} t dg dig dd}t dg d	ig d
d}| j||gdd}t g dtjdddgtjddtjgdg dd}t|| d S )Nr   rD   rF   r!   r$   rE   )r   r*   r   r-   )    iX  )r   r   r   r#   ry   )r   r   r   r
   r&   r(   r   r   rr   )r    r   r   r*   )r   rK   r   nanrL   rM   )r   r   df3r   rN   r   r   r   (test_join_left_sequence_non_unique_indexm  s    	r   c                 C   s6   | j  }| j| ddg g}||}t||  d S )Nrv   rw   )rt   Zto_frameru   rK   rL   rM   )r|   r#   r+   rO   r   r   r   test_join_list_series  s    

r   sort_kwc                 C   s   t dddgiddgd}t ddd	gid
dgd}t dddgidd
gd}t dtdddddtddddtddd}| du r|jg dd}td $ |j||gd| d}W d    n1 s0    Y  t|| d S )Ncol1r    r   r-   r   r!   col2r   r   r$   col3   rR          @r         ?rr   g      @g      @g      @g       @r   r   r   F)r-   r   r$   rG   )rI   r?   )r   floatreindexrL   Zassert_produces_warningrK   rM   )r   r   r$   r-   rN   rO   r   r   r   )test_suppress_future_warning_with_sort_kw  s    2r   c                   @   sD   e Zd Zdd Zdd Zdd Zdd Zd	d
 Zdd Zdd Z	dS )TestDataFrameJoinc                 C   s   |}|j |jd d dgf }|j |jdd  ddgf }|j|dd|j}| j }tj|t|j< t	||j|j
d}t|j rJ t|| d S )	Nr   rt   r   ru   rv   rG   ry   r   r   )rz   r   rK   r   r   r   r   r   isnanr   r   allrL   rM   )selfZ multiindex_dataframe_random_dataframer   r$   r   rN   r   r   r   rP     s    zTestDataFrameJoin.test_joinc                 C   sp   t ddgddgddgd}t ddgddgddgd}|ddg}|ddg}dD ]}|j||d qXd S )	Nr    r   )r   r$   rX   )r   r$   rV   r   r$   )r#   r+   rG   ry   )r   r<   rK   )r   r   r   rI   r   r   r   test_join_segfault  s    z$TestDataFrameJoin.test_join_segfaultc                 C   sr   ddg}t dddt dddg}t|tddgd}td	dgd
dgg||d}|j|dd}t|jd
ksnJ d S )NZ20120209Z20120222i  r   	      Zaar   r    r*   r   re   )r   r   r5   rK   lenr   )r   Z	str_datesZdt_datesrt   rv   Ztstr   r   r   test_join_str_datetime  s    z(TestDataFrameJoin.test_join_str_datetimec                 C   s  t g dg dg dg dg dg dg dg dg d	g	g d
dddg}t ddgddggddgddg}t ddgddgddgddgddgddgdtjgdtjgdtjgg	|jddgd}t|j|dd| t|j|d d|ddg  tj	ddgg d!gddgd"}t ddgddgddgddgddgddgg|ddgd}t|j|d d| t|j|dd|ddg  d S )#N)r   rX   R
1?)r   rV   ?)r   z<+J	?)r$   rX   4ֿ)r$   rV   ^9S?)r$   r   ?)r-   rX   r    )r-   rV   r   )r-   r   r*   )r^   r_   value1r   r^   r_   r   r   r$   r
   Zvalue2r   r   r   r   r   r   r   r   g      @r   r   r#   ry   r+   )rX   rV   r   names)
r   r<   r   r   r   rL   rM   rK   r   Zfrom_product)r   r   r   expZexp_idxr   r   r   test_join_multiindex_leftright  sd    z0TestDataFrameJoin.test_join_multiindex_leftrightc                 C   s   t ddd }tjd|fgddgd}tddgi|d}tjd|fgddgd}td	dgi|d}tjd|fgddgd}td
dgi|d}|||g}tjd|fgddgd}	tdgdgdgd|	d}
t||
 d S )Ni  r    r   Zindex_0dater   r   r!   r   r   r   )	pd	Timestampr   r   from_tuplesr   rK   rL   Zassert_equal)r   r   Z	df1_indexr   Z	df2_indexr   Z	df3_indexr   rO   Zexpected_indexrN   r   r   r   test_join_multiindex_dates  s    z,TestDataFrameJoin.test_join_multiindex_datesc                 C   s   t ddgddgddggd}tdd	g}t |dd
gddggd}tjtdd  tj||dd W d    n1 sv0    Y  tjtdd |j|dd W d    n1 s0    Y  d S )Nr   r$   r       r   r   )r   r   )r    )r-   c1!   ,   z-Not allowed to merge between different levelsrT   r   )	r   r   r   r[   r\   r   r   rf   rK   )r   r   r   r   r   r   r   'test_merge_join_different_levels_raises  s    .z9TestDataFrameJoin.test_merge_join_different_levels_raisesc                 C   s   t tdtdddddd}t tdtdd	d
ddtd	dd}|j|dd}|j|j}t	|j| |jj
jdksJ d S )N)   r*   z2012-11-15 00:00:00r   Z100msz
US/Central)r   r   tzr!   )r*   r*   r*   Z250msr   rG   ry   )r   r   Zzerosr   r5   rK   r   unionrL   r{   r   zone)r   Ztest1Ztest2rO   rN   r   r   r   test_frame_join_tzaware-  s"    z)TestDataFrameJoin.test_frame_join_tzawareN)
__name__
__module____qualname__rP   r   r   r   r   r   r   r   r   r   r   r     s   
<r   )-r   numpyr   r[   Zpandas.errorsr   Zpandasr   r   r   r   r   r   Zpandas._testingZ_testingrL   Zpandas.core.reshape.concatr	   Zfixturer   r#   r+   r6   r=   r@   rB   markZparametrizer   rP   rb   rg   rm   rp   rq   rs   r   r   r   r   r   r   r   r   r   r   r   r   r   <module>   s   







""    	+

$)	
