a
    Pfy                     @   s   d dl Zd dlZd dlm  mZ d dlZd dlm	Z	m
Z
mZmZmZmZmZ d dlmZ d dlmZ d dlmZ ejdd Zejdd Zejd	d
 Zejdd Zejdd ZG dd dZG dd dZdS )    N)	DataFrameIndex
MultiIndex
RangeIndexSeries	Timestampoption_context)concat)mergec                  C   s6   g d} g d}t jdt| }t| ||dS )z=left dataframe (not multi-indexed) for multi-index join tests)
barr   r   foor   bazr   quxr   Zsnap)
twoonethreer   r   r   r   r   r   r      key1key2data)nprandomdefault_rngstandard_normallenr   r    r   ^/var/www/ai-form-bot/venv/lib/python3.9/site-packages/pandas/tests/reshape/merge/test_multi.pyleft   s    r   c                 C   s   | }ddg|j _g d|_|S )z:right dataframe (multi-indexed) for multi-index join testsr   r   )Zj_oneZj_twoZj_three)indexnamescolumns)Z multiindex_dataframe_random_datadfr   r   r   right    s    
r#   c                   C   s:   t g dg dg dg dg ddg ddg dS )	N)Ar$   Br%   C)r$   r%   r$   r&   r$   )AMr'   IPr'   OP)hbwnhbZhbor+   r*   )i  i?  i	  i  i\  )OriginDestinationPeriodTripPurpZTripsr!   )r,   r-   r.   r/   r   	set_indexr   r   r   r   
left_multi*   s    	r3   c                   C   s:   t g dg dg dg dg ddg ddg dS )	N)r$   r$   r%   r%   r&   r&   E)r$   r%   r$   r%   r$   r%   F)r'   r'   r(   r'   r)   r(   r'   )abcr7   r6   r7   r6   )d   P   Z   r:   K   #   7   )r,   r-   r.   LinkTypeZDistancer0   )r,   r-   r.   r?   r1   r   r   r   r   right_multi8   s    	r@   c                   C   s   g dS )N)r,   r-   r.   r   r   r   r   r   on_cols_multiF   s    rA   c                	   @   s.  e Zd Zdd Zejddejde	ddgejdddgd	d
 Z
ejdddgdd Zdd Zdd Zdd Zdd Zdd Zdd Zdd Zejddejeegdd Zejdd d!gd"d# Zejd$d% Zejd&d' Zejd(d) Zd*d+ Zd,d- Zd.d/ Zd0d1 Z d2d3 Z!dS )4TestMergeMultic                 C   s   ddg}|j |||djdd}t|| ||d}t|| |j |||ddjdd}t|| ||dd}t|| d S )Nr   r   onhowT)droprD   rE   sort)joinreset_indexr
   tmassert_frame_equal)selfr   r#   	join_typeon_colsresultexpectedr   r   r   test_merge_on_multikeyL   s    z%TestMergeMulti.test_merge_on_multikeyinfer_stringFTZpyarrow)ZmarksrH   c                    s  t d| g ddd   fdd}tttttdtdd	 }ttj	d

|dddgd}|d	dtj	d
ddt|d tj	d
t|}|j|  } ||d<  | |d< |jdd |||| tj|jd	d ddf< tj|jd
d ddf< tj|jdd ddf<  ||d< tj	d
t|}|j|d df } | |d< |jdd |||| W d    n1 s0    Y  d S )Nzfuture.infer_string)1st2nd3rdc                    sB   dd   fdd}|| d || d d  | d  dd	  S )
Nc                 S   s   | | krdS t | S )Nr   )ord)r6   r   r   r   <lambda>g       zNTestMergeMulti.test_left_join_multi_index.<locals>.bind_cols.<locals>.<lambda>c                    s   |   td S )Nr6   )maprW   )tsZiordr   r   rX   h   rY   rT   rV   g      Y@rU   r   
   )fillna)r"   fr   r\   r   	bind_colsf   s    z<TestMergeMulti.test_left_join_multi_index.<locals>.bind_colsc                    s   | j |d|d}t| t|d k s*J |d   r>J |d   rRJ tj|d |d  dd  |jd d d df }tj|d |dd |jd u sJ |rt||j	d	d
 t
| | |dd}tt||_t|| d S )Nr   rG      4th5thF)Zcheck_names	mergesortkind)rD   rH   rE   )rI   r   ZisnaanyrK   Zassert_series_equalilocnamerL   sort_valuesr
   rJ   r   r   )r   r#   rH   resrP   outr`   Zicolsr   r   run_assertsk   s    z>TestMergeMulti.test_left_join_multi_index.<locals>.run_assertsr6   zra   r   )2   r   rT   rV   r0   rU   r   r]   floatrb   rc   T)inplace            )r   listrZ   chrr   arangerW   r   r   r   choiceinsertZintegersr   ZastypeZpermutationri   copyr2   nanloc)rM   rH   rS   ro   lcr   ir#   r   rn   r   test_left_join_multi_index^   s8    "z)TestMergeMulti.test_left_join_multi_indexc                 C   sJ   ddg}|j ||dd|d}|j ||dd|d}||j }t|| d S )Nr   r   Tr   )Zleft_onZright_indexrE   rH   r#   )Zright_onZ
left_indexrE   rH   )r
   r!   rK   rL   )rM   r   r#   rH   rO   Zmerged_left_rightZmerge_right_leftr   r   r   test_merge_right_vs_left   s    


z'TestMergeMulti.test_merge_right_vs_leftc                 C   s   t tdtjddgg dgddgddd	}ttd
g ddd}t|| ddgd}ttd
g ddgd tdd}t	|| d S )Nrw   r$   r%   ra   r   rv   lev1lev2r    Amount)rj   ZAAABBB)ra   r   rv   ra   r   rv   r   )r   r   colrD   )r   r   r   r   )
r   ranger   from_productr   ry   r
   rJ   rK   rL   )rM   sr"   rP   rQ   r   r   r   .test_merge_multiple_cols_with_mixed_cols_index   s    z=TestMergeMulti.test_merge_multiple_cols_with_mixed_cols_indexc                 C   s   dd t dD }t|d}|d d d }t||tjddd}t|d d d |d d d tjddd}t||d	d
 d S )Nc                 S   s   g | ]}t |qS r   )str).0r   r   r   r   
<listcomp>   rY   zCTestMergeMulti.test_compress_group_combinations.<locals>.<listcomp>i'  r   rx   i N  )r   r   Zvalue1)r   r   Zvalue2outerrE   )r   r   Ztiler   r   r   r   r
   )rM   r   r   r"   Zdf2r   r   r    test_compress_group_combinations   s     	z/TestMergeMulti.test_compress_group_combinationsc                 C   s  ddg}t g dd ddgd tjtdtjd	d
}tddg}t dddgi|d}|j||d}| }tj	|d< d|j
|jdk|jdk@ df< d|j
|jdk|jdk@ df< t|| |j|ddd |j||dd}t|| t g dd ddgd tjg dd tjd	tjtdtjd	d}tddg}t dddgi|d}|j||d}| }tj	|d< d|j
|jdk|jdk@ df< d|j
|jdk|jdk@ df< t|| |j|dd}|j||dd}t|| d S )Nk1k2)r   ra   r      r   r         Zdtype)r   r   v)r   r   )ra   r   v2ru      r   r   r   ra   re   T)rg   rs   )rD   rH   )r   r   Zk3r   rf   )r   r   arrayr{   Zint64r   from_tuplesrI   r~   r   r   r   r   rK   rL   rk   Zfloat32int32)rM   rO   r   r   r#   rP   rQ   r   r   r   #test_left_join_index_preserve_order   sH    




	
z2TestMergeMulti.test_left_join_index_preserve_orderc                 C   s  t g dg dg dg dg dg dg dg dg d	g d
g
g dg dd}t g dg dg dg dg dg dg dg dg dg dg dg dg dg dgg ddg d}|j|g dd d!}t g d"g d#d$d%d&d'tjgg d(g d)g d*d+d%d,d-tjgg d.g d/g d0g d1g d2g d3g d4gg d5g d6d}t|| |j|g dd d7d8}|jg dd9d:}t|| d S );N)XYr&   r6   )Wr   r&   e)VQr$   h)r   RDr   )r   r   r   r7   )r   r   r$   r8   )r   r   r%   r_   )r   r   r&   g)r   r   r&   j)r   r   r%   d)colacolbcolctag)
rv   r   r   ra   r   rw   rt   ru   	   r   r!   r   )r   r   r&   r   )r   r   r%   rv   )r   r   r%   r   )r   r   r$   ra   )r   r   r$   rt   )r   r   r%   ru   )r   r   r&   rw   )r   r   r&   r   )r   r   r&   i)r   r   r&   i)r   r   r&   r   )r   r   r   r   )r   r   r   rx   )r   r   r$   )col1col2col3valr0   )r   r   r   )r   r   r   r   rC   )r   r   r&   r6   rw   )r   r   r&   r6   r   r   r   r&   r   )r   r   r$   r   r   )r   r   r   r   r   )r   r   r   r   rx   r   r   r7   )r   r   r$   r8   ra   )r   r   r$   r8   rt   )r   r   r%   r_   rv   )r   r   r%   r_   r   )r   r   r&   r   r   )r   r   r&   r   r   )r   r   r%   r   ru   )r   r   r   r   r   )rv   rv   r   r   ra   ra   r   rw   rw   rt   rt   ru   r   r   TrG   re   rf   )r   r2   rI   r   r   rK   rL   rk   )rM   r   r#   rP   rQ   r   r   r   +test_left_join_index_multi_match_multiindex  sv    z:TestMergeMulti.test_left_join_index_multi_match_multiindexc                 C   s<  t ddgddgddgddggdd	gg d
d}t ddgddgddgddgddgddgddgddggddgdd}|j|ddd}t g dg dg dg dddtjgg dg dddtjggg d g d!d}t|| |j|ddd"d#}|jdd$d%}t|| t||	 ddd&}t
t||_t|| d S )'Nr8   r   r7   ra   r6   r   rv   r   r   )r   r   ra   rv   r   r   wxr   yrp   rr   qr   charr0   r   rC   )r8   r   r   )r8   r   r   )r8   r   r   )r8   r   r   )r6   r   r   )r6   r   rp   )r   r   r   )r   r   r   r   r   ra   ra   rv   TrG   re   rf   rE   rD   )r   r2   rI   r   r   rK   rL   rk   r
   rJ   r   r   r   )rM   r   r#   rP   rQ   Z	expected2r   r   r    test_left_join_index_multi_matchX  sP    



z/TestMergeMulti.test_left_join_index_multi_matchc                 C   s   t tdtjddtjddtdtjdddg dd}t ddtjtjtjgdd	tjtjtjgd
}t||ddd}|jdgdd}|	|}t
|| d S )NZabcder   ru   )idZv1r   dummyZv3r0   r6   r7   gX9v?gʡE@)r   Zsv3r   r   rC   ra   )axis)r   ry   r   r   r   r   r   r
   rF   rI   rK   rL   )rM   r   r#   rP   ZrdfrQ   r   r   r   test_left_merge_na_buglet  s$    

z(TestMergeMulti.test_left_merge_na_bugletc              
   C   s   g dg dg dddt jgg dg dddt jgg d	g d
g	}t|g dd}ddt jgddt jgddt jgddt jgddt jgddt jgg}t|g dd}|j|dd}|dj|ddd}|dt j}t|| d S )N)  r$         ?)r   r%   r   )  r%   r   i  r%   )  r%         @)r   r&   r   r&   )  r&   g      @)r   r&   r   )yearpanelr   r0   r$   r   r   r   r   r   i)r   r   r   r
   r^   replacerK   rL   )rM   r   frameZ
other_dataotherrP   rQ   r   r   r   test_merge_na_keys  s.    







z!TestMergeMulti.test_merge_na_keysklassNc                 C   s   t g dg ddgd}t|j|_|jj}|d ur>||}tjg dtjd}t g d|d}|j|d|gdd	}t	
|| t |g dg dd
}|j||jjgdd	}t	
|| d S Nr   )z
2016-01-01z
2017-01-01z
2018-01-01r6   r0   )i  i  i  r   )r6   Zkey_1innerrC   )Zkey_0a_xZa_yr   pdto_datetimer   r   r   r   r   r
   rK   rL   )rM   r   r"   	on_vector	exp_yearsrQ   rP   r   r   r   test_merge_datetime_index  s    z(TestMergeMulti.test_merge_datetime_index
merge_typer   r#   c                 C   s2  t dddgitjtddgtddggddgd	d
}t tjg ddgd	dgd}tjtddgtddggddgd	}|dkrt ddgtjtjtjgtdd|d
}|j|dddgd}|j	|dd}nJt tjtjtjgtdddgd|d
}|j|dddgd}|j	|dd}t
|| t
|| d S )Nr   r   z
1950-01-01r$   z
1950-01-02r%   dater   r   )r   r   state)r   r!   r   r   )r   r   r   r   )r   r   r#   )r   r   r   r   r   r   r   objectr
   rI   rK   rL   )rM   r   r   r#   Zexpected_indexrQ   Zresults_mergeZresults_joinr   r   r   (test_merge_datetime_multi_index_empty_df  sD    
z7TestMergeMulti.test_merge_datetime_multi_index_empty_dfc                 C   s.   t g dg dg ddg ddd}|S )Nr   )r   ra   r   )ffffAPAi^ )household_idmalewealthr0   r   r1   )rM   	householdr   r   r   r     s    zTestMergeMulti.householdc              
   C   sP   t g dddddddtjgddd	d	d
dtjgg ddg ddddg}|S )Nra   r   r   rv   rv   rv   rt   nl0000301109nl0000289783gb00b03mlx29lu0197800237nl0000289965ABN AmroRobecoRoyal Dutch ShellAAB Eastern Europe Equity FundPostbank BioTech Fonds      ?皙?333333?333333?r         ?r   )r   asset_idrj   sharer0   r   r   )r   r   r   r2   )rM   	portfolior   r   r   r     s2    
	zTestMergeMulti.portfolioc                 C   sH   t g dg dg dg dg dg dddd	gjg d
d}|S )N)r   ra   ra   r   r   r   )r   r   r       xAr   r   )r   r   r   r   r   r   )r   r   r   r   r   r   )ra   r   r   rv   rv   rv   )r   r   r   r   r   r   )r   r   rj   r   r   r   r   r   )r   r   rj   r   r0   )r   r2   reindex)rM   rQ   r   r   r   rQ   1  s     #zTestMergeMulti.expectedc                 C   s.   |  }|  }|j|dd}t|| d S )Nr   r   )r~   rI   rK   rL   rM   r   r   rQ   rP   r   r   r   test_join_multi_levelsX  s    z%TestMergeMulti.test_join_multi_levelsc                 C   sD   |  }|  }t| | dgddddg}t|| d S )Nr   r   rC   r   )r~   r
   rJ   r2   rK   rL   r   r   r   r   (test_join_multi_levels_merge_equivalencea  s    z7TestMergeMulti.test_join_multi_levels_merge_equivalencec                 C   sr   |  }|  }|j|dd}t|tddgitjdtjfgddgdd	gd
ddj|j	d}t
j||dd d S )Nr   r   r   r   rt   r   r   r   r   r   T)r   rH   r0   F)Zcheck_index_type)r~   rI   r	   r   r   r   r   r   r   r!   rK   rL   r   r   r   r   test_join_multi_levels_outern  s$    z+TestMergeMulti.test_join_multi_levels_outerc                 C   s   |  }|  }d|j_tjtdd |j|dd W d    n1 sJ0    Y  |  }|jddg tjtdd |j|dd W d    n1 s0    Y  d S )Nr   z+cannot join with no overlapping index names)matchr   r   r   z'columns overlap but no suffix specified)r~   r   rj   pytestZraises
ValueErrorrI   Z	set_names)rM   r   r   Z
portfolio2r   r   r   test_join_multi_levels_invalid  s    ,z-TestMergeMulti.test_join_multi_levels_invalidc              	   C   s@  t g dddddddtjgg ddg ddd	d
g}t g dg dg ddd
dg}t g dg dg dg dg ddg djddgd}t| | d
gddg d}t|| t g dg dg dg dg ddg djddgd}t| | d
gd dg d}t|| d S )!Nr   r   r   r   r   r   )r   r   r   r0   r   r   )r   r   r   r   r   )               )S緖?D >?
?HRE?)r   t
log_returnr  )r   r   r   rv   rv   rv   rv   rv   )r   r   r   r   r   r   r   r   )r  r  r	  r  r  r	  r
  r  )r   r   r   r   r   r   r   r   )r  r  r  r  r  r  r  r  )r   r   r  r   r  )r   r   r  r   r  r   rC   )r   r   r   rv   rv   rv   rv   rv   rv   ra   r   rt   )r   r   r   r   r   r   r   r   r   r   r   N)r  r  r	  r  r  r	  r
  r  NNNN)r   r   r   r   r   r   r   r   r   r   r   r   )r  r  r  r  r  r  r  r  NNNNr   )	r   r   r   r2   r   r
   rJ   rK   rL   )rM   r   r  rQ   rP   r   r   r   test_join_multi_levels2  s    	
!=>Bz&TestMergeMulti.test_join_multi_levels2)"__name__
__module____qualname__rR   r  markparametrizeparamtdZ
skip_if_nor   r   r   r   r   r   r   r   r   r   asarrayr   r   r   r   fixturer   r   rQ   r   r  r  r  r  r   r   r   r   rB   K   s<   >
6E2 

.


&	rB   c                   @   sL   e Zd Zdd Zdd Zejddej	e
egdd Zd	d
 Zdd ZdS )TestJoinMultiMultic           
      C   sz   |j j}|j j}|dkr(||| }n||| }t| | ||d| }|j||d }	t	|	| d S )Nr#   r   r   )
r   r    
differencer
   rJ   r2   
sort_indexrI   rK   rL   
rM   r3   r@   rN   rA   Z
left_namesZright_namesZlevel_orderrQ   rP   r   r   r   test_join_multi_multi4  s     z(TestJoinMultiMulti.test_join_multi_multic           
      C   s   |j |jd}|j |jd}|jj}|jj}|dkrD||| }n||| }t| | ||d| }|j	||d }	t
|	| d S )Nr0   r#   r   r   )rF   r!   r   r    r  r
   rJ   r2   r  rI   rK   rL   r   r   r   r   test_join_multi_empty_framesJ  s$    z/TestJoinMultiMulti.test_join_multi_empty_framesboxNc                 C   s   t g dg ddgd}t|j|_|jj}|d ur>||}tjg dtjd}t g d|d}|j|d|gdd	}t	
|| t |g dg dd
}|j||jjgdd	}t	
|| d S r   r   )rM   r#  r"   r   r   rQ   rP   r   r   r   r   e  s    z,TestJoinMultiMulti.test_merge_datetime_indexc                 C   s   t jg dddgd}tg dg dd|d}t jg d	dd
gd}tg dg dd|d}||}t| | dgddg d}t|| d S )N))K0ZX0)r$  ZX1)K1ZX2keyr   r   )ZA0A1A2)B0ZB1ZB2)r$   r%   r   ))r$  ZY0)r%  ZY1)K2ZY2)r*  ZY3r   )ZC0ZC1ZC2ZC3)ZD0ZD1ZD2ZD3)r&   r   r   rC   )r&  r   r   )	r   r   r   rI   r
   rJ   r2   rK   rL   )rM   Z
index_leftr   Zindex_rightr#   rP   rQ   r   r   r   test_single_common_level|  s(    
z+TestJoinMultiMulti.test_single_common_levelc                 C   s   t jddgddggddgd}t jg dddgd}t|d	g d
id}t|dg did}||}t|g d
dddtjgdd}t|| d S )Nra   r   rv   rt   r6   r7   r   ))rt   ra   )rv   r   )rv   ra   r   )r]         (   )r   r   r   )r   r   fingr/  r   r   )r   r   )	r   r   r   r   rI   r   r   rK   rL   )rM   Zmidx1Zmidx3r   r#   rP   rQ   r   r   r   test_join_multi_wrong_order  s    
z.TestJoinMultiMulti.test_join_multi_wrong_order)r  r  r  r!  r"  r  r  r  r   r  r   r   r   r+  r0  r   r   r   r   r  3  s   
r  )numpyr   r  Zpandas.util._test_decoratorsutilZ_test_decoratorsr  Zpandasr   r   r   r   r   r   r   r   Zpandas._testingZ_testingrK   Zpandas.core.reshape.concatr	   Zpandas.core.reshape.merger
   r  r   r#   r3   r@   rA   rB   r  r   r   r   r   <module>   s0   $	


	


     m