o
    ҷh                    @   sV  d dl mZm Z mZ d dlZd dlZd dlZd dlmZ d dl	m
Z
 d dlZd dlmZmZmZmZmZmZmZmZmZmZmZ d dlmZ d dlm
Z d dlmZ d dlm Z m!Z! dd
dZ"dd Z#dd Z$ej%e# dd ddd Z&ej%e# dd ddd Z'ej%e$ dd ddd Z(ej%dd Z)G dd dZ*dd  Z+G d!d" d"Z,ej%d#d$ Z-ej%d%d& Z.G d'd( d(Z/ej%d)d* Z0ej%d+d, Z1G d-d. d.Z2ej3j4d/d0d1 ej5D ed2d3gd2d3gd4d5ed d6d4d7ed8d9gd4d:g d;d d<d=d> Z6ej34d?d@dAgdddBdBd3fdCdd@dAgddBdDd3fddd@dAgdDdBd3fd@dAgdddBdBdfdEdd@dAgddBdDdfddd@dAgdDdBdfgdFdG Z7dHdI Z8ej34dJd d dKdLidMdNgfd d dKdOid dNgfd d dKdPidQdRgfd d dKdSdTgidQdRgfdUd dKdVidUd gfdWdWdKdXidYdWgfdZdZdKdVidZd[gfdUdUdKdXid\dUgfdUdZdKdXidUdZgfdUdUdKd]idUd\gfd d dKd^id_d gfdUdUi d\d`gfd d i dQdRgfgdadb Z9ej34dcd&eg dddedfej:gg dgdhfd@eg didedfdjej:gdkdlej:dmgdhfgdndo Z;ej34dpg dqdrds Z<ej34dKd$d&hd d dtgdudv Z=ej34dwdxdUdUe>dUdyfgdzd{ Z?ej34d|d}d~gej34ddDdBgdd Z@dd ZAdd ZBdd ZCdd ZDej34dddgdd ZEdd ZFej34dddgej34ddUdDdddgfdUdDdddgfgdd ZGej34dddgej34dddUiddgfddUiddgfgdd ZHej34dddgej34dddDiddDigdd ZIdd ZJdd ZKdd ZLdd ZMdd ZNdd ZOdd ZPdd ZQej34dddgdd ZRdd ZSdd ZTdd ZUej34dddgdd ZVej34dg dej34dddgddń ZWddǄ ZXddɄ ZYdd˄ ZZdS )    )datedatetime	timedeltaN)is_object_dtype)CategoricalDtype)CategoricalCategoricalIndex	DataFrameDatetimeIndexIndexIntervalIndex
MultiIndexPeriodIndex
RangeIndexSeriesTimedeltaIndex)concat)
MergeErrormerge   2   c                 C   sf   t t| }tt|||  }t||k r(tt ||d |t|   }tjd| |S )N   )	listrangenpasarraytilelenrandomdefault_rngshuffle)ngroupsnunique_groupsarr r%   X/var/www/html/venv/lib/python3.10/site-packages/pandas/tests/reshape/merge/test_merge.pyget_test_data%   s   "r'   c                   C   sT   t dgddt dgddt dgt dgt dgt tdgt tjdd	d
ggS )N   int64dtypeInt64gGz?fooT
2018-01-01
US/Easterntz)r   pd	Timestampr%   r%   r%   r&   
get_series0   s   r4   c                   C   s8   t tjgddt tjgddt tjgddt tjggS )Nr,   r*   floatobject)r   r   nanr2   NaTr%   r%   r%   r&   get_series_na<   s
   
r9   c                 C      | j jS Nr+   namexr%   r%   r&   <lambda>E       r@   )paramsidsc                 C      | j S )zV
    A parametrized fixture returning a variety of Series of different
    dtypes
    paramrequestr%   r%   r&   series_of_dtypeE      rI   c                 C   r:   r;   r<   r>   r%   r%   r&   r@   N   rA   c                 C   rD   )zk
    A duplicate of the series_of_dtype fixture, so that it can be used
    twice by a single function
    rE   rG   r%   r%   r&   series_of_dtype2N   rJ   rK   c                 C   r:   r;   r<   r>   r%   r%   r&   r@   W   rA   c                 C   rD   )zU
    A parametrized fixture returning a variety of Series with all NA
    values
    rE   rG   r%   r%   r&   series_of_dtype_all_naW   rJ   rL   c                  C   s@   t ddgddgddgd} t g dg dg dd	}| |fS )
Nr   r(   r   ab)col1col_conflictcol_left)r(   r            )r   r   r   r   r   )rO   rP   	col_rightr	   )df1df2r%   r%   r&   dfs_for_indicator`   s   rY   c                   @   s  e Zd Zejdd Zejdd Zejdd Zejdd Zd	d
 Z	dd Z
dd Zdd Zdd Zdd Zdd Zdd Zdd Zdd Zdd Zdd  Zd!d" Zd#d$ Zd%d& Zd'd( Zd)d* Zd+d, Zd-d. Zejd/g d0d1d2 Zejd3d4d4d5d4d6d7d8d4d9d8d6d:gd;d< Zd=d> Z d?d@ Z!dAdB Z"dCdD Z#dEdF Z$ejdGdHg dIfd4g dJfgejd/dKdLgdMdN Z%dOdP Z&dQdR Z'ej(dSdTdU Z)dVdW Z*dXdY Z+ejdZg d[d\d] Z,ejdZg d[d^d_ Z-d`da Z.dbdc Z/ddde Z0dfdg Z1dhdi Z2djdk Z3dldm Z4dndo Z5dpdq Z6drds Z7dtdu Z8dvdw Z9dxdy Z:dzd{ Z;d|d} Z<ejd/dLd~gejde=g de=g dfe>g de>ddde?j@e?j@e?j@gfgdd eAjBD eCDg deCDdddeEjFeEjFeEjFgfeGg dddeGddde?j@e?j@e?j@gddfeHg deHddde?j@e?j@e?j@gfdd ZIdd ZJejd/dKdLgdd ZKdd ZLdd ZMdS )	TestMergec                 C   sF   t t t tjddtjddd}||d dk }|S )Nr   r   )key1key2data1data2r\   r(   r	   r'   r   r   r   standard_normal)selfdfr%   r%   r&   rb   n   s   
zTestMerge.dfc                 C   s,   t tddtdddtjdddS )N
   )r"   rS   )r!   r"   r   )r[   r\   valuer_   ra   r%   r%   r&   rX   }   s   
zTestMerge.df2c                 C   s    t g dtjdddS )NrM   rN   cderi   rM   r      keyv1r	   r   r   r   r`   re   r%   r%   r&   left   s
   zTestMerge.leftc                 C   s"   t dtjddig ddS )Nv2r   rS   rh   rN   rg   rM   indexrn   re   r%   r%   r&   right   s   zTestMerge.rightc                 C   sP   t  }t dddgiddgdd}t||ddd}t dg idd	}t|| d S )
NrM   r(   r   r   r)   )rs   r+   T
left_indexright_indexr*   r	   r   tmassert_frame_equal)ra   df_emptydf_aresultexpectedr%   r%   r&   test_merge_inner_join_empty   s
   z%TestMerge.test_merge_inner_join_emptyc                 C   s,   t ||}t ||ddgd}t|| d S )Nr[   r\   onr   ry   rz   )ra   rb   rX   joinedexpr%   r%   r&   test_merge_common   s   
zTestMerge.test_merge_commonc                 C   sJ   t g dg dg dg dd}|t}|}t||}t|| d S )N)r(   r   r(   r   )r   r(   r   r   )r   r   r   r   )r(   r   r   rR   r   r(   r   rR   )r	   astyper5   r   ry   rz   ra   ro   rt   r~   r}   r%   r%   r&   test_merge_non_string_columns   s   

z'TestMerge.test_merge_non_string_columnsc                 C   sF   | d}| d}t||dd}t||dd d}t|| d S )Nr[   r   )	set_indexr   ry   rz   )ra   rb   rX   ro   rt   r}   r~   r%   r%   r&   test_merge_index_as_on_arg   s
   

z$TestMerge.test_merge_index_as_on_argc                 C   s   t g dtjddd}t dtjddig dd}t||d	d
ddd}t||d	d
ddd}t||jd d |j	f  t||d	d
dd
d}t||d	d
dd
d}t||jd d |j	f  d S )Nrf   r   rj   rk   rp   rS   rq   rr   rl   Tro   F)left_onrw   howsortrt   )right_onrv   r   r   )
r	   r   r   r   r`   r   ry   rz   loccolumns)ra   ro   rt   merged1merged2r%   r%   r&   (test_merge_index_singlekey_right_vs_left   s.    z2TestMerge.test_merge_index_singlekey_right_vs_leftc                 C   s   t g dtjddd}t dtjddig dd}t||d	d
dd}|j|d	dj|j }t	
|| t||d	d
dd}|j|d	dj|j }t	
||jd d |jf  d S )Nrf   r   rj   rk   rp   rS   rq   rr   rl   Tinnerr   rw   r   r   )r   rv   r   )r	   r   r   r   r`   r   joinr   rs   ry   rz   r   ra   ro   rt   r}   r~   r%   r%   r&    test_merge_index_singlekey_inner   s    z*TestMerge.test_merge_index_singlekey_innerc                 C   s  d}t jtjj|d t||dd W d    n1 sw   Y  d}t jtjj|d t||dd W d    n1 s?w   Y  d}t jtjj|d t||ddd	 W d    n1 sbw   Y  d
}t jt|d t||dgddgd W d    d S 1 sw   Y  d S )Nz&Must pass right_on or right_index=TruematchT)rv   z$Must pass left_on or left_index=True)rw   zRCan only pass argument "on" OR "left_on" and "right_on", not a combination of bothrl   )r   r   z)len\(right_on\) must equal len\(left_on\)r[   r\   r   r   )pytestraisesr2   errorsr   r   
ValueError)ra   rb   rX   ro   rt   msgr%   r%   r&   test_merge_misspecified   s"   "z!TestMerge.test_merge_misspecifiedc                 C   s   d}t jt|d t||ddddgd W d    n1 sw   Y  d}t jt|d t||dddgdd W d    n1 sCw   Y  t jt|d t||dddgddgd W d    d S 1 shw   Y  d S )	Nz>right_index parameter must be of type bool, not <class 'list'>r   ro   Fr[   r\   r   rv   rw   z=left_index parameter must be of type bool, not <class 'list'>r   r   r   r   )ra   rb   rX   r   r%   r%   r&   &test_index_and_on_parameters_confusion   s:   "z0TestMerge.test_index_and_on_parameters_confusionc                 C   sN   t ||dd}|d  d  }t||ksJ d|v sJ d|v s%J d S )Nrl   r   r   v1_xv1_y)r   value_countssumr   )ra   ro   mergedexp_lenr%   r%   r&   test_merge_overlap  s
   zTestMerge.test_merge_overlapc                 C   s   t g dg dd}t g dg dd}|j|ddd	d
d}tddddddtjgdd}t|d | tdtjdddddgdd}t|d | tddddddtjgdd}t|d | tdtjdddddgdd}t|d | d S )N)r-   barbazr-   r(   r   rR   rS   )lkeyrd   )r-   r   quxr-   )rT      rj   r   )rkeyrd   r   r   outerT)r   r   r   r   r   r   r-   r=   r   r   rR   r(   rS   value_xr   rT   r   rj   value_y)r	   r   r   r   r7   ry   assert_series_equal)ra   ro   rt   r   r   r%   r%   r&   %test_merge_different_column_key_names   s   
z/TestMerge.test_merge_different_column_key_namesc                 C   sz   t dddtdd}t dddtdd}t||d	d	d	d
}d|d< |d dk s-J d|d< |d dk s;J d S )Nr   r(   rM   rN   rc   rr   r-   r   rg   rh   Trv   rw   copyr   rM   peekaboorh   )r	   r   r   all)ra   ro   rt   r   r%   r%   r&   test_merge_copy4  s   zTestMerge.test_merge_copyc                 C   sz   t dddtdd}t dddtdd}t||d	d	d
d}t|d j|d js-J t|d j|d js;J d S )Nr   r(   r   rc   rr   r-   r   r   TFr   rM   rh   )r	   r   r   r   shares_memory_values)ra   using_array_managerro   rt   r   r%   r%   r&   test_merge_nocopy@  s
    zTestMerge.test_merge_nocopyc                 C   s   t g dttddddgd}t g dttdd	}t||dd
d}t g dtdddddddtjtjg	g ddg dd}t|| d S )Nr(   r(   r   r   rR   rT   rl   rd   rd   rl   r   r(   r(   r   rR   rS   rT   r   )rl   rvaluer   r   r   	r(   r(   r(   r(   r   r   rR   rS   rT   r   r(   r   rR   rS   )	r   r(   r   r(   r   r   rR   rS   rT   )rl   rd   r   )rd   rl   r   )	r	   r   r   r   r   arrayr7   ry   rz   )ra   ro   rt   r   r~   r%   r%   r&   "test_intelligently_handle_join_keyI  s   z,TestMerge.test_intelligently_handle_join_keyc                 C   s   t dgdgd}t dgdgd}t||dd}|d jd	ks"J t d
gdgd}t dgdgd}t||dd}|d jdksDJ t ddgi}t ddgi}tdg}tdg}t||||dd}|d jttkssJ d S )Nr(   rc   rk   r      r   r   rl   r)   TFr   boolvalr   r   r   key_0)r	   r   r+   r   r   int)ra   rW   rX   rb   r   r   r%   r%   r&   test_merge_join_key_dtype_cast\  s   z(TestMerge.test_merge_join_key_dtype_castc           	      C   s  t g dtddddgdd}t dtd	idd
}tjg ddd
}t||d|dd}t|||ddd}t|d |d  |d   sKJ |d   sUJ t dtdidgd}t dtd	i}tg d}tg d}t||||dd}t	g dt
dd}t|d | t dtdi}t dtd	i}tjg dtjd
}t||d|dd}t|d t	|dd d S )Nr   rT   r   rd   rl   r)   r   r+   r   r   r*   r   r   r   r   r   r   r<   rR   )r   r(   r(   r   r   rR   T)rv   r   r   r   )r	   r   aranger   r   ry   r   notnar   r   r   r)   )	ra   ro   rt   rl   r   r   r   r   r~   r%   r%   r&   test_handle_join_key_pass_arrays  s0   z)TestMerge.test_handle_join_key_pass_arrayc                 C   s   t  }tddgi|gd}tdddgi||gd}dd  dd  d	d
 dd
 }tjt|d t|| W d    d S 1 s@w   Y  d S )Nr?   rM   rr   yrN   rg   z>No common columns to perform merge on. Merge options: left_on=z, right_on=z, left_index=Fz, right_index=r   )r   nowr	   r   r   r   r   )ra   dtrW   rX   r   r%   r%   r&   &test_no_overlap_more_informative_error  s    "z0TestMerge.test_no_overlap_more_informative_errorc                 C   s   t ddd}t ddd}t ddd}t ddd}tddgi|gd	}td
ddgi||gd	}t|| tdg di|||gd	}td
g di||||||gd	}t|| tdddgi||gd	}td
ddgi||gd	}t|| d S )N  rT   r(   r   rR   rS   r?   rM   rr   r   rN   rg   )rM   rN   q)rg   rh   ri   fghrh   r   r	   _check_merge)ra   r   dt2dt3dt4rW   rX   r%   r%   r&   test_merge_non_unique_indexes  s   

z'TestMerge.test_merge_non_unique_indexesc                 C   sl   t ddd}t ddd}t ddd}tdg di||||gd}td	g d
i|||||gd}t|| d S )Nr   rT   r(   r   rR   r?   rM   rN   rg   rh   rr   r   )ri   r   r   z hir   )ra   r   r   r   rW   rX   r%   r%   r&   (test_merge_non_unique_index_many_to_many  s   z2TestMerge.test_merge_non_unique_index_many_to_manyc                 C   sZ   t dgdgd}t dg i}t||ddd}t|| t||ddd}t|| d S )Nr(   r   r   rl   ro   r   rt   rx   )ra   ro   rt   r}   r%   r%   r&   test_left_merge_empty_dataframe  s   z)TestMerge.test_left_merge_empty_dataframer   )r   ro   rt   r   c                 C   s:   t g |d d d}| }|j||d}t|| d S )Nr   rr   r   )r	   r   r   ry   rz   )ra   rs   r   ro   rt   r}   r%   r%   r&   test_merge_empty_dataframe  s   z$TestMerge.test_merge_empty_dataframekwargTru   r?   rv   r   rM   r   rw   r   c                 C   sR   t g dd}t g dd}t g dtd}t||fd|i|}t|| d S )NrM   rN   rg   r   r?   r   zrM   rN   rg   r?   r   r   r   r   )r	   r6   r   ry   rz   )ra   	join_typer   ro   rt   exp_inr}   r%   r%   r&   !test_merge_left_empty_right_empty  s
   z+TestMerge.test_merge_left_empty_right_emptyc                    sL  t g dd t g dg dg dgg ddt tjtjgd tdtjtjgd tdtjtjgd tdg d	g d
g ddg dd}|dd } fdd} fdd}ddddddfD ]}||| ||| qfddd}||| g d|d< ||| ddd}||| tjtjgd td|d< ||| d S )Nr   r   r(   r   rR   rS   rT   r   rj   r   	   r   rR   r*   r(   rS   rj   r   rT   r   rR   r   r   r   r   c                    H   t  fddi|}t||  t  fddi|}t||  d S )Nr   r   ro   r   r   r   r}   ro   rt   r%   r&   check1     z>TestMerge.test_merge_left_empty_right_notempty.<locals>.check1c                    r   )Nr   rt   r   r   r   r  r%   r&   check2  r  z>TestMerge.test_merge_left_empty_right_notempty.<locals>.check2Tru   r?   r   rM   r   r   r(   r   r   )r	   r   r   r7   r6   )ra   exp_outr   r  r  r   r%   r  r&   $test_merge_left_empty_right_notempty  s8   "





z.TestMerge.test_merge_left_empty_right_notemptyc              
      s   t g dg dg dgg ddt g ddt g dg dg d	tjtjgd
 tdtjtjgd
 tdtjtjgd
 tddg dddd jt_fdd  fddd S )Nr   r   r   r   r   r   r   r   r   rR   r*   r   r   c                    r   )Nr   r   rt   r   r   r  r%   r&   r  *  r  z>TestMerge.test_merge_left_notempty_right_empty.<locals>.check1c                    s   t fddi|}t||  t fddi|}t||  ddddddddd	ddd
fD ]} | | q4d S )Nr   ro   r   Tru   r?   r   rM   r   r   r   r   r  r  r   r  ro   rt   r%   r&   r  0  s   
z>TestMerge.test_merge_left_notempty_right_empty.<locals>.check2)r	   r   r   r7   r6   rs   r   re   r%   r  r&   $test_merge_left_notempty_right_empty  s    "z.TestMerge.test_merge_left_notempty_right_emptyc                 C   s|   t ||dddgd}|d d }t t|jd dt|jd dt|jd ddg dd}|j|dd}t|| d S )	Nr   rl   rd   r   r   r*   )r   rl   r   r   )r	   r   dtypesr   ry   rz   )ra   rI   rK   rb   r{   r~   actualr%   r%   r&   test_merge_empty_frame@  s   z TestMerge.test_merge_empty_framec                 C   sb   t ||dddgd}t ||dddgd}t |||dg dd}|j|dd}t|| d S )Nr   rl   rd   r   rl   r   r   r   rx   )ra   rI   rL   df_leftdf_rightr~   r  r%   r%   r&   test_merge_all_na_columnR  s"   z"TestMerge.test_merge_all_na_columnc                 C   s   t jdjddddt jdjddddtdddtddd	td
ddtdddtddd	tdd	dtddd	tdddtd
ddtdddg
d}t|}|j }t 	|}t|t jddd}|j
|ddd}t
||ddd}t|| |j |j k sJ d S )Nr   r   rc   sizer   r(      i  rS   i  rR   i  rT   )var1var2var3rj   )r  var8r  Fr   r   )r   r   r   integersr   r	   	from_dictr  uniquer   r   ry   rz   r   )ra   rh   rb   r  newr}   r   r%   r%   r&   test_merge_nosortg  s0   












 zTestMerge.test_merge_nosort)r   valuesF)r(   r(   r   r(   r(   )r   r(   r(   r(   r(   ro   rt   c                 C   s@   t dg di}|j|d||d}t |dgd}t|| d S )NrM   )r(   r   r(   )r   r   r   r   rx   )ra   r   r  r   rb   r}   r~   r%   r%   r&    test_merge_same_order_left_right  s   z*TestMerge.test_merge_same_order_left_rightc                 C   s   t ddgddgd}t dgdgd}|j|ddd}t ddd	ddd	dtjd	dtjd	ddd	d
d  g d }tj||dd d S )Nr   r(   i1i2r!  i3r!  _)r   rsuffix        r   r(   )r!  r"  i1_r$  Nr!  r"  r)  r$  F)check_dtype)r	   r   r   r7   r   reset_indexry   rz   ra   rW   rX   r}   r~   r%   r%   r&   test_merge_nan_right  s    

	
zTestMerge.test_merge_nan_rightc                 C   s~   t ddgddgd}t dgdgd}|j|dd	d
}t ddddtjdddddtjddg d }t|| d S )Nr   r(   g      ?      ?r   gffffff?r#  r%  r!  )r&  r   r(  r'  )r!  r)  r"  r$  r*  )r	   r   r   r7   ry   rz   r-  r%   r%   r&   test_merge_nan_right2  s   

zTestMerge.test_merge_nan_right2zMignore:Passing a BlockManager|Passing a SingleBlockManager:DeprecationWarningc                    s<   G  fdddt   |}|j|dd}t| sJ d S )Nc                       s   e Zd Ze fddZdS )z0TestMerge.test_merge_type.<locals>.NotADataFramec                    s    S r;   r%   re   NotADataFramer%   r&   _constructor  s   z=TestMerge.test_merge_type.<locals>.NotADataFrame._constructorN)__name__
__module____qualname__propertyr3  r%   r1  r%   r&   r2    s    r2  r[   r   )r	   r   
isinstance)ra   rb   rX   nadr}   r%   r1  r&   test_merge_type  s   zTestMerge.test_merge_typec                 C   s   t tdddddgtddgd}t tdd	}d
}t}|r"d }tj||d t||gdd}t||gdd}W d    n1 sDw   Y  t tdddddtdddddgtddtddgd}|rm|	t
}t|| d S )Ni     rT   8   r   iW  )rh   tr   r   zDThe behavior of DataFrame concatenation with empty or all-NA entriesr   T)ignore_index)r	   r  r   r   r   FutureWarningry   assert_produces_warningr   r   r6   rz   )ra   r   rh   rb   r   warnr}   r~   r%   r%   r&   test_join_append_timedeltas  s(   
z%TestMerge.test_join_append_timedeltasc                 C   s   t d}tt||gddgd}tt|gdgd}|j|ddd}tt||gtddt|tjgtddd	}t	|| d S )
Ni ABrr   rro   )r&  r   AB)00r)
r   timedelta64r	   r   r   r   r2   r8   ry   rz   )ra   tdlhsrhsr}   r~   r%   r%   r&   test_join_append_timedeltas2  s   
z&TestMerge.test_join_append_timedeltas2unit)Dr   msmsusnsc           
      C   s   t dddgi}td d gddgdd}d| d}|dv r d	}n|}||d}|d j|ks3J |j|dd
d}tjddg|d}tj	j
jj||jd}t ddg|dddgd}	|	d j|kseJ t||	 d S )N	entity_ide   f   daysrs   r=   zdatetime64[]rO  r   rP  zdatetime64[s]Tr   natr*   rU  rX  r   )r	   r   r   to_framer+   r   r   r   r2   corearraysDatetimeArray_simple_newry   rz   )
ra   rN  rW   serr+   	exp_dtyperX   r}   rX  r   r%   r%   r&   test_other_datetime_unit  s&   z"TestMerge.test_other_datetime_unitc           	      C   s   t dddgi}td d gddgdd}d| d}|dv rDd	}tjt|d
 || W d    n1 s6w   Y  |dd}n||d}|d j|ksUJ |j|ddd}t ddgt	j
ddg|ddddgd}t|| d S )NrU  rV  rW  rX  rY  zm8[rZ  r[  z/Supported resolutions are 's', 'ms', 'us', 'ns'r   zm8[s]Tr   r\  r*   r]  r   )r	   r   r   r   r   r   r^  r+   r   r   r   ry   rz   )	ra   rN  rW   rc  r+   r   rX   r}   r   r%   r%   r&   test_other_timedelta_unit
  s"   z#TestMerge.test_other_timedelta_unitc                 C   s   t g dg dg dd}t g dg dg dd}g d|_g d|_t g dg dg dg dg dd}g d|_tt||| g d	|_d
}tjt|d t|| W d    d S 1 sgw   Y  d S )Nr   r   r   rl   rm   rp   )rl   r-   r-   )rl   r   r   )rl   rm   rp   v3v4)rl   r-   r-   r   r   )r[   r-   r-   z;Data columns not unique: Index\(\['foo'\], dtype='object'\)r   )r	   r   ry   rz   r   r   r   r   )ra   rb   rX   r~   r   r%   r%   r&   &test_overlapping_columns_error_message$  s&   


	
"z0TestMerge.test_overlapping_columns_error_messagec                 C      t tjddddddgd}t tjddddg d	d}t tjdd
ddddtjtjgtjdddgd}t||ddd}t|| d S )N20151010r   r/   periodsr1   r(   r   20151011rR   r   rS   r  rl   r   r   )r	   r2   
date_ranger   r7   r   ry   rz   r   r%   r%   r&   test_merge_on_datetime64tz<  s$   z$TestMerge.test_merge_on_datetime64tzc              
   C   s   t ddgtjddddd}t ddgtjddddd}t g d	ttjddddtjg tjgttjdddd d
}t||ddd}t|| |d jdksWJ |d jdks`J d S )Nr(   r   rl  r/   rm  r   rR   ro  r   r  rl   r   r   r   zdatetime64[ns, US/Eastern]r   )	r	   r2   rp  r   r8   r   ry   rz   r+   r   r%   r%   r&   test_merge_datetime64tz_valuesU  s0   	z(TestMerge.test_merge_datetime64tz_valuesc                 C   s   t jdd}tt jd|jdgdgt jd|jdgdg dd}|d d }|j|d	d
}tttdt|dt|dttdt|ddg dd}t	|| d S )NUTCr0   2018g      @2019)r   rd   date2r   r   r   r   r*   )r   date2_xr   r   date2_y)
r2   DatetimeTZDtyper	   r3   r1   r   r   r5   ry   rz   )ra   dtzrt   ro   r}   r~   r%   r%   r&    test_merge_on_datetime64tz_emptyp  s(   
z*TestMerge.test_merge_on_datetime64tz_emptyc                 C   s   t tjddddddgd}d|d	< t tg d
dd}|d jdjd|d< t||ddd}t tjddddddgd tj	gd  tj	gd dgd  d}t
|| d S )Nz2017-10-29 01:00rS   HzEurope/Madrid)rn  freqr1   r   r   r(   rd   )z2017-10-29 03:00:00z2017-10-29 04:00:00z2017-10-29 05:00:00r   )r   rd   rs  r   r   r   rj   rR   )r   r   r   )r	   r2   rp  to_datetimer   tz_localize
tz_convertr   r   r7   ry   rz   r-  r%   r%   r&   +test_merge_datetime64tz_with_dst_transition  s.   	z5TestMerge.test_merge_datetime64tz_with_dst_transitionc                 C   s   t jdddd}tttt||dgd}t||g}|j|dddd	}tt	tj
dtjd
ddddddg| jd}t|| d S )Nz
2016-01-01   Mrn  r}  pnumrs   r   Tr   )rv   rw   r   r*   r   r(   pnum_xpnum_yr   rs   )r2   period_ranger	   r   r   r   r   r   r   r   r   r)   repeatreshape
sort_indexrs   ry   rz   )ra   rs   rb   rX   r}   r~   r%   r%   r&   "test_merge_non_unique_period_index  s   $z,TestMerge.test_merge_non_unique_period_indexc                 C   rk  )Nrl  r   rO  r  r(   r   ro  rR   r   rS   r  rl   r   r   )r	   r2   r  r   r7   r   ry   rz   r   r%   r%   r&   test_merge_on_periods  s    zTestMerge.test_merge_on_periodsc                 C   s   t ddgtjddddd}t ddgtjddddd}tjdddd}tjdddd}t g d	t|tjg tjgt| d
}t||ddd}t|| |d jdks[J |d jdksdJ d S )Nr(   r   rl  rO  r  r   rR   ro  r   r  rl   r   r   r   z	Period[D]r   )	r	   r2   r  r   r8   r   ry   rz   r+   )ra   ro   rt   exp_xexp_yr~   r}   r%   r%   r&   test_merge_period_values  s$   z"TestMerge.test_merge_period_valuesc           
      C   s@  |\}}|  }|  }tg dddtjtjtjtjgddtjtjtjtjgtjdddddgtjdddddgd	}tg d
g dd|d< |g d }t||dddd}t|| |j|dddd}t|| t|| t|| |}|jddid}t||dddd}	t|	| |j|dddd}	t|	| d S )Nr   r(   r   rR   rS   rT   r(   r   rM   rN   rR   rS   rT   )rO   col_conflict_xrQ   col_conflict_yrU   )	left_onlyboth
right_onlyr  r  r  r  r  r  
categories_merge)rO   r  rQ   r  rU   r  rO   r   Tr   r   	indicatorcustom_namer   )	r   r	   r   r7   r   r   ry   rz   rename)
ra   rY   rW   rX   df1_copydf2_copy	df_resulttestdf_result_custom_nametest_custom_namer%   r%   r&   test_indicator  sH   	

zTestMerge.test_indicatorc                 C   s   |\}}d}t jt|d t||dddd W d    n1 s!w   Y  t jt|d |j|dddd W d    d S 1 sBw   Y  d S )Nz<indicator option can only accept boolean or string argumentsr   rO   r   rT   r  r   )ra   rY   rW   rX   r   r%   r%   r&   #test_merge_indicator_arg_validation   s   "z-TestMerge.test_merge_indicator_arg_validationc                 C   s   |\}}t ||dddd}|jdk sJ |j |dddd}|jdk s(J t ||dddd}|jdk s:J |j |dddd}|jdk sLJ t ||dddd}|jd	k s^J |j |dddd}|jd	k spJ d S )
NrO   ro   Tr  r  rt   r  r   r  )r   r  r   )ra   rY   rW   rX   test2test3test4r%   r%   r&   %test_merge_indicator_result_integrity*  s   z/TestMerge.test_merge_indicator_result_integrityc              	   C   sV  |\}}dD ]T}t dddg|ddgi}d| d}tjt|d t||ddd	d
 W d    n1 s5w   Y  tjt|d |j|ddd	d
 W d    n1 sUw   Y  qt ddgddgd}d}tjt|d t||dddd
 W d    n1 sw   Y  tjt|d |j|dddd
 W d    d S 1 sw   Y  d S )N)_right_indicator_left_indicatorr  rO   r(   r   zECannot use `indicator=True` option when data contains a column named z;|Cannot use name of an existing column for indicator columnr   r   Tr  )rO   custom_column_namez:Cannot use name of an existing column for indicator columnr  r	   r   r   r   r   )ra   rY   rW   r%  r   df_badcolumnr   r%   r%   r&   test_merge_indicator_invalid=  s<   "z&TestMerge.test_merge_indicator_invalidc                 C   s   t ddgddgd}t g dg dd}t g dg d	d}tg d
g dd|d< t||ddgddd}t|| |j|ddgddd}t|| d S )Nr   r(   rM   rN   )rO   col2)r(   r(   rR   )rN   r?   r   )r   r(   r(   rR   rM   rN   r?   r   )r  r  r  r  r  r  r  rO   r  r   Tr  r	   r   r   ry   rz   )ra   df3df4hand_coded_resulttest5r%   r%   r&   %test_merge_indicator_multiple_columns_  s   
z/TestMerge.test_merge_indicator_multiple_columnsc                 C   s  t g dg ddtdd}t g dg ddtd	d}| }| }t||d
d
dd}t|| t|| t g dg dg dg ddtdg dd}t||d
d
dd}t|| t g dg dg ddtdd}t||ddd}t|| t|| t|| t||ddd}t|| t g dg dg ddg dtdd}|d}	t|	|d
ddd}t|| t|t dgdgddgdg}
t||
d
d
dd d}tj	t
|d t||
d
d
dd W d    n1 sw   Y  tj	t
|d t||
ddd W d    n	1 sw   Y  t|t dgdgddgdgd
d}t||d
d
dd d }tj	t
|d t||d
d
dd W d    n	1 sYw   Y  tj	t
|d t||ddd W d    n	1 syw   Y  t||
dd!d d"}tj	t
|d t||
d
d
dd W d    n	1 sw   Y  d#}tj	t
|d t||
ddd W d    n	1 sw   Y  d$}tj	t|d t||dd%d W d    n	1 sw   Y  t g d&g d'g ddtdd}t g d(g d)g d*d+tdd}t g d(g d)g d,g d*dtdd}d-}tj	t
|d t||ddd W d    n	1 sCw   Y  t||dd.gdd}t|| d S )/Nr   )catdogweaselhorser   rS   rr   rM   rN   rg   rh   ri   )meowbarkum... weasel noise?naychirprM   rg   rT   Tz1:1)rv   rw   validate)r  r  r  r  )a_xrN   a_yrg   r  
one_to_oner   rM   )r   r  rN   rM   rg   r  )rv   r   r  ri   mooone_to_manyzBMerge keys are not unique in right dataset; not a one-to-one merger   cowrR   )r   many_to_onezAMerge keys are not unique in left dataset; not a one-to-one mergemany_to_manyzCMerge keys are not unique in right dataset; not a many-to-one mergezBMerge keys are not unique in left dataset; not a one-to-many mergez"jibberish" is not a valid argument. Valid arguments are:
- "1:1"
- "1:m"
- "m:1"
- "m:m"
- "one_to_one"
- "one_to_many"
- "many_to_one"
- "many_to_many"	jibberish)rM   rM   rN   rN   )r   r(   r   r(   rM   rM   rN   )r   r(   r   )r  r  r  )rM   rN   rh   )r  r  r  zQMerge keys are not unique in either left or right dataset; not a one-to-one mergerN   )r	   r   r   r   ry   rz   r   r   r   r   r   r   )ra   ro   rt   	left_copy
right_copyr}   r~   
expected_2
expected_3left_index_resetright_w_dupsr   left_w_dupsexpected_multir%   r%   r&   test_validationr  s.  	
	

 					zTestMerge.test_validationc                 C   sP   t g g g d}tjdd t||dd W d    d S 1 s!w   Y  d S )Nr   raise)divider   r   )r	   r   errstater   )ra   rM   r%   r%   r&   )test_merge_two_empty_df_no_division_error7  s   "z3TestMerge.test_merge_two_empty_df_no_division_errorr   zindex,expected_index)r(   r   rS   )r(   r   rS   NNN)
2001-01-01
2002-02-02
2003-03-03r  r  r  c                 C   s.   g | ]}t g d |dt g dtjdfqS )r   r*   )r(   r   rR   NNN)r   r   float64.0dtypr%   r%   r&   
<listcomp>K  s    zTestMerge.<listcomp>)r(   r   r   rR   rR   rS   r  r  r  )r  
2001-01-02
2001-01-03rO  )r}  r  r  )1d2d3dr  r  r  c              	   C   s   t g dg dd|d}t dg di}|j|dd|d}t g d	g d
g dtjddgtjddgtjddggg dd}|j|dd t|| d S )Nr  rM   rl   rr   rN   r  rl   Tr   )r   r   r   r(   r(   r(   r   r   r   rR   rS   rT   rM   rl   rN   r   )inplace)r	   r   r   r7   r   ry   rz   )ra   r   rs   expected_indexrW   rX   r}   r~   r%   r%   r&   $test_merge_on_index_with_more_values=  s   ,


z.TestMerge.test_merge_on_index_with_more_valuesc                 C   sx   t g dg dd}t dg di}t g dg dg ddg dd	d
dtjgd}|j|dddd}t|| d S )Nr   )r   r(   r(   r  rN   r(   r   rR   N)r   r(   r(   r   )r(   r   r   rR   r  r   r(   r   r  rl   Trt   r   r	   r   r7   r   ry   rz   r   r%   r%   r&   test_merge_right_index_rightz  s   z&TestMerge.test_merge_right_index_rightc                 C   s   t ddgddgd}t ddgddgd}|j|dd	g|d
}|dkr0t ddgddgd}nt ddgddgd}t|| d S )Nr  pig(   r;  )animal	max_speedquetzalP   r  r  r   rt   rx   )ra   r   left_dfright_dfr}   r~   r%   r%   r&   test_merge_preserves_row_order  s   z(TestMerge.test_merge_preserves_row_orderc                 C   s   t g dtg dtddd}t dg ditg dd}|j|d	d
dd}t g dtg dg dddddtjgd}|jg dd}t	|| d S )Nr   r  abcr  r  rN   r   rr   rl   Trt   r   r  )rM   rM   rN   rg   )r(   r(   r   rR   r  r   r(   r   r   )
r	   r   r   r   r   r   r7   reindexry   rz   r   r%   r%   r&   8test_merge_take_missing_values_from_index_of_other_dtype  s    
zBTestMerge.test_merge_take_missing_values_from_index_of_other_dtypec                 C   sd   t tddd g dd}t tddd g dd}|jjD ]}d|j_q$|| d S )	Nr   )rS   rT   r(   r  r   )rT   rS   r  F)	r	   r   r   r  _mgrr`  flags	writeabler   )ra   r]   r^   r$   r%   r%   r&   test_merge_readonly  s   
zTestMerge.test_merge_readonlyN)Nr4  r5  r6  r   fixturerb   rX   ro   rt   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   markparametrizer   r   r  r	  r  r  r  r  r.  r0  filterwarningsr:  rB  rM  re  rf  rj  rq  rr  r{  r  r  r  r  r  r  r  r  r  r  r  r   r
   r2   r8   ry   ALL_REAL_NUMPY_DTYPESr   from_tuplesr   r7   r   r   r  r  r  r  r
  r%   r%   r%   r&   rZ   m   s    

	

		 



	
/* 


 ?
" F



 '
rZ   c                 C   sN   dD ]"}| j ||d}t|  | |dd}|d}tj||dd qd S )N)r   ro   r   r   T)r   r   rs   F)check_names)r   r   r,  r   ry   rz   )r?   r   r   r}   r~   r%   r%   r&   r     s   
r   c                   @   s<  e Zd Zejdddgeddgdgdd Zejde	j
e	je	je	je	je	jgejde	j
e	je	je	jgd	d
 Zejdg dg dg dg ddfg dddgddgddgdfddgg dddgddgdfgdd Zdd Zdd Zdd Zdd Zejdg d eg d!dfg d"eg d!dfd#dged$d%ged&fd#dged$d%ged&fgd'd( Zejdeddgd)d&g d*feddgd+d&g d*fg d g d,fg d"g d,fg d g d,fejd-dd.d/d0d1gfejd-dd.d/d#dgfejd-dd.d/d2dgfejd3dd4ejd3dd5d6fg	d7d8 Zejd9ddgd:fg d;fdgd<fdgd=fgd>d? Zejd9d@dAgd:fg d;fdAgd<fd@gd=fgdBdC Z ejdDd;g dEg dFgfd:g dEg dFgfd=g dEg dFgfd<g dFg dEgfgdGdH Z!dIdJ Z"ejdKg dLdMdN Z#dOS )PTestMergeDtypes
right_valsr-   r   categoryc              
   C   sv   t ddgtddgdddgddgtddgdd	tddgd
d	d}t d|i}t||dd}t|jjs9J d S )Nr-   r   r  r(   r         ?       @uint64r*   int32)rC  rD  CrO  EFrC  r   )r	   r   r   r   r   rC  r+   )ra   r  ro   rt   r}   r%   r%   r&   test_different  s   
zTestMergeDtypes.test_differentd1d2c           
      C   s>  t |}t |}tt jg dd |dddgd t jt dt jdd}td	d
g}tdt jddg|di|d}|j|ddgd}|	 }	|j
dkrUt d}t jt j|d|	d< d|	j|	jdk|	jdk@ df< d|	j|	jdk|	jdk@ df< t||	 |j|ddgdd}|	jddgddd t||	 d S )Nr  r   r*   r-   r   r     )k1k2v)r   r   )r(   r-   rp   rT   rj   rr   r   r!  r   r   r  r   r(   Tr  	mergesort)kindr  )r   r+   r	   r   r   r)   r   r  r   r   r$  r7   r   r   r!  ry   rz   sort_values)
ra   r  r  dtype1dtype2ro   rs   rt   r}   r~   r%   r%   r&   test_join_multi_dtypes  s*   




z&TestMergeDtypes.test_join_multi_dtypeszint_vals, float_vals, exp_valsr   )r  r        @XYr  r)  r(   rR   r   r  c                 C   sd   t d|i}t d|i}t |}|j|ddd}t|| |j|ddd}t||ddg  d S )Nr+  r,  r   rx   )ra   int_vals
float_valsexp_valsrC  rD  r~   r}   r%   r%   r&   test_merge_on_ints_floats  s   z)TestMergeDtypes.test_merge_on_ints_floatsc                 C   s~   t ddgddgdddgd}t d	gd
gdddgd}|j|ddd}t ddgddgtjdgdg dd}t|| d S )Nr  r  rc   r   rk   rl   rm   r   r      )rl   rp   rp   ro   r   g      i@rg  )r	   r   r   r7   ry   rz   r-  r%   r%   r&   test_merge_key_dtype_cast  s   z)TestMergeDtypes.test_merge_key_dtype_castc                 C   s0  t dg di}t dg di}t dgdgd}tt |j|ddd}t|| W d    n1 s7w   Y  tt |j|ddd}t||ddg  W d    n1 s^w   Y  t dtjtjdgi}td  |j|ddd}t||ddg  W d    d S 1 sw   Y  d S )	Nr+  r   r,  )皙?g      @r)  rR   r)  r*  r   )r	   ry   r@  UserWarningr   rz   r   r7   )ra   rC  rD  r~   r}   r%   r%   r&   !test_merge_on_ints_floats_warning   s    "z1TestMergeDtypes.test_merge_on_ints_floats_warningc                 C   st   t dtddgtdi}t dddgi}t dddgitd}t||dd}t|| t||dd}t|| d S Nrl   TFr*   r   )r	   r   r6   r   ry   rz   ra   rW   rX   r~   r}   r%   r%   r&   (test_merge_incompat_infer_boolean_object8  s   z8TestMergeDtypes.test_merge_incompat_infer_boolean_objectc                 C   sx   t dtddtjgtdi}t dddgi}t dddgitd}t||dd}t|| t||dd}t|| d S r6  )r	   r   r   r7   r6   r   ry   rz   r7  r%   r%   r&   5test_merge_incompat_infer_boolean_object_with_missingC  s   zETestMergeDtypes.test_merge_incompat_infer_boolean_object_with_missingzdf1_vals, df2_valsr  )rM   rN   rM   )r'  r  r  r   FTr*   c                 C   s\   t d|i}t d|i}t||dgd}t|jjsJ t||dgd}t|jjs,J d S )NrC  r   )r	   r   r   rC  r+   )ra   df1_valsdf2_valsrW   rX   r}   r%   r%   r&   !test_merge_incompat_dtypes_are_okO  s   z1TestMergeDtypes.test_merge_incompat_dtypes_are_okr  r   r  )rG  12z1/1/2011rO  r  z
2011-01-01z
2011-01-02r'  20130101)rn  r/   rm  c                 C   s  t d|i}t d|i}d|d j d|d j d}t|}tjt|d t||dgd W d    n1 s:w   Y  d|d j d|d j d}t|}tjt|d t||dgd W d    n1 smw   Y  t|t|krt |||d}t |||d}d|d j d|d j d	}t|}tjt|d t|| W d    n1 sw   Y  d|d
 j d|d
 j d}t|}tjt|d t||dd
gd W d    d S 1 sw   Y  d S d S )NrC  zYou are trying to merge on z and zE columns for key 'A'. If you wish to proceed you should use pd.concatr   r   rC  rD  r  rD  zE columns for key 'B'. If you wish to proceed you should use pd.concatr  zE columns for key 'C'. If you wish to proceed you should use pd.concat)	r	   r+   reescaper   r   r   r   r   )ra   r:  r;  rW   rX   r   r  r  r%   r%   r&    test_merge_incompat_dtypes_errorg  s<   



"z0TestMergeDtypes.test_merge_incompat_dtypes_errorzexpected_data, howr   r   rt   ro   c           	      C   s`   t dgdg|d}t dgdg|d}t|||d}tt|}t ||dg|d}t|| d S )N)r(   idr   r   r   rs   r   r+   r	   r   r   r   ry   rz   )	ra   any_numeric_ea_dtyper   expected_datar  r  r}   	exp_indexr~   r%   r%   r&   test_merge_EA_dtype     
z#TestMergeDtypes.test_merge_EA_dtyperM   rN   c           	      C   s`   t dgdg|d}t dgdg|d}t|||d}tt|}t ||dg|d}t|| d S )N)rM   rD  r   )rN   r   rF  rG  )	ra   r   rI  any_string_dtyper  r  r}   exp_idxr~   r%   r%   r&   test_merge_string_dtype  rL  z'TestMergeDtypes.test_merge_string_dtypezhow, expected_data)Tr(   rS   )FrT   rR   c                 C   sZ   t ddgddgd}t ddgddgd}t|||d	}t |g d
d}t|| d S )NTFr(   rT   rC  rD  rR   rS   rC  r  r   r@  r   rx   )ra   r   rI  rW   rX   r}   r~   r%   r%   r&   test_merge_bool_dtype  s
   z%TestMergeDtypes.test_merge_bool_dtypec           	      C   s   t g dg ddt d}| }t dddtjdgd	d
dtjdgd|d}| }t||dg|d}t|| t|| tt	
dt t	
dgtg dd}t|j| d S )N)r=  r>  34N)rT  5678)lvl0zlvl1-arZ  zlvl1-b)datar+   r=  r>  rS  rU  rW  rX  911)rY  rZ  zlvl1-crY  )ro   rt   r   r   O)rY  r[  r_  rr   )r	   r2   StringDtyper   NAr   ry   rz   r   r   r+   r   r  r   r
  )	ra   r   string_dtyperW   r  rX   r  r   r~   r%   r%   r&   test_merge_ea_with_string  s0   z)TestMergeDtypes.test_merge_ea_with_stringzleft_empty, how, exp)
)Fro   ro   )Frt   empty)Fr   re  )Fr   ro   )Fcrossempty_cross)Tro   re  )Trt   rt   )Tr   re  )Tr   rt   )Trf  rg  c                 C   s   t ddgddgd}t dgdgddd	}|r|d
}n|d
}|j||d}|dkr?t ddgddgtjtjgd}n2|dkrPt tjgdgdgd}n!|dkret g ddd}|rd|g d }n|dkrqt g ddd}t|| d S )Nr   r(   rR   rS   rP  rT   rQ  r)   r*   r   r   ro   r@  rt   )rD  rC  r  re  r   rg  )A_xrD  A_yr  )r	   headr   r   r7   ry   rz   )ra   
left_emptyr   r   ro   rt   r}   r~   r%   r%   r&   test_merge_empty  s$   
"z TestMergeDtypes.test_merge_emptyN)$r4  r5  r6  r   r  r  r   r   r  r   r)   r  intcint16int8uint8r  float32float16r(  r0  r2  r5  r8  r9  r6   r   r<  r2   rp  rC  rK  rO  rR  rd  rl  r%   r%   r%   r&   r    s    



5

	

	
	!r  c                   C   sL   t ttjdjddgddtddgtjdjg ddddS )Nr   r-   r   )rc   r  )onetwothreer*  )r	   r   r   r   r   choicer   CDTr%   r%   r%   r&   ro   3  s   ro   c                   C   s(   t tddgtddgddgdS )Nr-   r   r(   r   )r+  Z)r	   r   r   rw  r%   r%   r%   r&   rt   ?  s   "rt   c                
   @   s   e Zd Zdd Zdd Zdd Zdd Zej	d	d
dgdd Z
dd Zej	ddd dd dd gdd Zdd Zdd Zej	d	d
dgej	dg dd
dgd
dgfg dddgddgfg d d!d"gd!d"gfgd#d$ Zd%d& Zd'S )(TestMergeCategoricalc                 C   sT   t ||dd}|j }ttddgdtdtdgg dd}t|| d S )	Nr+  r   r-   r   r  r`  )r+  Y_xY_yrr   	r   r
  r  r   r   r   r+   ry   r   )ra   ro   r   r}   r~   r%   r%   r&   test_identicalG  s   
z#TestMergeCategorical.test_identicalc                 C   sT   t ||dd}|j }ttddgdtdtdgg dd	}t|| d S )
Nr+  r   r-   r   r  r`  r)   r+  r,  rx  rr   r|  ra   ro   rt   r   r}   r~   r%   r%   r&   
test_basicQ  s   
zTestMergeCategorical.test_basicc                 C   sD  t ddddddddddddd}t d	d	d	d	d	dd
d
d
d
d
dd}t||dddd}| }| }|d d|d< t||dddd}|d tdg|d< t|| | }|d d|d< t||dddd}t|| | }|d d|d< | }|d d|d< t||dddd}t|| d S )NrM   rN   rg   rh   ri   )r   r(   r   rR   rS   nullr   r   r   r   ro   )r   r   r   r  )r	   r   r   r   r   ry   rz   )ra   rt   ro   rb   r~   crightr}   cleftr%   r%   r&   test_merge_categorical`  s6   z+TestMergeCategorical.test_merge_categoricalc                 C   s   t tg dg ddg dd}t tg dg ddg dd}t||dgd	}t tg dg dg d
d}t|| d S )Nr@  r  )A0B0C0)FooLeft)r  rD  rC  )C1B1A1)r  Rightr  r   )r  r  r  )r  r  r  r  r-  r%   r%   r&   'tests_merge_categorical_unordered_equal  s$   
z<TestMergeCategorical.tests_merge_categorical_unordered_equalorderedTFc                 C   s   t ddg|d}tg dtg d|dg ddd	d
g}tg dtg d|dg ddd	d
g}t||dddd}tg dtg d|dg dddtjgdd	d
g}t|| d S )NP2P1r  r  )r  r  rO  )r  r  r  r*   r  )rD  prM   rD  r  )rC  r  r  )r  r  r  )rc   r;  r  )rD  r  r  ro   Tr   g      &@g      (@)rD  r  rM   r  )	r   r	   r   r   r   r   r7   ry   rz   )ra   r  pcatrW   rX   r}   r~   r%   r%   r&   5test_multiindex_merge_with_unordered_categoricalindex  s8   



zJTestMergeCategorical.test_multiindex_merge_with_unordered_categoricalindexc                 C   s   |j |jdd}t||dd}|j }ttddgdt	dtd	d
gdgg dd}t
|| |jj|jjs?J |jj|jjsJJ d S )Nr  )rx  r+  r   r-   r   r  r`  r(   r   r~  rr   )assignrx  r   r   r
  r  r   r   r   r+   ry   r   r+  r  #_categories_match_up_to_permutationr  r%   r%   r&   test_other_columns  s   
z'TestMergeCategorical.test_other_columnschangec                 C   s   | S r;   r%   r>   r%   r%   r&   r@     s    zTestMergeCategorical.<lambda>c                 C   s   |  tg dS )N)r-   r   bahr   rw  r>   r%   r%   r&   r@     s    c                 C   s   |  tddS )NTr  r  r>   r%   r%   r&   r@     s    c           	      C   s   ||j d}|j|d}t|j jjtsJ t||d|d}|j	 }t
tdtdtdgg dd}t|| d S )	Nr6   )r+  r+  r   r`  r)   r~  rr   )r+  r   r  r8  r  r+   r   r   r
  r  r   r   ry   r   )	ra   r  r   ro   rt   r+  r   r}   r~   r%   r%   r&   test_dtype_on_merged_different  s   
 z3TestMergeCategorical.test_dtype_on_merged_differentc                    sx   d t g d  g dd    fdddD  fddd	D d
}|dd }t||t|jd}t|| d S )NrT   )
rM   rN   rg   rh   ri   r   r   r   r   j)r=  wr?   r   r   r   c                    s$   g | ]}|gd    D ]}|qqS rE  r%   r  eachletterrP  r%   r&   r    s    zKTestMergeCategorical.test_self_join_multiple_categories.<locals>.<listcomp>)rP  r"   ur  oc                    s    g | ]}|g  D ]}|q	qS r%   r%   r  r  r%   r&   r    s    )
aabbccddeeffgghhiijjr   c                 S   s
   |  dS )Nr  )r   r>   r%   r%   r&   r@     s   
 zITestMergeCategorical.test_self_join_multiple_categories.<locals>.<lambda>r   )r	   applyr   r   r   ry   rz   )ra   rb   r}   r%   r  r&   "test_self_join_multiple_categories  s   


z7TestMergeCategorical.test_self_join_multiple_categoriesc                 C   s(  t tddddgtddddggddgd}|d d	|d< t tddddgtddd
dggddgd}|d d	|d< t td ddgtd dtjgtd tjdggg dd}t||ddgd}t	|| t td ddggg dd}t||ddgd}t	|| d S )Ni  r(   r3  r   ?r   num2r   r  rR   ffffff?num4r  r  r  )r   r  r  r   r~  r   )
r	   r   r   r2   r3   r   r7   r   ry   rz   )ra   rb   rX   expected_outerresult_outerexpected_innerresult_innerr%   r%   r&   test_dtype_on_categorical_dates  s.   $$z4TestMergeCategorical.test_dtype_on_categorical_datesz.category_column,categories,expected_categories)FTTF)r   r(   r(   r   r(   r   )FalseTruer  r  r  r  c           	      C   s   t g d|d}|d t||d|d< t ddgddgd	}||}t ddg|ddgd
}|d t||d|d< t|| d S )Nr   )rD  r  r  r  r   rS   r(   r   )rD  num)rD  r  r  )r	   r   rw  r   ry   rz   )	ra   category_columnr  expected_categoriesr  rW   rX   r}   r~   r%   r%   r&   /test_merging_with_bool_or_int_cateorical_column6  s   
zDTestMergeCategorical.test_merging_with_bool_or_int_cateorical_columnc                 C   s\   t tddtjgdddd}t||dd}t tddtjgddddd}t|| d S )	Nr(   r   r,   r*   rP  rC  r   )rC  B_xB_y)r	   r   r   r7   r   ry   rz   )ra   rb   r}   r~   r%   r%   r&   test_merge_on_int_arrayL  s   z,TestMergeCategorical.test_merge_on_int_arrayN)r4  r5  r6  r}  r  r  r  r   r  r  r  r  r  r  r  r  r  r%   r%   r%   r&   ry  F  s8    
+

( ry  c                   C      t dg dig ddS )NrM   r   rc   r   r   r(   r   rr   rV   r%   r%   r%   r&   r  V     r  c                   C   r  )NrN   ,  d   r1  rR   r(   r   rr   rV   r%   r%   r%   r&   r  [  r  r  c                   @   sZ  e Zd Zejdddeddgddgdd	d
gdfddeddgddgdd
d	gdfddeg dddejgdg ddfddeg dejddgdg ddfddeejddgg ddg ddfddeddejgg ddg ddfddedddejgejdddgdg ddfddedddejgejdddgdg ddfgdd Z	dS )TestMergeOnIndexeszhow, sort, expectedr   Fr   rc   r1  r  r   r   r(   rr   Tro   r  r  )r   rc   r   r  rt   r  r  r  r1  r  r   r   r   r  r   c                 C   s$   t ||dd||d}t|| d S )NT)rv   rw   r   r   r   )ra   r  r  r   r   r~   r}   r%   r%   r&   test_merge_on_indexesa  s   0z(TestMergeOnIndexes.test_merge_on_indexesN)
r4  r5  r6  r   r  r  r	   r   r7   r  r%   r%   r%   r&   r  `  sT    ""  	/r  rs   c                 C   s   g | ]}t d dg|ddqS )r(   r   	index_colr<   )r   r  r%   r%   r&   r    s    r  rC  rD  r  )r  r=   r   )startstopr=   r.   z
2018-01-02r   c                 C   s   t | j d| j dS )N[rZ  )typer4  r+   r>   r%   r%   r&   r@     s    )rC   c                 C   sb   t dddgi| d}t dddgi| d}|j|dgd	}t ddgddgd
| d}t|| d S )N	left_datar(   r   rr   
right_datar  r  r  r   )r  r  rx   )rs   ro   rt   r}   r~   r%   r%   r&   test_merge_index_types  s
   r  z-on,left_on,right_on,left_index,right_index,nmr   r   F)NNNTTrD  T)NNNTTNc              
   C   s  t dg ditjddgddggddgd	d
}tg dtjddgddggddgd	|d}t ddgddgdtjddgdggddgd	d
}|d ur]t||| ||||d}	t|	| d S d}
tjt	|
d t||| ||||d}	W d    d S 1 s}w   Y  d S )NrC  r   rM   rN   r   r(   r   r   namesrr   r   rY  rS   rR   rP  )r   r   r   rv   rw   z$Cannot merge a Series without a namer   )
r	   r   from_productr   r   ry   rz   r   r   r   )r   r   r   rv   rw   nmrM   rN   r~   r}   r   r%   r%   r&   test_merge_series  sH   
	"r  c                  C   s   t dg ditjddgddggddgd	d
} tg dtjddgddggddgd	dd}tjtdd t| |ddgd W d    d S 1 sIw   Y  d S )NrC  r   rM   rN   r   r(   r   r   r  rr   r   )rD  r  rY  z-Not allowed to merge between different levelsr   r   )r	   r   r  r   r   r   r   r   r   r%   r%   r&   test_merge_series_multilevel  s   
"r  z!col1, col2, kwargs, expected_colssuffixes) _duprG  0_dup)Nr  )_x_y0_x0_yr  r  rM   )Nr  r'  )r  Nz0.0_xrN   b_yr  )Nr  )_aN0_ar  c                 C   s   t | g di}t |g di}t ddgddgddgg|d	}|j|fd
d
d|}t|| t||fd
d
d|}t|| d S )Nr   r   r(   rS   r   rT   rR   r   r   Tru   rx   )rO   r  kwargsexpected_colsrM   rN   r~   r}   r%   r%   r&   test_merge_suffix  s   r  zhow,expectedr  <   F   X       )rC  r  B2)r  r1  r(   r  r   r  r  r  c                 C   sX   t g dg dd}t g dg dd}t||d| dd}g d	|_t|| d S )
N)r  r1  r(   )r  r  r   rP  r  r  rC  )r  r  )r   r   r  )rC  r  r  )r	   r   r   ry   rz   )r   r~   r  r  r}   r%   r%   r&   test_merge_duplicate_suffix	  s
   
r  zcol1, col2, suffixes))rM   rM   )NN)rM   rM   )r  N)r   r   )Nr  c                 C   sj   t | g di}t |g di}d}tjt|d t||dd|d W d    d S 1 s.w   Y  d S )Nr   rR   rS   rT   z'columns overlap but no suffix specifiedr   Trv   rw   r  r  )rO   r  r  rM   rN   r   r%   r%   r&   test_merge_suffix_error2	  s   "r  r  c                 C   sf   t dg di}t dg di}tjtdd t||dd| d W d    d S 1 s,w   Y  d S )	NrM   r   rN   r  zPassing 'suffixes' as ar   Tr  )r	   r   r   	TypeErrorr   )r  rM   rN   r%   r%   r&   test_merge_suffix_raisesA	  s
   "r  zcol1, col2, suffixes, msg)rM   rM   r   z(too many values to unpack \(expected 2\)z1not enough values to unpack \(expected 2, got 1\)c                 C   sf   t | g di}t |g di}tjt|d t||dd|d W d    d S 1 s,w   Y  d S )Nr   r  r   Tr  r  )rO   r  r  r   rM   rN   r%   r%   r&   test_merge_suffix_length_errorJ	  s
   "r  	cat_dtypers  rt  reversec           	      C   s   t g dddt g dddd}ttg d|d g ddd}g d}g d}|r8|  |  tt|||  |d	d}|j|d
d
d}tg dg dtg d|d dd}t|| d S )Nr   Fr  )rs  rt  rs  r   r-   ro   r-   r-   rt   Tru   ro   rt   r-   )	r   r	   r   r   r   r  r   ry   rz   )	r  r  
cat_dtypesrW   data_foo
data_rightrX   r}   r~   r%   r%   r&   test_merge_equal_cat_dtypesY	  s8   r  c                  C   s   t g ddd} ttddg| ddgdd	}ttg d| g d
dd	}|j|ddd}tddgddgtddg| dd	}t|| d S )Nr   Fr  rM   rN   r(   r   r  r-   )rR   r   r(   r  Tru   rR   r  )r   r	   r   r   r   r   ry   rz   )r  rW   rX   r}   r~   r%   r%   r&   test_merge_equal_cat_dtypes2~	  s$    r  c                  C   sj   t dttddtddgddi} |  }|d d|d< t|| ddd	}|  }t|| d S )
NrM   r   r(   r   intervalr*   r  r   r~  )	r	   r   r2   Intervalr   r   r   ry   rz   )rt   ro   r}   r~   r%   r%   r&   test_merge_on_cat_and_ext_array	  s   "r  c            	         s   g d} g d}t j| |fddgd}t|d}d|d< t|d}d|d< d	 d
|j|d fd} fdd| D fdd| D  }t j||gddgd}t|d}d|d< t|| d S )Nr   r=  r>  rS  r   r   r  r   r  rD  r  r  r   r  c                       g | ]}|  qS r%   r%   r  r  )l_sufr%   r&   r  	  s    z1test_merge_multiindex_columns.<locals>.<listcomp>c                    r  r%   r%   r	  )r_sufr%   r&   r  	  s    )r   r  r	   r   ry   rz   )	lettersnumbersrs   frame_xframe_yr}   expected_labelsr  r~   r%   )r
  r  r&   test_merge_multiindex_columns	  s&   


r  c                  C   st   t g dg dd} t g dtg dd}t| |ddd	}t g dg dtg d
d}t|| d S )Nr   )r=  r>  rT  )r?   r   r  )200020012002)r   r   ro   r   r~  )r  r  r8   r   )r	   r2   r  r   ry   rz   rW   rX   r}   r~   r%   r%   r&    test_merge_datetime_upcast_dtype	  s   r  n_categoriesrT      c                 C   s   t dgtt|  }tt| d dg|d}tdggdgt dgtt| dd}t||dddd	}td
d t| d D ddg|d}t|| d S )Nr   r(   rd   r  r   r  ro   Tr   c                 S   s&   g | ]}|d k r|dgn|t jgqS )r   g      @)r   r7   )r  r   r%   r%   r&   r  	  s   & z9test_categorical_non_unique_monotonic.<locals>.<listcomp>r   r   )r   r   r   r	   r   ry   rz   )r  rv   rW   rX   r}   r~   r%   r%   r&   %test_categorical_non_unique_monotonic	  s   r  c                  C   s`  t g dg dg dd} t| } t g dg dg dg dd}t|d	d
gd }t| | ddgd	d
gdd}|jd	d
gdd}| j|ddgd}t|| t g dg dddg dd} t| } t g dg dddg dg dd}t|d	d
gd }t| | ddgd	d
gdd}|jd	d
gdd}| j|ddgd}t|| d S )N)rM   rN   rM   rg   rM   rN   r   )r   r(   r   r(   r   r   )Cat1Int1)rM   rN   rg   rM   rN   rg   )r   r   r   r(   r(   r(   )r3  g333333?r  r  r/  g?)CatIntFactorr  r  r  r  r  ro   r   r(   )axisr   r  Tr  )	r   r	   r   r   r,  dropr   ry   rz   )rM   rN   r~   r}   r%   r%   r&   &test_merge_join_categorical_multiindex	  sT   r!  funcr   
merge_asof)r  err_msg)r   rv   r   rv   )r   rw   r   rw   c                 C      t ddgddgd}t ddgddgd}d	|d
  d|d  d}tjt|d tt| ||fi | W d    d S 1 sBw   Y  d S )Nr(   r   rR   rS   r   rT   r   r  zCan only pass argument "r   " OR "z" not both\.r   r	   r   r   r   getattrr2   r"  r  r$  ro   rt   r   r%   r%   r&   /test_merge_join_cols_error_reporting_duplicates!
     
"r*  c                 C   r%  )Nr(   r   rR   rS   r   rT   r   r  zMust pass "r   r&  z"\.r   r'  r)  r%   r%   r&   ,test_merge_join_cols_error_reporting_missing2
  r+  r,  r  c                 C   s   t ddgddgd}t ddgddgd}d	}tjt|d
 tt| ||fddi| W d    d S 1 s9w   Y  d S )Nr(   r   rR   rS   r   rT   r   r  zZCan only pass argument "on" OR "left_index" and "right_index", not a combination of both\.r   r   rM   r'  )r"  r  ro   rt   r   r%   r%   r&   1test_merge_join_cols_error_reporting_on_and_indexC
  s   
"r-  c                  C   sv   t ddgddgd} t ddgddgd}t| |dddd}t ddgddgddgddgddgd}t|| d S )	Nr(   r-   )r?   r   rt   Tr?   )r   rv   r   )r?   x_xz_xx_yz_yrx   ro   rt   r}   r~   r%   r%   r&   test_merge_right_left_indexW
  s   	r3  c                  C   s   t dgdgdddg} t ddgidg}t g g dtjdddg}t| |dgdd}t|| t|| ddgd	}t|| d S )
Nr(   r   r   rM   rN   r*   Tr   r   )r	   r   r   r)   r   ry   rz   rW   rX   r~   r}   r%   r%   r&   $test_merge_result_empty_index_and_onh
  s   r5  c                  C   s   t g dddd} t g ddd}tjtdd t| |dd	 W d    n1 s,w   Y  tjtdd t|| dd
d W d    d S 1 sLw   Y  d S )Nr   r(   r   )rM   rN   b_xr   (Passing 'suffixes' which cause duplicater   rM   r   )r  r  r  r	   r   r   r   r   r  r%   r%   r&   .test_merge_suffixes_produce_dup_columns_raisest
  s   "r9  c                  C   sb   t g dg dgg dd} t ddgdd}t| |d	d
}t g dgg dd}t|| d S )Nr  r  )rM   rN   rN   r   r(   rR   r   r   rM   r   )r(   r(   r(   r   )rM   r6  r6  r  rx   r2  r%   r%   r&   3test_merge_duplicate_columns_with_suffix_no_warning
  s
   r:  c                  C   sp   t g dg dgg dd} t ddgdd}tjtd	d
 t| |dd W d    d S 1 s1w   Y  d S )N)r(   r(   r(   r(   )r   r   r   r   )rM   rN   rN   r6  r   r(   rR   r   r   r7  r   rM   r   r8  r  r%   r%   r&   Itest_merge_duplicate_columns_with_suffix_causing_another_duplicate_raises
  s
   "r;  c                  C   s~   t ddgddggtddgd} t dd	gd
dggddgd}t|| dddd}t g dg dgtg dd}t|| d S )Nr(   r   rR   rS   rM        \@r   r   rc   r;  r  r?   r   r   Tr   )r   rc   r(   r   )r;  r  rR   rS   )r?   r   rM   r<  r	   r   r   ry   rz   r  r%   r%   r&   %test_merge_string_float_column_result
  s    r>  c                  C   sn   t dgdgdgd} t dgdgdgd}tjtdd t| |dgdd	 W d    d S 1 s0w   Y  d S )
Nr+  r     )r\  r   rs   i  zCan only pass argumentr   T)r   rv   r8  )df_1df_2r%   r%   r&   /test_mergeerror_on_left_index_mismatched_dtypes
  s
   "rB  c                  C   sb   t td} t| tdd}tdtddi}t||| dd}t||| jdd}t|| d S )NrR   rP  r  r   rC  r   )r   r   r	   r   _datary   rz   )cirt   ro   resr~   r%   r%   r&   #test_merge_on_left_categoricalindex
  s   rF  r+   r,   c                 C   s   t ddgddgd| d}t tjtjgddgd| d}t||dd	d
}t ddtjtjgddtjtjgtjtjddgd| d}t|| t||dd	d
}t tjtjddgddtjtjgtjtjddgd| d}t|| d S )Nr(   r   )rl   rO   r*   rR   rS   )rl   r  rl   r   r   )rl   rO   r  )rl   r  rO   r  )r+   ro   rt   r}   r~   r%   r%   r&   test_merge_outer_with_NaN
  s(   rG  c                  C   sh   t ddgitdgddd} t ddgitdgddd}t| |ddd}t dgdd}t|| d S )	NrM   r(   rg   r   rr   rh   r   )r  r  r=  r2  r%   r%   r&    test_merge_different_index_names
  s
   rH  c                 C   sb   t g ddd| d}t g ddd| d}|j||d}t g dddd| d}t|| d S )	Nr   r(   r   r*   r   r  r   r   rx   rH  r   ro   rt   r}   r~   r%   r%   r&   test_merge_ea
  s
   rJ  c                 C   s   t g ddd| d}t g ddd|  d}|j||d}t tg d| dtg d| dtg d	|  dd
}t|| d S )Nr   r(   r   r*   r   r  r   r  r  r   )r	   lowerr   r   ry   rz   rI  r%   r%   r&   test_merge_ea_and_non_ea
  s   rL  r)   int64[pyarrow]c                 C   sr   t d tdddgi| d}tdddgidd}||}| }t|| ||}| }t|| d S )NpyarrowrM   r(   r   r*   rM  )r   importorskipr	   r   r   ry   rz   )r+   rb   rX   r}   r~   r%   r%   r&   !test_merge_arrow_and_numpy_dtypes
  s   


rP  r   )r   ro   r   rt   r1   zAmerica/Chicagoc                 C   s8  t jddd| dt jddd| dt jddd| dg}t|d d dd	gd
}|d jd|d< t|dd  dd	gd}|d jd|d< t|dd	tjgtjdd	gd}|d jd|d< |dkrq|jdg jdd}n|dkr}|jddg }n|dkr|jddg jdd}|j	|d|d}t
|| d S )Ni  rT   r  r0         r   r  r  )r=  rM   r=  rT  r(   )r=  rN   rQ  )r=  rM   rN   r   T)r   ro   r   rt   r   )r2   r3   r	   r   as_unitr   r7   ilocr,  r   ry   rz   )r1   r   valsrW   rX   r~   r}   r%   r%   r&   (test_merge_datetime_different_resolution
  s$    rV  c                  C   sn   t dddgi} t ddgitjddgdgdd	}t ddgdtjgd
}| j|dgddd}t|| d S )NcolrC  rD  rN   r  )rC  )r  r  )r\  rs   )rW  rN   Tro   r   )r	   r   r  r   r7   r   ry   rz   )rb   rX   r~   r}   r%   r%   r&   "test_merge_multiindex_single_level  s   rX  c                  C   s  t dtjgt d} t dg}t dgdd}tjtdd | |}W d    n1 s.w   Y  t	|| tjtdd || }W d    n1 sPw   Y  t	||
d	 t dg}t d
gdgdd}| |}t	|| || }t	||
d	 d S )Nr  r*   r/  r   r,   r   zYou are mergingr   r  r(   )r	   r   r7   r2   
Int64Dtypery   r@  r4  r   rz   r   r4  r%   r%   r&   !test_merge_ea_int_and_float_numpy'  s"   



rZ  c                 C   s|   t d tdddgi| d}tdditddg| dd}|j|ddd	d
}ttddg| ddtjgd}t	|| d S )NrN  rM   rN   r*   r(   rg   rr   Tro   r   r   )
r   rO  r	   r   r   r   r   r7   ry   rz   )rM  ro   rt   r}   r~   r%   r%   r&   test_merge_arrow_string_index>  s   
r[  )r   r   )[r   r   r   rA  numpyr   r   pandas.core.dtypes.commonr   pandas.core.dtypes.dtypesr   pandasr2   r   r   r	   r
   r   r   r   r   r   r   r   pandas._testing_testingry   pandas.api.typesrw  pandas.core.reshape.concatr   pandas.core.reshape.merger   r   r'   r4   r9   r  rI   rK   rL   rY   rZ   r   r  ro   rt   ry  r  r  r  r  r  r  r  r  r  r  r7   r  r  r  tupler  r  r  r  r  r  r  r!  r*  r,  r-  r3  r5  r9  r:  r;  r>  rB  rF  rG  rH  rJ  rL  rP  rV  rX  rZ  r[  r%   r%   r%   r&   <module>   sh   4
	



          W  p

  

7


(

	


# 
8		
	
		
