U
    *if                     @  s   d dl mZ d dlmZ d dlZd dlZd dlZd dlmZ d dl	Z
d dl	mZmZmZmZmZ d dlmZ ejdddd	Zejd
dddZG dd dZG dd dZdS )    )annotations)datetimeN)np_version_under1p20)	DataFrameIndexSeries	Timestamp
date_rangezdict[str, list[int | str]])returnc                   C  s   t tdt ddS )N   ab..ab)listrange r   r   Z/home/mars/bis/venv/lib/python3.8/site-packages/pandas/tests/frame/methods/test_replace.pymix_ab   s    r   zdict[str, list[float | str]]c                   C  s"   t tdt dddtjdgdS )Nr   r   r   r   dr   r   c)r   r   npnanr   r   r   r   mix_abc   s    r   c                   @  s  e Zd Zdd Zejdddgejdgddejejgdgd	 d
g d
dddgdfddgddgddddgdddd
gd
dddgdfddgddgddddgdddd
gd
dddgdfgejdddgejdddgdd Z	dd  Z
d!d" Zd#d$ Zd%d& Zd'd( Zd)d* Zd+d, Zd-d. Zd/d0 Zd1d2 Zd3d4 Zejd5ejd6d7d6ejd8gd9d: Zejd;d<d=d>d?d@gdAdB ZejdCdDdEgdFdGdHdIdJgfdGd6d6gdKejidGejejgfgdLdM ZdNdO ZdPdQ ZdRdS ZdTdU ZdVdW ZdXdY ZdZd[ Z d\d] Z!d^d_ Z"d`da Z#dbdc Z$ejdddedfdggdhdi Z%djdk Z&dldm Z'dndo Z(dpdq Z)drds Z*dtdu Z+ejdve,dwdxdyd	gidxdze,dwdzdyd	gife,dwdxdyd	giej-d{dxdze,dwdzdyd	giej-d{fe,dwdxdyd	giej.d{dxdze,dwdzdyd	giej.d{fe,d|dddgidde,d|dddgife,d}d~ddgid~dze,d}dddgife,de/e0ddde0ddde0dddgie0ddde0ddde,de/e0dddgd	 ife,e0dddgdgddde,e0dddgdgdfe,e1dd	dddzejdygde2ddde2ddde,e2ddde2ddde2dddgdzejdygdfe,dxdgdydggdde,ddgdydggfe,dxdgdydggdxde,ddgdydggfe,dxdgdydggdde,ddgdydggfe,dxdgdydggdxde,ddgdydggfgdd Z3dd Z4dd Z5dd Z6dd Z7dd Z8dd Z9dd Z:dd Z;dd Z<dd Z=dd Z>dd Z?dd Z@dd ZAdd ZBdd ZCdd ZDdd ZEdd ZFdd ZGejddzddxdxdygdejdgdddFgdĜfejddzdxdygdddgdddFgdĜfdGddzdxdygdejdgdddFgdĜfdzdygddxdxdygdejdgdddFgdĜfdxdygddzdzdzgdejdgdddFgdĜfdddzdydygdejdgdddFgdĜfddFgddzdxdygdejdgdddgdĜfgddʄ ZHejddxdxdHd	d	gdydyggfdxdydHd	dxgdyd	ggfgdd̈́ ZIejddxdyd	gdddgdќddddҜdxdyd	gdddgdќfdxdyd	gdddgdќddddלdxdyd	gdddgdќfgddل ZJejde2dۃeKdxe.dxeLdxeMdxgdd݄ ZNdd߄ ZOdd ZPejddddddfdegejdejejgdd ZQejdejdgdd ZRejdeSdeTdzdgdd ZUdd ZVdd ZWdd ZXdd ZYdd ZZdd Z[ejddxgdgdzgdzgfdxgdxgdzgdzgfdgdgdzgdgfdgdxgdzgdgfgejde\e]ej^gdd Z_dS (   TestDataFrameReplacec                 C  s   t j|d d d< t j|d dd < | }|jt jddd}|d ksJtt||d |}t j|jdd|j	
df< t j|jd	d |j	
df< |t jd}|jdd
}t|| | }|jt jgdgdd}|d kstt||d d S )NA   r   Tinplace   foovalue)r   r   copyreplaceAssertionErrortmassert_frame_equalfillnailoccolumnsget_loc)selfdatetime_framefloat_string_frametsframereturn_valuemfresultexpectedr   r   r   test_replace_inplace!   s     z)TestDataFrameReplace.test_replace_inplacezto_replace,values,expected\s*\.\s*ze|f|gcrapr   r      hlor   
\s*(\.)\s*z(e|f|g)\1\1\1_crap..Ze_crapZf_crapZg_crapefgr    TFuse_value_regex_argsc                 C  sp   t tdtdtdd}|r2|j|||d}n|j||d|d}|rX|d ksTt|}t |}t|| d S )Nr   efghhelor   )r%   regexr    TrH   r    )r   r   r'   r(   r)   r*   )r/   
to_replacevaluesr6   r    rE   dfr5   r   r   r   test_regex_replace_list_obj8   s    *z0TestDataFrameReplace.test_regex_replace_list_objc           	      C  s^  t |}ddg}tjdg}ttdtdtdd}t |}|j||dd	}t |d dd
tjtjgddddgd}t|| ddg}ddg}|j||dd	}t |d ddddgd}t|| dddg}dddg}|j||dd	}t |d ddddgd}t|| dddg}dddg}|j||d}t |d ddddgd}t|| d S )Nr8   r   r9   r   r   Zhalor   TrH   r   r;   r<   r=   r>   (a|b)r?   r@   a_crapb_craprA   r   (b)rH   r%   )r   r   r   r   r   r'   r)   r*   )	r/   r   dfmixto_replace_resrK   Zmix2Zdfmix2resexpecr   r   r   test_regex_replace_list_mixedp   s8    





z2TestDataFrameReplace.test_regex_replace_list_mixedc                 C  s  t |}ddg}tjdg}| }|j||ddd}|d ks@tt |d ddtjtjgd}t|| dd	g}d
dg}| }|j||ddd}|d kstt |d ddddgd}t|| dddg}d
ddg}| }|j||ddd}|d kstt |d ddddgd}t|| dddg}d
ddg}| }|j||dd}|d ksbtt |d ddddgd}t|| d S )Nr8   r   r9   Tr    rH   r   r   r>   rO   r?   r@   rP   rQ   rA   rR   rH   r%   r    )r   r   r   r&   r'   r(   r)   r*   )r/   r   rT   rU   rK   rV   r3   rW   r   r   r   %test_regex_replace_list_mixed_inplace   s:    




z:TestDataFrameReplace.test_regex_replace_list_mixed_inplacec                 C  s  t |}|jddidtjidd}| }|jddidtjiddd}|d ksRtt |d ddtjtjg|d d}t|| t|| |jdd	idd
idd}| }|jdd	idd
iddd}|d kstt |d ddddg|d d}t|| t|| |jdd	idd
id}| }|jdd	idd
idd}|d ksPtt |d ddddg|d d}t|| t|| t |d tjdddg|d d}|jddtjidd}| }|jddtjiddd}|d kstt|| t|| |jddtjidd}| }|jddtjidd}|d ksHtt |d tjdddg|d d}t|| t|| d S )Nr   r8   TrN   rY   r   r   r   r>   z\1tyz.tyrS   rZ   .rI   r   r'   r   r   r&   r(   r)   r*   )r/   r   rT   rV   res2r3   rW   r   r   r   test_regex_replace_dict_mixed   sx            z2TestDataFrameReplace.test_regex_replace_dict_mixedc           	      C  s   t |}|jddtjiidd}| }| }|jddtjiiddd}|d ksVt|jddtjiid}|jddtjiidd}|d kstt |d ddtjtjg|d d	}t|| t|| t|| t|| d S )
Nr   r8   TrN   rY   rI   r   r   r   r]   )	r/   r   rT   rV   r^   Zres4r3   res3rW   r   r   r   test_regex_replace_dict_nested  s(      z3TestDataFrameReplace.test_regex_replace_dict_nestedc                 C  sR   |}t ddddgi|d}t ddddgi|d}|jd	d
idd}t|| d S )NfirstabcZbcaZcabdtypez.bczbc.zc.br   r\   TrN   r   r'   r)   r*   )r/   any_string_dtypere   rL   r6   r5   r   r   r   2test_regex_replace_dict_nested_non_first_character  s
    zGTestDataFrameReplace.test_regex_replace_dict_nested_non_first_characterc                 C  sT   t dddddgdd}t dddddgdd}|ddddi}t|| d S )	NQT   )Typetmpr      rl   )ri   rj   rf   r/   rL   r6   r5   r   r   r   %test_regex_replace_dict_nested_gh4115#  s    z:TestDataFrameReplace.test_regex_replace_dict_nested_gh4115c                 C  s   t |}t |d ttjgd tjtjtjdgd}|jddgtjdd}| }| }|jddgtjddd	}|d kst|jddgtjdd
}|d kstt|| t|| t|| d S )Nr   r   r   r   r8   za|bTrN   rI   rZ   )	r   r   arrayr   r'   r&   r(   r)   r*   )r/   r   rL   rW   rV   r^   r`   r3   r   r   r   !test_regex_replace_list_to_scalar)  s4         z6TestDataFrameReplace.test_regex_replace_list_to_scalarc                 C  s   t |}|jdddd}| }|jddddd}|d ks>t| }|jdddd}|d ksbtt |d ddddg|d	 d
}t|| t|| t|| d S )Nr8   r   TrN   rY   rZ   r   r   r   r   )r   r'   r&   r(   r)   r*   r/   r   rL   rV   r^   r3   r`   rW   r   r   r   !test_regex_replace_str_to_numericA  s     z6TestDataFrameReplace.test_regex_replace_str_to_numericc                 C  s   t |}|jddgddd}| }|jddgdddd}|d ksFt| }|jddgddd}|d ksntt |d ddddgddtjd	gd
}t|| t|| t|| d S )Nr8   r   r   TrN   rI   rZ   r   r   r   )r   r'   r&   r(   r   r   r)   r*   rs   r   r   r   (test_regex_replace_regex_list_to_numericP  s     z=TestDataFrameReplace.test_regex_replace_regex_list_to_numericc           
      C  s   t |}tddi}tdtji}|j||dd}| }|j||ddd}|d ksXt| }|j||dd}|d ks|tt |d ddtjtjg|d d	}	t||	 t||	 t||	 d S )
Nr   r8   TrN   rY   rZ   r   r   r   )	r   r   r   r   r'   r&   r(   r)   r*   )
r/   r   rL   s1s2rV   r^   r3   r`   rW   r   r   r   $test_regex_replace_series_of_regexes`  s     z9TestDataFrameReplace.test_regex_replace_series_of_regexesc                 C  sV   t |}t ddddg|d |d d}|dd}t|| |jjtjksRtd S )	Nr   rn   rk   r:   r   r   r   r   )	r   r'   r)   r*   r   re   r   Zobject_r(   )r/   r   rL   rW   rV   r   r   r   /test_regex_replace_numeric_to_object_conversionr  s
     zDTestDataFrameReplace.test_regex_replace_numeric_to_object_conversionrJ    )rz   ,)r{   rz   c                 C  sb   t dddgdddgdddgd}|j|d}t d	ddgdtjdgdddgd}t|| d S )
Nz1,000r   3rz   r   r   col1col2col3rN   Z1000r   r'   r   r   r)   r*   )r/   rJ   rL   r5   r6   r   r   r   +test_joint_simple_replace_and_regex_replacey  s    
z@TestDataFrameReplace.test_joint_simple_replace_and_regex_replacemetacharz[]z()z\dz\wz\sc                 C  sB   t d|dgi}|d|dii}t dddgi}t|| d S )Nr   elseZparenrf   )r/   r   rL   r5   r6   r   r   r   test_replace_regex_metachar  s    z0TestDataFrameReplace.test_replace_regex_metacharzdata,to_replace,expectedZxaxZxbxr   r   r   ZxcxZxdxz^\s*$c           	      C  s:   |}|||d}|j |dd}|||d}t|| d S )Nrd   TrN   r'   r)   assert_equal)	r/   datarJ   r6   frame_or_seriesrg   re   objr5   r   r   r   test_regex_replace_string_types  s
    z4TestDataFrameReplace.test_regex_replace_string_typesc                 C  s  t j|d d d< t j|d dd < |t jd}t||d t|dt j| t j|d d d< t j|d dd < d|d d d< tddgd}t||dd	 td
tdfdtdfg}|d
t j}tt jtdfdtdfg}t|| d S )Nr   r   r       חBr   r   )index   -Z20150101Z20150102)	r   r   r'   r)   r*   r+   r   pdto_datetime)r/   r0   zero_filledrL   df1Zexpected_dfr   r   r   test_replace  s$    z!TestDataFrameReplace.test_replacec                 C  s   t dt dt dd}t|}ddg}tjdg}|||}tdd	tjtjgdd
ddgddddgd}t|| dd
g}ddg}|||}tdd	ddgddddgddddgd}t|| d S )Nr   rF   rG   r   r\   rB   r9   r   r   rC   rD   r;   r<   r=   rA   )r   r   r   r   r'   r)   r*   )r/   r   ZdfobjrU   rK   rV   rW   r   r   r   test_replace_list  s,    





z&TestDataFrameReplace.test_replace_listc              	   C  s   t ddgg tjdgg}td|i}t||}|}|g tj}t|| d}tj	t
|jddd |tjg i W 5 Q R X tj	t
|jd	dd |tjd
dgi W 5 Q R X d S )Nr   r   rn   colzwNumPy boolean array indexing assignment cannot assign {size} input values to the 1 output values where the mask is truer   )sizematchrk   dummyZalt)r   r   r   r   r)   get_objr'   r   pytestraises
ValueErrorformat)r/   r   Zserr   r6   r5   msgr   r   r   test_replace_with_empty_list  s    z1TestDataFrameReplace.test_replace_with_empty_listc                 C  s   t ddddddd}|dddd}t ddddddd}t|| |d| }t|| t ddddddd}tddd}||ddd}t ddddddd}t|| ||| }t|| d S )	N        rn   r          @r   )zeroone      ?      ?)r   r'   r)   r*   meanr   )r/   rL   r5   r6   sr   r   r   test_replace_series_dict  s    z-TestDataFrameReplace.test_replace_series_dictc                 C  sT   t dddgdddgg}dddd}||}ttjgd }|j}t|| d S )Nr"   barbahrn   rk   r:   )r"   r   r   )r   r'   r   r   int64dtypesr)   assert_series_equal)r/   rL   mreprW   rV   r   r   r   test_replace_convert	  s    
z)TestDataFrameReplace.test_replace_convertc                 C  s   |}t j|jdd|jdf< t j|jdd |jdf< |t jd}|jdd}t|| t|dt j| |t jd}|jdd}t|| t|dt j| d S )	Nr   r!   r"   r#   r   ir$   r   )	r   r   r,   r-   r.   r'   r+   r)   r*   )r/   r1   r4   r5   r6   r   r   r   test_replace_mixed  s    z'TestDataFrameReplace.test_replace_mixedc                 C  s   t tddgddtddgddd}t tddgddtd	dgddd}|dd	}t|| |jdd	d
d}|d kstt|| d S )Nr   r   float64rd   r   rn   r   r   r   r   Tr   )r   r   r'   r)   r*   r(   )r/   rL   r6   r5   r3   r   r   r   &test_replace_mixed_int_block_upcasting!  s    z;TestDataFrameReplace.test_replace_mixed_int_block_upcastingc                 C  s   t tddgddtddgddtddgddd	}t tddgddtd
dgddtddgddd	}|dd
}t|| d S )Nr   r   r   rd   r   rn   r   rk   r   r   Cr   r   r   r'   r)   r*   ro   r   r   r   &test_replace_mixed_int_block_splitting7  s    z;TestDataFrameReplace.test_replace_mixed_int_block_splittingc                 C  s   t tddgddtddgddd}t tdd	gd
dtddgddd}|dd	}t|| t td	dgd
dtdd	gd
dd}|ddgd	dg}t|| d S )Nr   r   r   rd   r   rn   r   r   r"   objectrk   r   r   ro   r   r   r   test_replace_mixed2K  s&    z(TestDataFrameReplace.test_replace_mixed2c                 C  s|   t tddgddtddgddd}|d|  }| d}| }|d |jd< |d |jd	< t	|| d S )
Nr:   r   r   rd   r   r   r   r   rn   )rn   rn   )
r   r   r'   r   to_dictr&   astyper,   r)   r*   )r/   rL   r5   r6   r   r   r   r   test_replace_mixed3f  s     z(TestDataFrameReplace.test_replace_mixed3c                 C  sX   t dddtjgddddgd}|d	 d
|d	< |dtj}t|d	 |d	  d S )Nrn   rk   r:   Zsomestringshereher   r   Int64rz   )r   r   r   r   r'   r)   r   r/   rL   rV   r   r   r   1test_replace_nullable_int_with_string_doesnt_castr  s     zFTestDataFrameReplace.test_replace_nullable_int_with_string_doesnt_castre   booleanr   ZFloat64c                 C  sV   t dddg|d}tdddg|d}|dd}tdddg|d}t|| d S )	Nrn   r   rd   r   r   xr   X)r   r   r'   r)   r*   )r/   re   Znullable_serrL   r5   r6   r   r   r   !test_replace_with_nullable_columnz  s
    z6TestDataFrameReplace.test_replace_with_nullable_columnc                 C  sf   t dtddi}t dddddgi}|ddddi}t|| |ddd}t|| d S )	Nr   rn   r   r   rk   r:   r   )rn   r   r   r   r'   r)   r*   ro   r   r   r   test_replace_simple_nested_dict  s    z4TestDataFrameReplace.test_replace_simple_nested_dictc                 C  sj   t dtddi}t dddddgi}|dddd	}t|| |ddddd	i}t|| d S )
Nr   rn   r   r   rk   r:   r   r   )rn   r   r   ro   r   r   r   6test_replace_simple_nested_dict_with_nonexistent_value  s    zKTestDataFrameReplace.test_replace_simple_nested_dict_with_nonexistent_valuec                 C  sN   t ddd giddi}|tjd i}t ddd gitd}t|| d S )Nr%   *   r   rd   )r   r   r'   r   NAr   r)   r*   r/   rL   r5   r6   r   r   r   test_replace_NA_with_None  s    z.TestDataFrameReplace.test_replace_NA_with_Nonec                 C  sB   t tjtjg}|tjd tjd i}t d d g}t|| d S N)r   r   NaTr'   r   NaNr)   r*   r   r   r   r   test_replace_NAT_with_None  s    z/TestDataFrameReplace.test_replace_NAT_with_Nonec                 C  s   |j d }|j d }tj|j d< d|j d< |jtjdid}|jjtjdidj}t|| |jtjdddid}| }d|j d< d|j d< |}t|| ||j d< ||j d< d S )Nr   rn   r   rn   r   rJ   r   )r,   r   r   r'   rj   r)   r*   r&   )r/   r0   Z
orig_valueZorig2r5   r6   r2   r   r   r   test_replace_value_is_none  s    





z/TestDataFrameReplace.test_replace_value_is_nonec                 C  s   |  tj}tj|d d d< tj|d dd < |tjd}t||d t|dtj| tj|d d d< tj|d dd < d|d d d< |d }tj||dk< ||d< |jdd}t||jdd d S )Nr   r   r   r   r   bfill)method)	r&   r   r   float32r   r'   r)   r*   r+   )r/   r0   r2   r   r   r5   r   r   r   test_replace_for_new_dtypes  s    z0TestDataFrameReplace.test_replace_for_new_dtypesz"frame, to_replace, value, expectedZintsrn   rk   r   rd   Zboolscomplexy              ?y               @y              @y                Z
datetime64i  r      r   i     r!   r"   )dtstrr   20130101
US/EasternZperiodstzr   20130102r   2013010420130103r   r   g      @c                 C  s    t |d||}t|| d S )Nr'   )getattrr)   r*   )r/   framerJ   r%   r6   r5   r   r   r   test_replace_dtypes  s    cz(TestDataFrameReplace.test_replace_dtypesc              	     s  t jddd ddddtt jdt jgdddgddd	gd}| } fd
d| D }t|t| |dddgdddg}tt jdt jgdddgddd	gd}t|| ddddtt jdt jgdddgddd	gd}|t j}fdd| D }t|t| t jddg dddg| }| }t	t
 D ],}|j | | dd}|d ksZtqZt|| d}tjt|d | dd   W 5 Q R X d S )Nr   rz   r   r   missingrk   r   asdffdc                   s&   i | ]\}}||  | | qS r   r'   .0kvto_reprK   r   r   
<dictcomp>=  s      zLTestDataFrameReplace.test_replace_input_formats_listlike.<locals>.<dictcomp>c                   s$   i | ]\}}|| tj | qS r   )r'   r   r   r   )rK   r   r   r   L  s      Tr   z:Replacement lists must match in length\. Expecting 3 got 2r   rn   )r   r   r   infr'   itemsr)   r*   r&   r   lenr(   r   r   r   )r/   rL   filledr6   r5   ir3   r   r   r   r   #test_replace_input_formats_listlike5  s>       
z8TestDataFrameReplace.test_replace_input_formats_listlikec              	     s   t tjdtjgdddgdddgd}tjddd | d} fdd	| D }t|t | d
}tj	t
|d | tjddg W 5 Q R X tjddg | d}| }tt D ]$}|j | ddd}|d kstqt|| d S )Nr   rk   r   rz   r   r   r   c                   s"   i | ]\}}||  | d qS )r   r   r   r   r   r   r   e  s      zJTestDataFrameReplace.test_replace_input_formats_scalar.<locals>.<dictcomp>z.value argument must be scalar, dict, or Seriesr   r   Tr   )r   r   r   r   r'   r   r)   r*   r   r   	TypeErrorr&   r   r   r(   )r/   rL   r   r6   r   r5   r   r3   r   r  r   !test_replace_input_formats_scalar]  s"     z6TestDataFrameReplace.test_replace_input_formats_scalarc                 C  s   d S r   r   )r/   r   r   r   test_replace_limitu  s    z'TestDataFrameReplace.test_replace_limitc                 C  sR   t dddddd}ddd	d
dd}t d
dd	ddd}||}t|| d S NStrongly AgreeAgreeNeutralDisagreeStrongly Disagree)r   rn   rk   r:   r   r   rk   r:   r   rn   )r  r	  r  r  r
  r   r'   r)   r   r/   Zanswerweightsr6   r5   r   r   r   test_replace_dict_no_regexx  s"    

z/TestDataFrameReplace.test_replace_dict_no_regexc                 C  sV   t dddddd}t ddd	d
dd}t d
dd	ddd}||}t|| d S r  r  r  r   r   r   test_replace_series_no_regex  s&    		
z1TestDataFrameReplace.test_replace_series_no_regexc                 C  s   t dtjdgi}|jtjdddid}|jdtjfddgd}|jdtjgddgd}t dddgi}t|| t|| t|| d S )Nr   rn   r   r   r   rJ   r%   r   r   r   r'   r)   r*   )r/   rL   Zres1r^   r`   r6   r   r   r   6test_replace_dict_tuple_list_ordering_remains_the_same  s    zKTestDataFrameReplace.test_replace_dict_tuple_list_ordering_remains_the_samec                 C  sP   t ddddgddddgddddgddddgd}|d	di}t|| d S )
Nrn   rk   r:   0ZvrZbtZvo)ZfolZT_oppZT_DirZT_Enhz\Drf   r   r   r   r   )test_replace_doesnt_replace_without_regex  s    



z>TestDataFrameReplace.test_replace_doesnt_replace_without_regexc                 C  sF   t ddgtdd}|dd}t ddg|jd}t|| d S )NTFabr   r   )r   r   r'   r   r)   r*   r   r   r   r   test_replace_bool_with_string  s    z2TestDataFrameReplace.test_replace_bool_with_stringc                 C  s2   t tjdddk}|dd}t|| d S )Nrk   r   r   Zfdsa)r   r   randomrandr'   r)   r*   r/   rL   r5   r   r   r   (test_replace_pure_bool_with_string_no_op  s    z=TestDataFrameReplace.test_replace_pure_bool_with_string_no_opc                 C  sD   t tjdddk}|dd}t tjdtd}t|| d S )Nrk   r   FT)rk   rk   rd   )	r   r   r  r  r'   onesboolr)   r*   r   r   r   r   test_replace_bool_with_bool  s    z0TestDataFrameReplace.test_replace_bool_with_boolc                 C  sL   t ddgddgd}|ddd}t ddgddgd}t|| d S )NTFr   rn   Zasdbyes)r   Trf   r   r   r   r   %test_replace_with_dict_with_bool_keys  s    z:TestDataFrameReplace.test_replace_with_dict_with_bool_keysc                 C  sV   t ddgddgd}|ddi}t|| |d ddi}t||d  d S )	Nrn   rk   r:   r   )Y0ZY1Zreplace_stringtestr!  )r   r'   r)   r*   r   r  r   r   r   !test_replace_dict_strings_vs_ints  s
    z6TestDataFrameReplace.test_replace_dict_strings_vs_intsc                 C  s<   t dddgi}|tjtj gtj}|}t|| d S )Nr   T)r   r'   r   r   r   r)   r*   )r/   rL   rrB   r   r   r   test_replace_truthy  s    z(TestDataFrameReplace.test_replace_truthyc              	   C  sj   t dttddi}|dtttddtddi}|tttddtdd}t|| d S )Nr   rn   r   rk      )r   r   r   r'   dictzipr)   r*   r   r   r   r   -test_nested_dict_overlapping_keys_replace_int  s    $ zBTestDataFrameReplace.test_nested_dict_overlapping_keys_replace_intc                 C  sp   t dd}|t}t ddt}td|i}|tt||}|dtt||i}t	|| d S )Nrn   r   rk   r&  r   )
r   Zaranger   r   r   r'   r'  r(  r)   r*   )r/   r   ZastrZbstrrL   r5   r6   r   r   r   -test_nested_dict_overlapping_keys_replace_str  s    
zBTestDataFrameReplace.test_nested_dict_overlapping_keys_replace_strc                 C  s   t ddddgi}|ddddi}t ddddgi}t|| t ddddgi}|dddd	i}t ddddgi}t|| d S )
Nr   TFYN)TFr   rn   r  rf   )r/   rL   rV   expectr   r   r   test_replace_swapping_bug  s    z.TestDataFrameReplace.test_replace_swapping_bugc                   s   dt jddddt jddddt jddddt jdd	ddt jddddt jddddt jd
ddddi tdddddddgdgd}t|jjt d  ksttd fdd|jjD i}|jd dkst|	 }t
|| d S )Nfnamei     M)yearmonthfreqrn   i  r   r   i  	   out_augmented_AUG_2011.jsonout_augmented_JAN_2011.jsonout_augmented_MAY_2012.jsonout_augmented_SUBSIDY_WEEK.jsonout_augmented_AUG_2012.jsonout_augmented_MAY_2011.jsonout_augmented_SEP_2013.jsonr;  r=  r:  r9  r<  r7  r8  r-   c                   s   g | ]} d  | qS r/  r   r   r   r   r   r   
<listcomp>  s     z<TestDataFrameReplace.test_replace_period.<locals>.<listcomp>r   z	Period[M])r   Periodr   setr/  rK   keysr(   r   r'   r)   r*   ro   r   rA  r   test_replace_period   s<      	 
z(TestDataFrameReplace.test_replace_periodc              	     s   dt dt dt dt dt dt dt dd	i td
ddddddgdgd}t|jjt d  kspttd fdd|jjD i}| }t	|| d S )Nr/  z2011-08z2011-01z2012-05z2011-04z2012-08z2011-05z2013-09r6  r;  r=  r:  r9  r<  r7  r8  r>  c                   s   g | ]} d  | qS r?  r   r@  rA  r   r   rB  <  s     z>TestDataFrameReplace.test_replace_datetime.<locals>.<listcomp>)
r   r   rD  r/  rK   rE  r(   r'   r)   r*   ro   r   rA  r   test_replace_datetime"  s2    	 
z*TestDataFrameReplace.test_replace_datetimec              	   C  s:  t tdddddtjdgd}|tjd}t tddddtdddgd	d
d}t|| |d}t|| |dtj}t tddddtjtjdgd}t|| |t	dddt	ddd}t t	dddt	dddt	dddgdtjdgd}t|| |
 }tj|jd< |dtjit	ddd}t|| |
 }tj|jd< tjtdd  |dtjit	ddd}W 5 Q R X t t	dddt	dddt	dddgdtjdgd}t|| |
 }tj|jd< |dtjit	d}t t	dddt	dt	dddgdtjdgd}t|| d S )Nr   r:   r   r   r   rk   r   rn   r   rd   r   r   r   r   r   r   zmismatched timezoner   z
US/Pacific)r   r	   r   r   r'   r   r)   r*   r+   r   r&   r,   r   r   Zassert_produces_warningFutureWarningr   r   r   r   test_replace_datetimetz@  s    








 








z,TestDataFrameReplace.test_replace_datetimetzc              	   C  sh   t |}t||i  t||tg td t||di i t||tdi i d S )Nrd   r   )r   r)   r*   r'   r   r   )r/   r   rL   r   r   r    test_replace_with_empty_dictlike  s
    z5TestDataFrameReplace.test_replace_with_empty_dictlikezto_replace, method, expectedr   r   g      @Zffillpad)rn   rk   c                 C  sL   t dddgdtjdgdddgd	}|j|d |d
}t |}t|| d S )Nr   rn   rk   r   r   r   r   r   r   )rJ   r%   r   r  )r/   rJ   r   r6   rL   r5   r   r   r   test_replace_method  s    "$z(TestDataFrameReplace.test_replace_methodzreplace_dict, final_datac              	   C  s   t ddgddggddgdd}t|}tj|d d df ddgd	}|d dkrZddgnddg}tj|d d df |d	}t ||d
}||d}t|| d}	tj	t
|	d t|| W 5 Q R X |j|ddd}
|
d kst
t|| d S )Nrn   rk   r   r   category)r-   re   r   r:   )
categoriesr   zHAttributes of DataFrame.iloc\[:, 0\] \(column name=\"a\"\) are differentr   Tr   )r   r   rq   r   ZCategoricalr'   r)   r*   r   r   r(   )r/   Zreplace_dictZ
final_datarL   r   Zex_catr   r6   r5   r   r3   r   r   r   "test_categorical_replace_with_dict  s    
z7TestDataFrameReplace.test_categorical_replace_with_dictzdf, to_replace, expr   r&  )r~   r   )r   r   r&  4567)rP  rQ  rR  c                 C  s*   t |}t |}||}t|| d S r   rf   )r/   rL   rJ   expr6   r5   r   r   r   test_replace_commutative  s    
z-TestDataFrameReplace.test_replace_commutativereplacerZ20170827c                 C  sb   t |r.|jjdk r.|jtjjt	dd t
dg}|||d}t
|g}t|| d S )Nr0  znp.putmask doesn't coerce dtype)reasonr   r   )r   Zisscalarre   itemsizenodeZ
add_markerr   markZxfailr   r   r'   r)   r*   )r/   requestrV  rL   r5   r6   r   r   r   test_replace_replacer_dtype   s     

z0TestDataFrameReplace.test_replace_replacer_dtypec                 C  sP   t ddddddgidd}|dd	}t dd	ddddgidd}t|| d S )
Ngrprn   rk   r:   r   r   r   rd   
   rf   r   r   r   r   !test_replace_after_convert_dtypes  s    z6TestDataFrameReplace.test_replace_after_convert_dtypesc              	   C  sJ   t dddgdddgd}d}tjt|d	 |d
d  W 5 Q R X d S )Nr   zb r   zd ze zf )r   twozZExpecting 'to_replace' to be either a scalar, array-like, dict or None, got invalid type.*r   c                 S  s   |   S r   )strip)r   r   r   r   <lambda>'      zFTestDataFrameReplace.test_replace_invalid_to_replace.<locals>.<lambda>)r   r   r   r  r'   )r/   rL   r   r   r   r   test_replace_invalid_to_replace  s
    z4TestDataFrameReplace.test_replace_invalid_to_replacefloatr   r   r%   c                 C  s<   t td|d}|jd tj tjg|d}t|| d S )Nrk   rd   r  )r   r   eyer'   r   r)   r*   )r/   re   r%   rL   r5   r   r   r   "test_replace_no_replacement_dtypes)  s    z7TestDataFrameReplace.test_replace_no_replacement_dtypesreplacementc                 C  s|   t dddgdddgddd	gd
}td|_t dddgdddg|dd	gd
}td|_|d d||d< t|| d S )Nrn   rk   r:   r   r   r&  r   r0  r5  )r   A1r   ZAABr   )r   r   r-   r'   r)   r*   )r/   rh  r5   r6   r   r   r   #test_replace_with_duplicate_columns1  s    "

z8TestDataFrameReplace.test_replace_with_duplicate_columnsz2020-01c                 C  sB   t d|gd i}t||}| }|dd}t|| d S )NZPerr:   r   r   )r   r)   r   r&   r'   r   )r/   r   r%   r   r6   r5   r   r   r   test_replace_ea_ignore_float@  s
    z1TestDataFrameReplace.test_replace_ea_ignore_floatc                 C  sP  ddddgddddgd	d
ddgddddgddddgd}t |dddd}|d jjddddgdd|d< |d jjddddgdd|d< ddddgddddgd	d
ddgddddgddddgd}t |dddd}|d jjddddgdd|d< |d jjddddgdd|d< |dd}|dd}|dd}t|| d S )!zt
        Test for #23305: to ensure category dtypes are maintained
        after replace with direct values
        rn   rk   r:   r   r   r   r   r   g      ?g      @g      @g      @cat1cat2Zcat3Zcat4obj1obj2Zobj3Zobj4)r~   r   r   col4Zcol5r   rM  )r   rp  r   T)Zorderedrp  zcatXobj9N)r   r   catZreorder_categoriesr'   r)   r*   r/   Z
input_dictZinput_dfexpected_dictr6   r5   r   r   r    test_replace_value_category_typeJ  sL    







 


 








 


 
z5TestDataFrameReplace.test_replace_value_category_typec                 C  sv   dgdgdgd}t |ddddd}dgdgd	gd}t |ddddd}|ddd	d
}t|| dS )zf
        Test to ensure category dtypes are maintained
        after replace with dict values
        r   rn  rl  r}   rq  rM  rr  rt  rs  )r   rn  rl  N)r   r   r'   r)   r*   rv  r   r   r   test_replace_dict_category_type}  s    



z4TestDataFrameReplace.test_replace_dict_category_typec                 C  sH   t dddg}td}|j|didd}t dddg}t|| d S )Nr   r   r   z^a$rr  TrN   )r   recompiler'   r)   r*   )r/   rL   rH   r5   r6   r   r   r    test_replace_with_compiled_regex  s
    
z5TestDataFrameReplace.test_replace_with_compiled_regexc                 C  sZ   t dtddtddgi}|dtdddii}t dddgi}t|| d S )Nr   r   rn   r   )r   r   Intervalr'   r)   r*   r   r   r   r   test_replace_intervals  s     z+TestDataFrameReplace.test_replace_intervalsc                 C  sN   dddddi}t dtdi}||}t dtdi}t|| d S )NZpositivern   r   )u   正面u   中立u   负面r:   )r   r   r  r'   r)   r*   )r/   Zcolumns_values_mapr   r5   r6   r   r   r   test_replace_unicode  s
    
z)TestDataFrameReplace.test_replace_unicodec                 C  s8   |dg d}| }|d tji}t|| d S )Nr=   z|S)r   r&   r'   r   r   r)   r   )r/   r   r   r6   r   r   r   test_replace_bytes  s    z'TestDataFrameReplace.test_replace_bytesz!data, to_replace, value, expectedr   boxc           	      C  s0   ||}||}| |||}t|| d S r   r   )	r/   r   rJ   r%   r6   r  r   r   r5   r   r   r   !test_replace_list_with_mixed_type  s    z6TestDataFrameReplace.test_replace_list_with_mixed_typeN)`__name__
__module____qualname__r7   r   rZ  parametrizer   r   rM   rX   r[   r_   ra   rh   rp   rr   rt   ru   rx   ry   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   Zint32Zint16r   r   r	   r   r   r   r  r  r  r  r  r  r  r  r  r   r#  r%  r)  r*  r.  rF  rG  rI  rJ  rL  rO  rU  Zint8r   r   r\  r_  rd  rg  rj  rC  r}  rk  rx  ry  r|  r~  r  r  r   tuplerq   r  r   r   r   r   r       s  






%)(E 


	

& 











b
(
	
"X	$$ 
2







	3	r   c                	   @  s   e Zd Zejdededdedeeddgejddej	fdgejd	d
dgejdd
dgejdd
dgdd Z
ejddd
gdd Zdd ZdS )TestDataFrameReplaceRegexr   r   rF   r   r   zto_replace,valuer8   )r>   z\1\1\1compile_regexTFregex_kwargr    c                 C  s   t |}| }|rt|}|r,|}	d }nd}	|j||||	d}
|rV|
d ksRt|}
|tjkrhtj}nd}||j|d dkdf< t	
|
| d S )NTrY   z...r   r\   )r   r&   rz  r{  r'   r(   r   r   locr)   r*   )r/   r   rJ   r%   r  r  r    rL   r6   rH   r5   Zexpected_replace_valr   r   r   test_regex_replace_scalar  s"    

z3TestDataFrameReplaceRegex.test_regex_replace_scalarrH   c                 C  s   t dgdgd}t dgdgd}|jdd|d}t|| t dgdgd}t dgdgd}|jdd|d}t|| d S )Nr  r   rn   )rJ   r%   rH   1rf   )r/   rH   r   Zexpected_df1Z
result_df1Zdf2Zexpected_df2Z
result_df2r   r   r   test_replace_regex_dtype_frame  s    z8TestDataFrameReplaceRegex.test_replace_regex_dtype_framec                 C  sZ   t dddgdddgd}|dtjd}t dtjdgtjddgd}t|| d S )Nr   rn   rk   r   r  r   r   r   r   r   +test_replace_with_value_also_being_replaced  s    zETestDataFrameReplaceRegex.test_replace_with_value_also_being_replacedN)r  r  r  r   rZ  r  r   r   r   r   r  r  r  r   r   r   r   r    s"    
r  )
__future__r   r   rz  numpyr   r   Zpandas.compatr   Zpandasr   r   r   r   r   r	   Zpandas._testingZ_testingr)   Zfixturer   r   r   r  r   r   r   r   <module>   s2              4