U
    NZf                     @   s  d Z ddlmZ ddlZddlmZ ddlmZ ej	
dZedd Zedd	 Zd
d Zeej	ddedddggdddgdfdeddddddggddddddgdfdedddddddggdddddd d!gdfgd"d# Zeej	d$d%dddgedd&d&gd'd(d)ggdddgdfd*ddddddgedd&d+d,d-d.gd'd(d)d/d0d1ggdddddd2gdfd3dddddddgedd&d+d,d-d.d4gd'd(d)d/d0d1d5ggdddddd6d7gdfgd8d9 Zed:d; Zed<d= Zed>d? ZdS )@z
Tests that duplicate columns are handled appropriately when parsed by the
CSV engine. In general, the expected result is that they are either thoroughly
de-duplicated (if mangling requested) or ignored otherwise.
    )StringION)	DataFrameZpyarrow_skipc                 C   sL   | }d}|j t|dd}tdddddggd	d
dddgd}t|| d S )Nza,a,b,b,b
1,2,3,4,5,)sep               aa.1bzb.1zb.2columnsread_csvr   r   tmassert_frame_equalall_parsersparserdataresultexpected r   L/tmp/pip-unpacked-wheel-nbcvw55c/pandas/tests/io/parser/test_mangle_dupes.py
test_basic   s
    "r   c                 C   sH   | }d}t dddgdddggdd	d
gd}|t|}t|| d S )Nza,b,a
0,1,2
3,4,5r   r   r   r   r	   r
   r   r   r   r   )r   r   r   r   r   )r   r   r   r   r   r   r   r   test_basic_names   s
    "r   c              	   C   s>   | }d}t jtdd |jt|dddgd W 5 Q R X d S )Nz0,1,2
3,4,5Duplicate namesmatchr   r   namespytestZraises
ValueErrorr   r   )r   r   r   r   r   r   test_basic_names_raise'   s    r&   zdata,expectedza,a,a.1
1,2,3r   r   r   r   a.2r   r   z+a,a,a.1,a.1.1,a.1.1.1,a.1.1.1.1
1,2,3,4,5,6r	   r
      a.1.1za.1.1.1z	a.1.1.1.1z!a,a,a.3,a.1,a.2,a,a
1,2,3,4,5,6,7   a.4a.3za.5za.6c                 C   s"   | }| t|}t|| d S )N)r   r   r   r   )r   r   r   r   r   r   r   r   test_thorough_mangle_columns0   s    r-   zdata,names,expectedza,b,b
1,2,3r   123za,b,c,d,e,f
1,2,3,4,5,6cdef456za.1.1.1.1.1za,b,c,d,e,f,g
1,2,3,4,5,6,7g7za.2.1za.3.1c              	   C   s4   | }t jtdd |jt||d W 5 Q R X d S )Nr   r   r!   r#   )r   r   r"   r   r   r   r   r   test_thorough_mangle_namesM   s    "r:   c           	      C   s   d}| }dddg}t ||i}tdD ]t}t  }t|d D ]6}ddd|  t|d  }|jd|dddgd q<|||< |t| }t|| q&d S )	N0r   r   r   
Unnamed: 0.r   )loccolumnvalue)	r   rangemininsertr   r   Zto_csvr   r   )	r   Zorig_keyr   Z
orig_valueZdfir   jZcol_namer   r   r   !test_mangled_unnamed_placeholdersu   s    
rF   c              	   C   sP   | }d}| t|}tdddddddggd	d
dddddgd}t|| d S )Nz%a,a,a.1,a,a.3,a.1,a.1.1
1,2,3,4,5,6,7r   r   r   r	   r
   r(   r*   r   r'   r   r+   r,   za.1.2r)   r   r   r   r   r   r   $test_mangle_dupe_cols_already_exists   s    rG   c                 C   sD   | }d}| t|}tddddggdddd	gd
}t|| d S )Nz,Unnamed: 0,,Unnamed: 2
1,2,3,4r   r   r   r	   zUnnamed: 0.1r<   zUnnamed: 2.1z
Unnamed: 2r   r   r   r   r   r   0test_mangle_dupe_cols_already_exists_unnamed_col   s    
rH   )__doc__ior   r$   Zpandasr   Zpandas._testingZ_testingr   markZusefixturesZskip_pyarrowr   r   r&   Zparametrizer-   r:   rF   rG   rH   r   r   r   r   <module>   s   


	 	

