o
    _~#g                  
   @  s  d dl mZ d dlmZmZ d dlmZ d dlmZ d dlZd dl	m
Z
 d dlZd dlZd dlmZ d dlmZ d dlZd dlZd d	lmZ d d
lmZ d dlm  mZ d dlZd dlmZmZm Z m!Z!m"Z" d dl#m$Z% d dl&m'Z'm(Z( e r|ej)j*Z+g dZ,ej-de.dgdej-de.dgdej-de.dgdej-de.ddej-de.ddej-de.ddgZ/d5ddZ0dd Z1ej2dd e/D e3dd d! Z4ej2d"d# Z5ej2d$d Z6ej2d%d& Z7d6d(d)Z8d7d-d.Z9d/d0 Z:G d1d2 d2Z;G d3d4 d4Z<dS )8    )annotations)datetimetime)partial)BytesION)Path)URLError)
BadZipFile)using_pyarrow_string_dtype)is_platform_windows)	DataFrameIndex
MultiIndexSeriesread_csv)ArrowStringArrayStringArray).xls.xlsx.xlsm.xlsb.odsxlrdmarksopenpyxlpyxlsbodfcalaminepython_calamineread_extstrreturnboolc                 C  s   | j d } | dkr|dkrdS | dkr|dkrdS |dkr#| dvr#dS | dkr-|d	kr-dS |d	kr7| d
vr7dS | dkrA|dkrAdS dS )zm
    Filter out invalid (engine, ext) pairs instead of skipping, as that
    produces 500+ pytest.skips.
    r   r   r   Fr   r   >   r   r   r   r   >   r   r   r   T)values)enginer     r&   /var/www/static.ux5.de/https/Moving-Object-Detection-with-OpenCV/env/lib/python3.10/site-packages/pandas/tests/io/excel/test_readers.py_is_valid_engine_ext_pairF   s   
r(   c                 C  s    | j |f }tj|| jd}|S )z
    engine gives us a pytest.param object with some marks, read_ext is just
    a string.  We need to generate a new pytest.param inheriting the marks.
    r   )r$   pytestparamr   )r%   r    r$   	new_paramr&   r&   r'   _transfer_marks[   s   r,   c                 C  s*   g | ]}t D ]}t||rt||qqS r&   )read_ext_paramsr(   r,   ).0engextr&   r&   r'   
<listcomp>f   s    r1   )paramsidsc                 C     | j S )zS
    Fixture for Excel reader engine and read_ext, only including valid pairs.
    )r*   )requestr&   r&   r'   engine_and_read_exte   s   r6   c                 C  s   | \}}|S Nr&   r6   r%   r    r&   r&   r'   r%   u      r%   c                 C  s   | \}}|S r7   r&   r8   r&   r&   r'   r    {   r9   c                 C  s"   | dddd}t |dddd}|S )	zI
    Obtain the reference data from read_csv with the Python engine.
    iodatacsvz	test1.csvr   Tpython)	index_colparse_datesr%   )r   )datapathfilepathdf_refr&   r&   r'   rB      s   rB   
str | Nonec                 C  s   dS )Nnsr&   )r    r%   r&   r&   r'   get_exp_unit   s   rE   expectedr   Nonec                 C  s$   d | j _t||}| j || _ d S r7   )indexnamerE   as_unit)rF   r    r%   unitr&   r&   r'   adjust_expected   s   
rL   c                 C  s$   | dkr| tjjdd d S d S )Nr   z3Sheets containing datetimes not supported by pyxlsbreason)applymarkerr)   markxfail)r%   r5   r&   r&   r'   xfail_datetimes_with_pyxlsb   s   rR   c                   @  s  e Zd Zejdddd Zdd Zdd Zd	d
 Zdd Z	dd Z
ejdg dg dg dg dg dg dgdd Zejdddgddggdd Zdd Zdd Zd d! Zd"d# Zd$d% Zd&d' Zejd(d)d*gd+d, Zd-d. Zd/d0 Zd1d2 Zd3d4 Zd5d6 Zd7d8 Zd9d: Zd;d< Zejd=d)eg d>g d?g d>d@dAej dBgdCfdDdEe!e!dCee"g d>dDdFe"g d?dEdFe"g dGe#dFe"dHdIej dJge#dFdCfgdKdL Z$dMdN Z%dOdP Z&ejj'e( dQdRdSdT Z)ejdUi dVfdWdXidVfgdYdZ Z*d[d\ Z+ejd]d^ed_d`gifdaedbgdcfgddde Z,dfdg Z-dhdi Z.djdk Z/dldm Z0dndo Z1dpdq Z2ej3drdsdt Z4dudv Z5dwdx Z6dydz Z7ejd{d|d}d|gd|d}gd~dd~gd~dggdd Z8dd Z9dd Z:ejj;ejj<dd Z=e>j?ejj<dd Z@ejj<dd ZAejjBdd ZCdd ZDe>Eddd ZFdd ZGdd ZHdd ZIejddej dddgfdej gd fgdd ZJdd ZKdd ZLdd ZMdd ZNdd ZOdd ZPdd ZQdd ZRejdddd}dVgd}d)fddd)d}dVgd)fddd}dVgd}dVgd)fddd}dVgd}d)fddd)d)d}d*gfddd)d)dd fgdd ZSdd ZTdd ZUdd ZVddĄ ZWddƄ ZXddȄ ZYddʄ ZZdd̄ Z[d)S )TestReadersTautousec                 C  2   t tj|d}||ddd |td| dS )zG
        Change directory and set engine for read_excel calls.
        r%   r:   r;   excel
read_excelN)r   pdrY   chdirsetattrselfr%   r@   monkeypatchfuncr&   r&   r'   cd_and_set_engine      zTestReaders.cd_and_set_enginec           	      C  s   dd }| tjd| dddddd}td	| d
}t|}W d    n1 s+w   Y  |d ur7|}n||dd   }||ksEJ d S )Nc                 _  r4   r7   rW   )r^   argskwargsr&   r&   r'   parser   s   z,TestReaders.test_engine_used.<locals>.parserparser   r   r   r   xlsxxlsmxlsbxlsodstest1rb   )r\   rZ   	ExcelFileopenrY   )	r^   r    r%   r_   re   expected_defaultsfresultrF   r&   r&   r'   test_engine_used   s   zTestReaders.test_engine_usedc              	   C  s   ddiddiddiddiddid}|dv rt d}n|d	kr&t d
}nt d}|d urZtjt|d tjd| dd||dd   d W d    d S 1 sSw   Y  d S d S )Nfooabcd{   TrueTrg   >   r   r   z8open_workbook() got an unexpected keyword argument 'foo'r   z/load() got an unexpected keyword argument 'foo'z8load_workbook() got an unexpected keyword argument 'foo'matchrm   Sheet1r   ro   )
sheet_namer>   engine_kwargs)reescaper)   raises	TypeErrorrZ   rY   )r^   r    r%   rr   msgr&   r&   r'   test_engine_kwargs   s*   
"zTestReaders.test_engine_kwargsc                 C  s   d}t jt|d tjd| dddd W d    n1 sw   Y  t jt|d tjd| dd	gddd
 W d    d S 1 sDw   Y  d S )Nz Passing an integer for `usecols`rz   rm   r|   r      r}   r>   usecolsSheet2ro   r}   skiprowsr>   r   r)   r   
ValueErrorrZ   rY   r^   r    r   r&   r&   r'   test_usecols_int   s   "zTestReaders.test_usecols_intc                 C  sv   t || |ddg }t||| tjd| ddg dd}tjd| dd	gdg dd
}t|| t|| d S )NBCrm   r|   r   )r      r   r   r   ro   r   rR   rL   rZ   rY   tmassert_frame_equal)r^   r5   r%   r    rB   rF   df1df2r&   r&   r'   test_usecols_list   s   
	zTestReaders.test_usecols_listc                 C  s  t || |g d }t||| tjd| dddd}tjd| ddgddd	}t|| t|| |d
dg }t||| tjd| dddd}tjd| ddgddd	}t|| t|| tjd| dddd}tjd| ddgddd	}t|| t|| d S )NAr   r   rm   r|   r   zA:Dr   r   ro   r   r   r   zA,C,DzA,C:Dr   )r^   r5   r%   r    rB   rF   r   df3r&   r&   r'   test_usecols_str  sR   
	zTestReaders.test_usecols_strr   )r   ro   r   )r   r   ro   )ro   r   r   )ro   r   r   )r   r   ro   )r   ro   r   c                 C  sH   t || |ddg }t||| tjd| dd|d}t|| d S )Nr   r   rm   r|   r   r   r   )r^   r5   r%   r    r   rB   rF   rt   r&   r&   r'   .test_usecols_diff_positional_int_columns_order5  s   
z:TestReaders.test_usecols_diff_positional_int_columns_orderr   Dc                 C  s>   |ddg }t t||_tjd| d|d}t|| d S )Nr   r   rm   r|   r}   r   )rangelenrH   rZ   rY   r   r   )r^   r    r   rB   rF   rt   r&   r&   r'   .test_usecols_diff_positional_str_columns_orderE  s   z:TestReaders.test_usecols_diff_positional_str_columns_orderc                 C  s>   t || |}t||| tjd| ddd}t|| d S Nrm   r|   r   r}   r>   r   r^   r5   r%   r    rB   rF   rt   r&   r&   r'   test_read_excel_without_slicingM  s
   
z+TestReaders.test_read_excel_without_slicingc                 C  sH   t || |ddg }t||| tjd| dddd}t|| d S )Nr   r   rm   r|   r   zA,D:Er   r   r   r&   r&   r'   test_usecols_excel_range_strV  s   
z(TestReaders.test_usecols_excel_range_strc                 C  sL   d}t jt|d tjd| ddd W d    d S 1 sw   Y  d S )NzInvalid column name: E1rz   rm   r|   zD:E1r   r   r   r&   r&   r'   $test_usecols_excel_range_str_invalida  s   "z0TestReaders.test_usecols_excel_range_str_invalidc                 C  sT   d}t jt|d tjd| ddgddgd W d    d S 1 s#w   Y  d S )Nz(list indices must be integers.*, not strrz   rm   r|   r   r   r   r)   r   r   rZ   rY   r   r&   r&   r'   test_index_col_label_errorg  s   "z&TestReaders.test_index_col_label_errorc                 C  s<   t jd| ddd}tg dtg ddd}t|| d S )Nrm   Sheet3r   r   )r   r   r   EFrI   columnsrH   )rZ   rY   r   r   r   r   r^   r    rt   rF   r&   r&   r'   test_index_col_strr  s
   zTestReaders.test_index_col_strc                 C  sR   t jd| dg dd}tg dtg gd g gd g ddd}t|| d S )	Nrm   r   r   r   )r   r   r   r   levelscodesnamesr   )rZ   rY   r   r   r   r   r   r&   r&   r'   test_index_col_emptyz  s   z TestReaders.test_index_col_emptyr>   Nr   c                 C  sT   t jd| d|d}tg dg dgg dd}|r"||j| }t|| d S )Nrm   Sheet4r   )i1ax)i2by)z
Unnamed: 0col1col2r   )rZ   rY   r   	set_indexr   r   r   )r^   r    r>   rt   rF   r&   r&   r'   test_index_col_with_unnamed  s   
z'TestReaders.test_index_col_with_unnamedc                 C  sL   d}t jt|d tjd| dgd W d    d S 1 sw   Y  d S )NzEUsecols do not match columns, columns expected but not found: \['E'\]rz   rm   r   r   r   r   r&   r&   r'   %test_usecols_pass_non_existent_column  s
   "z1TestReaders.test_usecols_pass_non_existent_columnc                 C  sN   d}t jt|d tjd| ddgd W d    d S 1 s w   Y  d S )Nz['usecols' must either be list-like of all strings, all unicode, all integers or a callable.rz   rm   E1r   r   r   r   r&   r&   r'   test_usecols_wrong_type  s
   "z#TestReaders.test_usecols_wrong_typec                 C  s8   t jd| dd}tddggddgd}t|| d S )	Ntest2r|   r}   aaaabbbbbTestTest1r   rZ   rY   r   r   r   )r^   r    parsedrF   r&   r&   r'   test_excel_stop_iterator  s   z$TestReaders.test_excel_stop_iteratorc                 C  sd   t || |dkr|dkr|tjjdd tjd| dd}ttj	ggdgd	}t
|| d S )
Nr   r   z+Calamine can't extract error from ods filesrM   test3r|   r   r   r   )rR   rO   r)   rP   rQ   rZ   rY   r   npnanr   r   )r^   r5   r%   r    r   rF   r&   r&   r'   test_excel_cell_error_na  s   
z$TestReaders.test_excel_cell_error_nac           	      C  s   t || |}t||| tjd| ddd}tjd| ddgdd}t|| t|| tjd| dddd}t||jd d	  d S )
Nrm   r|   r   r   r   ro   r}   r   r>   r}   r>   
skipfooter)rR   rL   rZ   rY   r   r   iloc)	r^   r5   r%   r    rB   rF   r   r   r   r&   r&   r'   test_excel_table  s   
zTestReaders.test_excel_tablec                 C  sV  t || t||}tg dg dg dg dg dttdddtddd	td
ddtdddtdddgd| ddd}d}tj|| dd}t	|| |
 }d|j|jd df< tj|| dd}t	|| t|jD ]\}	}
tj|| d|	d}||
}t	|| qt|d t|d< tj|| ddtid}t	|| d S )N)ro   r      r   )g      ?g      @gHzG?gQ?g&.>)TFTTF)ro   r   r   r      )r   r   cdei  
         iq  ro         i  r   M8[]dtype)IntColFloatColBoolColStrColStr2ColDateCol
test_typesr|   r   g      @r   r   r   r}   
converters)rR   rE   r   	from_dictr   r   rZ   rY   r   r   copylocrH   	enumerater   r   applyr!   )r^   r5   r%   r    rK   rF   basenameactualfloat_expectedicolrI   expr&   r&   r'   test_reader_special_dtypes  sJ   









z&TestReaders.test_reader_special_dtypesc              
   C  sz   d}t g ddtjdddgg ddtjd	d
dgd}dd dd dd dd d}tj|| d|d}t|| d S )Ntest_converters)ro   r   r   r   g      )@gL2@g3333333@g:0y5>)Foundr   r   	Not foundr   1345)r   r   r   r   c                 S  s   | dkrt | S dS )N r   )intr   r&   r&   r'   <lambda>
  s    z4TestReaders.test_reader_converters.<locals>.<lambda>c                 S  s   | rd|  S t jS )Nr   )r   r   r  r&   r&   r'   r    s    c                 S  s   | dkrdS dS )Nr  r   r   r&   r  r&   r&   r'   r        c                 S  s   | rt | S dS )Nr  )r!   r  r&   r&   r'   r    r	  )r   r   r   r   r|   r   )r   r   r   r   rZ   rY   r   r   )r^   r    r   rF   r   r   r&   r&   r'   test_reader_converters  s"   
	
z"TestReaders.test_reader_convertersc                 C  s   d}t || }tg dg dg dddtjdgd}t|| t j|| dd	td
d}|d d|d< |d d	|d< t	g dt
d|d< t|| d}tjt|d t j|| ddid W d    d S 1 srw   Y  d S )N	testdtypero   r   r   r         @      @      @      @      ?       @      @r   r   r   r   float64float32)r   r   r   r   r   r   001002003004r   z(Unable to convert column d to type int64rz   r   int64)rZ   rY   r   r   r   r   r   r!   astyper   objectr)   r   r   )r^   r    r   r   rF   r   r&   r&   r'   test_reader_dtype  s*   	"zTestReaders.test_reader_dtypezdtype,expectedr  r  r  r  r  r  r  r  r   r  r  2r  c                 C  s&   d}t j|| |d}t|| d S )Nr  r   rZ   rY   r   r   )r^   r    r   rF   r   r   r&   r&   r'   test_reader_dtype_str4  s   z!TestReaders.test_reader_dtype_strc                   s  |dv rt d| d ttddgddtdd	gd
dtddgddtddgddttjdgddttjdgd
dttjdgddttjdgddttdgd ttjtjgddd
t|}j	|ddd tj
|d|d}W d    n1 sw   Y  |dkrdd lddlm  t fddjD } |d jjjdd |d<  d d g|d!< n}t||}|d d"| d#|d< t|| d S )$Nr   r   No engine for filetype: ''ro   r   Int64r   r  r  Float64TFbooleanr   r   string   g      @z
2019-12-31r   )
r   r   r   r   r   rs   ghijtestr}   rH   r}   dtype_backendpyarrowr   )ArrowExtensionArrayc                   s$   i | ]}| j | d dqS )T)from_pandas)array)r.   colr5  dfpar&   r'   
<dictcomp>t  s    z2TestReaders.test_dtype_backend.<locals>.<dictcomp>r.  us)rK   r/  r   r   )r)   skipr   r   rZ   NA	Timestampr   ensure_cleanto_excelrY   r4  pandas.arraysr5  r   r7  	_pa_arraycast	timestamprE   r  r   )r^   r    r3  r%   	file_pathrt   rF   rK   r&   r9  r'   test_dtype_backendV  sJ   
zTestReaders.test_dtype_backendc                 C  s   |dv rt d| d ttjdgdtjgd}t|}|j|ddd	 tj	|dd
dd}W d    n1 s;w   Y  t
|| d S )Nr$  r%  r&  r  r  r   r   r0  Fr1  numpy_nullabler  )r}   r3  r   )r)   r>  r   r   r   r   rA  rB  rZ   rY   r   )r^   r    r:  rG  rt   r&   r&   r'   test_dtype_backend_and_dtype  s   z(TestReaders.test_dtype_backend_and_dtypezinfer_string takes precedencerM   c              	   C  sH  |dv rt d| d t d}td| ttjddgtjdtjd	tj	gtjdd
}t
|}|j|ddd tj|ddd}W d    n1 sQw   Y  |dkrwtttjddgtjdttjd	tj	gtjdd
}ntt|ddgt|d	d gd
}t
|| W d    d S 1 sw   Y  d S )Nr$  r%  r&  r4  zmode.string_storager   r   r   r   rI  r0  Fr1  rJ  r2  r=   )r)   r>  importorskiprZ   option_contextr   r   r7  object_r?  r   rA  rB  rY   r   r   r   )r^   r    string_storager;  r:  rG  rt   rF   r&   r&   r'   test_dtype_backend_string  s8   
"z%TestReaders.test_dtype_backend_stringzdtypes, exp_valuero   a.1r  c           	      C  st   d}dt i|}| }tj|| |d}ttdgt dt|g|s#t nd dd}||ks2J dt|| d S )Ndf_mangle_dup_col_dtypesr   r   ro   )r   rQ  zdtype dict changed)r  r   rZ   rY   r   r   r   r   )	r^   r    dtypes	exp_valuer   
dtype_dictdtype_dict_copyrt   rF   r&   r&   r'   test_dtype_mangle_dup_cols  s   z&TestReaders.test_dtype_mangle_dup_colsc                 C  s2   d}t || }tdg di}t|| d S )Ntest_spacestestcol)zthis is greatz4    spacesz1 trailing z
 1 leadingz2  spaces  multiple  timesr   )r^   r    r   r   rF   r&   r&   r'   test_reader_spaces  s   zTestReaders.test_reader_spaceszbasename,expectedzgh-35802COLUMNzTest (1)zgh-36122z
got 2nd sar   c                 C  s6   |dkrt d|  t|| }t|| d S )Nr   zSkipped for engine: )r)   r>  rZ   rY   r   r   )r^   r%   r    r   rF   r   r&   r&   r'   test_read_excel_ods_nested_xml  s   	z*TestReaders.test_read_excel_ods_nested_xmlc                 C  sF   d}t j|| d d}g d}t||  |t| ks!J d S )Ntest_multisheetr   )CharlieAlphaBeta)rZ   rY   r   assert_contains_allkeyslistr^   r    r   dfsexpected_keysr&   r&   r'   test_reading_all_sheets  s
   z#TestReaders.test_reading_all_sheetsc                 C  sV   d}g d}t j|| |d}tt|}t||  t|t| ks)J d S )Nr]  )r   r^  r^  r   )rZ   rY   rc  setr   ra  rb  r   )r^   r    r   rf  re  r&   r&   r'   %test_reading_multiple_specific_sheets  s   z1TestReaders.test_reading_multiple_specific_sheetsc                 C  s2   d}t j|| d d}g d}t||  d S )Nblank_with_headerr   )r|   r   r   )rZ   rY   r   ra  rb  rd  r&   r&   r'   "test_reading_all_sheets_with_blank  s   z.TestReaders.test_reading_all_sheets_with_blankc                 C  s$   t jd| dd}t|t  d S )Nblankr|   r   )rZ   rY   r   r   r   )r^   r    r   r&   r&   r'   test_read_excel_blank  s   z!TestReaders.test_read_excel_blankc                 C  s0   t ddgd}tjd| dd}t|| d S )Ncol_1col_2r   rj  r|   r   )r   rZ   rY   r   r   )r^   r    rF   r   r&   r&   r'   !test_read_excel_blank_with_header  s   z-TestReaders.test_read_excel_blank_with_headerc                 C  s   t jtdd tjd| dgd d W d    n1 sw   Y  t jtdd tjd| dd d d	 W d    d S 1 sAw   Y  d S )
Nz \(sheet: Sheet1\)$rz   rj  ro   )headerr}   rm   c                 S  s   dd S )Nro   r   r&   r  r&   r&   r'   r  #      zHTestReaders.test_exception_message_includes_sheet_name.<locals>.<lambda>)r   r}   )r)   r   r   rZ   rY   ZeroDivisionErrorr^   r    r&   r&   r'   *test_exception_message_includes_sheet_name  s   "z6TestReaders.test_exception_message_includes_sheet_namez-ignore:Cell A4 is marked:UserWarning:openpyxlc                 C  s   t || ttddgtddgddggddgd	}|d
kr*|tjjdd |d u r<|dv r<|tjjdd td| }t	
|| d S )Nz
2016-03-12zMarc Johnsonz
2016-03-16z
Jack Blackg@xDzTimothy BrownDateColWithBigInt	StringColr   r   zMaybe not supported by openpyxlrM   )r   r   z)Defaults to openpyxl, maybe not supportedtestdateoverflow)rR   r   rZ   r@  rO   r)   rP   rQ   rY   r   r   )r^   r5   r%   r    rF   rt   r&   r&   r'   test_date_conversion_overflow%  s$   
	z)TestReaders.test_date_conversion_overflowc           
      C  sf   t || d}d}|}t||| tj|| |dd}tj|| d|d}	t|| t|	| d S Nrm   r|   r   r   )r>   r}   r   )
r^   r5   r    r%   rB   filenamer}   rF   r   r   r&   r&   r'   test_sheet_nameA  s   

zTestReaders.test_sheet_namec                 C  sd   d| }t j|ddd}t|d}t j|ddd}t|| W d    d S 1 s+w   Y  d S )Nrm   r|   r   r   rn   )rZ   rY   rq   r   r   )r^   r    pthrF   rs   r   r&   r&   r'   test_excel_read_bufferR  s   "z"TestReaders.test_excel_read_bufferc                 C  sF   d}t jtdd tjd|d W d    d S 1 sw   Y  d S )Nrv   zUnknown engine: foorz   r  rW   r   )r^   
bad_enginer&   r&   r'   test_bad_engine_raisesY  s   "z"TestReaders.test_bad_engine_raisesr}   r   r   r   r|   c                 C  sJ   d}t jt|d tjd| |d W d    d S 1 sw   Y  d S Nz?Worksheet index 3 is invalid|Worksheet named 'Sheet4' not foundrz   rl  r   r   )r^   r    r}   r   r&   r&   r'   test_bad_sheetname_raises^  s   "z%TestReaders.test_bad_sheetname_raisesc                 C  sV   d| }d g d}tjt|d t| W d    d S 1 s$w   Y  d S )Nrv   |)z(No such file or directoryu   没有那个文件或目录zFile o directory non esistente)rz   )joinr)   r   FileNotFoundErrorrZ   rY   )r^   r    bad_filer{   r&   r&   r'   test_missing_file_raisesh  s   
"z$TestReaders.test_missing_file_raisesc                 C  s   d}|d u rt }d}n"|dkrddlm} |}d}n|dkr)ddlm} |}d	}nt}d
}tj||d t	t
| W d    d S 1 sGw   Y  d S )Ns   foozLExcel file format cannot be determined, you must specify an engine manually.r   r   )	XLRDErrorzFUnsupported format, or corrupt file: Expected BOF record; found b'foo'r   CalamineErrorzCannot detect file formatzFile is not a zip filerz   )r   r   r  r   r  r	   r)   r   rZ   rY   r   )r^   r%   
bad_streamerrorr   r  r  r&   r&   r'   test_corrupt_bytes_raisesu  s&   "z%TestReaders.test_corrupt_bytes_raisesc                 C  sh   t d| d}|j| d W d    n1 sw   Y  t|j}td| }t|| d S )Nrm   rn   )content)rq   serve_contentreadrZ   rY   urlr   r   )r^   
httpserverr    rs   	url_tablelocal_tabler&   r&   r'   test_read_from_http_url  s   z#TestReaders.test_read_from_http_urlc                 C  s~   t d| d}|jd| |d W d    n1 sw   Y  d|j d| }tj||d}td| }t|| d S )Nrm   rn   KeyBodys3:///test1)storage_options)rq   
put_objectrI   rZ   rY   r   r   )r^   r    s3_public_buckets3sors   r  r  r  r&   r&   r'   test_read_from_s3_url  s   z!TestReaders.test_read_from_s3_urlc           	      C  s   t d| d}|jd| |d W d    n1 sw   Y  dd l}|jdi |}| d|j d| }t|}W d    n1 sHw   Y  td| }t|| d S )Nrm   rn   r  r   r  r  r&   )	rq   r  s3fsS3FileSystemrI   rZ   rY   r   r   )	r^   r    r  r  rs   r  s3r  r  r&   r&   r'   test_read_from_s3_object  s   z$TestReaders.test_read_from_s3_objectc                 C  s|   t j|dddd| }t|}z	td| }W n ty5   dt  }t	
d|  Y nw t|| d S )Nr:   r;   rX   rm   zfile://localhost/ zfailing on )ospathr  rZ   rY   r   platformunamestripr)   r>  r   r   )r^   r    r@   
localtabler  r  platform_infor&   r&   r'   test_read_from_file_url  s   
z#TestReaders.test_read_from_file_urlc                 C  sD   d| }t j|ddd}td| }t j|ddd}t|| d S r   )rZ   rY   r   r   r   )r^   r    str_pathrF   path_objr   r&   r&   r'   test_read_from_pathlib_path  s
   z'TestReaders.test_read_from_pathlib_pathzpy.pathc                 C  s\   ddl m} tjd| }tj|ddd}| d| }tj|ddd}t|| d S )Nr   )localrm   r|   r   )	py.pathr  r  r  r  rZ   rY   r   r   )r^   r    	LocalPathr  rF   r  r   r&   r&   r'   test_read_from_py_localpath  s   z'TestReaders.test_read_from_py_localpathc                 C  sZ   t jd| }t|d}tj|ddd}~|  W d    d S 1 s&w   Y  d S )Nrm   rn   r|   r   r   )r  r  r  rq   rZ   rY   r  )r^   r    r  rs   r   r&   r&   r'   test_close_from_py_localpath  s   
"z(TestReaders.test_close_from_py_localpathc                 C  s   t || |dkr|dkr|tjjdd tdtdddtdd	d
dtddddtddddtddddtddddtddddtddd d!td d"dd#td$d%d&d'td(d)d*gi}tj	d+| d,d-}t
|| tj	d.| d,d-}t
|| d S )/Nr   r   z0ODS file contains bad datetime (seconds as text)rM   Timero   r   r   -   8   i r      1   i@ r+     *   i    9   #   i 	   )      i           i'	 r   i`
 5   i 5    %   r   i       6   
times_1900r|   r   
times_1904)rR   rO   r)   rP   rQ   r   r   r   rZ   rY   r   r   )r^   r5   r%   r    rF   r   r&   r&   r'   test_reader_seconds  s6   


zTestReaders.test_reader_secondsc           	   	   C  sJ  t || t||}tddgddgg}d| }tddtdd	gd
dtddgddtddgddtdd	gg|d}||d
  d| d||d
 < tj|dddgdd}t	
|| ||_g d|_tj|dddgd}t	
|| ||_tj|dddgddgd}t	
|| g d|_|dd g|_tj|d!ddgd}t	
|| ttd|_|d"d#g|_tj|d$ddgdd}t	
|| |jdd
gdd%d"d#g|_tj|d&dddgd}t	
|| |d"d#g|_|dd g|_tj|d'ddgddgd}t	
|| tj|d(ddgddgd
d)}t	
|| d S )*Nrv   barr   r   testmultiindexro   r  
2015-01-01Tr   r  
2015-01-02Fr   r  
2015-01-03r   r  
2015-01-04r   r   r   	mi_columnr   )r}   rq  r>   r  mi_indexr   bothr}   r>   rq  ilvl1ilvl2mi_index_namec1c2mi_column_name)levelname_with_int	both_nameboth_name_skiprows)r}   r>   rq  r   )rR   rE   r   from_productr   rZ   r@  r  rY   r   r   rH   r   	set_namesrc  r   
set_levels)	r^   r5   r%   r    rK   mimi_filerF   r   r&   r&   r'   test_read_excel_multiindex
  sn   

"	

z&TestReaders.test_read_excel_multiindexzsheet_name,idx_lvl2both_name_blank_after_mi_namer   r   both_name_multiple_blanksr   c              	   C  s   t || d| }tjddgddggddgd}t||}td	d
tddgddtddgddtddgddtddgg|tjg d|fddgdd}	|	|d  d| d|	|d < tj	||dd	gdd	gd}
t
|
|	 d S )Nr  rv   r  r   r   r  r  r   ro   r  r  Tr   r  r  Fr   r  r  r   r  r  )rv   rv   r  r  r  r  r   r   r   r   r  )rR   r   r  rE   r   rZ   r@  from_arraysr  rY   r   r   )r^   r5   r%   r    r}   idx_lvl2r  r  rK   rF   rt   r&   r&   r'   +test_read_excel_multiindex_blank_after_name^  s0   


"z7TestReaders.test_read_excel_multiindex_blank_after_namec                 C  sP   d| }t j|dddgd}tddg}tg dgd	 |d
}t|| d S )Nr  index_col_noner   ro   r}   rq  r   r   keyvalr  r   r   )rZ   rY   r   r  r   r   r   )r^   r    r  rt   exp_columnsrF   r&   r&   r'   &test_read_excel_multiindex_header_only  s
   z2TestReaders.test_read_excel_multiindex_header_onlyc           	      C  s  d| }t jt jt jt jt jt jgg dg dg dg dg dgtd}g d}tg d	g d
gg dg dgd d gd}tg d	d d}t|||d}tj|ddd}t	
|| ||_tj|dddgd}t	
|| t g dg dg dg dg dg}g d}tg dg dgg dg dgd d gd}tg dd d}t|||d}tj|ddd}t	
|| ||_tj|dddgd}t	
|| d S )Ntest_index_name_pre17)R0C0R0C1R0C2R0C3R0C4)R1C0R1C1R1C2R1C3R1C4)R2C0R2C1R2C2R2C3R2C4)R3C0R3C1R3C2R3C3R3C4)R4C0R4C1R4C2R4C3R4C4r   )C_l0_g0C_l0_g1C_l0_g2C_l0_g3C_l0_g4)R0R_l0_g0R_l0_g1R_l0_g2R_l0_g3R_l0_g4)R1R_l1_g0R_l1_g1R_l1_g2R_l1_g3R_l1_g4)r   ro   r   r   r   r   r   r   rH   r   single_namesr   r   multi_namesro   )r  r  r  r  r  )r  r  r  r  r   )r   ro   r   r   r   single_no_namesmulti_no_names)r   r7  r   r  r   r   r   rZ   rY   r   r   rH   )	r^   r    r{  r;   r   r  sirF   r   r&   r&   r'   test_excel_old_index_format  sf   	z'TestReaders.test_excel_old_index_formatc              	   C  sR   d}dD ]"}t jt|d tjd| |d W d    n1 s!w   Y  qd S )Nz#Passing a bool to header is invalid)TFrz   rm   rq  r   )r^   r    r   argr&   r&   r'   test_read_excel_bool_header_arg  s   z+TestReaders.test_read_excel_bool_header_argc              	   C  st  t || t||}tjd| dddgd}tddtdd	gdd
tddgddtddgddtdd	ggg dd}|d d| d|d< t|| tjd| dt	
ddgd}t|| tjd| ddd d}t|| tjd| ddg dd}tdd
tddgddtddgddtdd	ggg dd}|d d| d|d< t|| d S )Ntestskiprowsskiprows_listr   r   r}   r   ro   r  r  Tr  r  Fr   r  r  r   r  r  r  r   r   r   r   c                 S     | dv S N)r   r   r&   r  r&   r&   r'   r    rr  z6TestReaders.test_read_excel_skiprows.<locals>.<lambda>)r}   r   r   )rR   rE   rZ   rY   r   r@  r  r   r   r   r7  r^   r5   r%   r    rK   r   rF   r&   r&   r'   test_read_excel_skiprows  sT   

		z$TestReaders.test_read_excel_skiprowsc                 C  s   t || t||}tjd| ddd d}tddtdd	gd
dtddggg dd}|d d| d|d< t|| d S )Nr+  r,  c                 S  s   | dvS )N)ro   r   r   r&   r  r&   r&   r'   r    rr  zFTestReaders.test_read_excel_skiprows_callable_not_in.<locals>.<lambda>r-  ro   r  r  Tr   r  r  Fr  r   r   r   r   )	rR   rE   rZ   rY   r   r@  r  r   r   r0  r&   r&   r'   (test_read_excel_skiprows_callable_not_in  s   

	z4TestReaders.test_read_excel_skiprows_callable_not_inc                 C  s@   d}t jd| |d}t d| }|d | }t|| d S )Nr   rm   nrowsr"  )r^   r    num_rows_to_pullr   rF   r&   r&   r'   test_read_excel_nrows-  s
   z!TestReaders.test_read_excel_nrowsc                 C  s@   t d| }t|}|d }t jd| |d}t|| d S )Nrm   r   r3  )rZ   rY   r   r   r   )r^   r    rF   num_records_in_filer5  r   r&   r&   r'   0test_read_excel_nrows_greater_than_nrows_in_file5  s
   z<TestReaders.test_read_excel_nrows_greater_than_nrows_in_filec                 C  sJ   d}t jt|d tjd| dd W d    d S 1 sw   Y  d S )Nz'nrows' must be an integer >=0rz   rm   r  r3  r   r   r&   r&   r'   +test_read_excel_nrows_non_integer_parameter=  s   "z7TestReaders.test_read_excel_nrows_non_integer_parameterz-filename,sheet_name,header,index_col,skiprowsr  r  r  r  r  r+  r,  c                 C  r.  r/  r&   r  r&   r&   r'   r  K  rr  zTestReaders.<lambda>c           	      C  sL   t j|| ||||djdd }t j|| ||||dd}t|| dS )z
        For various parameters, we should get the same result whether we
        limit the rows during load (nrows=3) or after (df.iloc[:3]).
        )r}   rq  r>   r   Nr   )r}   rq  r>   r   r4  )rZ   rY   r   r   r   )	r^   r    r{  r}   rq  r>   r   rF   r   r&   r&   r'   test_read_excel_nrows_paramsC  s$   z(TestReaders.test_read_excel_nrows_paramsc                 C  sF   t jtdd td| dd W d    d S 1 sw   Y  d S )Nzbut 3 positional argumentsrz   rm   r|   r   r   rt  r&   r&   r'   test_deprecated_kwargsg  s   "z"TestReaders.test_deprecated_kwargsc                 C  sV   d| }g d}t jg ddd}t||dd}tj|dd	d
gd d}t|| d S )Nr  ))r   r   r  r   r   r<  ))r   r   r  ro   r   r=  )r   ro   r  )r   r   r!  r  r   ro   r  )r   from_tuplesr   rZ   rY   r   r   )r^   r    	file_namer;   idxrF   rt   r&   r&   r'   "test_no_header_with_list_index_colk  s   z.TestReaders.test_no_header_with_list_index_colc                 C  s>   d| }dt jddg}t|dgd}t|}t|| d S )None_col_blank_lineg      ?ro   r   numbersr   )r   r   r   rZ   rY   r   r   )r^   r    r?  r;   rF   rt   r&   r&   r'   test_one_col_noskip_blank_linex  s
   
z*TestReaders.test_one_col_noskip_blank_linec                 C  sj   d| }t ddg}tjtjgtjtjgddgddgg}t||d}tj|d	d
dgd}t|| d S )Nr  )r   r   )r   r   ro   r   r   r   r   mi_column_empty_rowsr   r  )	r   r>  r   r   r   rZ   rY   r   r   )r^   r    r?  r   r;   rF   rt   r&   r&   r'    test_multiheader_two_blank_lines  s   $
z,TestReaders.test_multiheader_two_blank_linesc                 C  s$   d| }t |}|jdksJ dS )z
        Sheets can contain blank cells with no data. Some of our readers
        were including those cells, creating many empty rows and columns
        trailing_blanks)r   r   N)rZ   rY   shape)r^   r    r?  rt   r&   r&   r'   test_trailing_blanks  s   
z TestReaders.test_trailing_blanksc                 C  t   |dkr	t d |dkr|t jjdd t jtdd tjd| d	d
 W d    d S 1 s3w   Y  d S )Nr   *chartsheets do not exist in the ODF formatr   4pyxlsb can't distinguish chartsheets from worksheetsrM   z"Worksheet named 'Chart1' not foundrz   
chartsheetChart1r   	r)   r>  rO   rP   rQ   r   r   rZ   rY   r^   r5   r%   r    r&   r&   r'   test_ignore_chartsheets_by_str  s   
"z*TestReaders.test_ignore_chartsheets_by_strc                 C  rJ  )Nr   rK  r   rL  rM   z0Worksheet index 1 is invalid, 1 worksheets foundrz   rM  ro   r   rO  rP  r&   r&   r'   test_ignore_chartsheets_by_int  s   
"z*TestReaders.test_ignore_chartsheets_by_intc                 C  sF   t jd| ddd}tg dg dg dgg dd	}t|| d S )
Ntest_decimal,ro   )decimalr   )ro   gAc̝ė@g	hAABCpoig2[j@)r   gHzG^@g{G@DEFuytgUq&?)r   g%Cq@g^@GHIrezg)@)IdNumber1Number2Text1Text2Number3r   r   r   r&   r&   r'   test_euro_decimal_format  s   z$TestReaders.test_euro_decimal_format)\__name__
__module____qualname__r)   fixturera   ru   r   r   r   r   rP   parametrizer   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r
  r   r   r   r   r!   r   r  r#  rH  rK  rQ   r
   rP  rW  rZ  r\  rg  ri  rk  rm  rp  ru  filterwarningsry  r|  r~  r  r  r  r  network
single_cpur  tdskip_if_not_us_localer  r  slowr  r  
skip_if_nor  r  r  r  r  r  r'  r*  r1  r2  r6  r8  r9  r:  r;  rA  rD  rF  rI  rQ  rR  rb  r&   r&   r&   r'   rS      s   

3(

	

	2
0
$









	$T
!I6
	rS   c                
   @  s   e Zd Zdd Zejdddd Zdd Zd	d
 Zej	
dg ddd Zdd Zdd Zej	
ddddgddgdddgddggdd Zdd Zdd Zdd Zd d! Zd"d# Zd$d% Zej	
d&d'd(gd)d* Zd+d, Zd-d. Zd/d0 Zd1d2 Zd3S )4TestExcelFileReadc              	   C  s   d}t jt|dd1 td| d}tj| |d W d    n1 s&w   Y  W d    d S W d    d S 1 s>w   Y  d S )NzPassing bytes to 'read_excel' is deprecated and will be removed in a future version. To read from a byte string, wrap it in a `BytesIO` object.F)r{   raise_on_extra_warningsrm   rn   rW   )r   assert_produces_warningFutureWarningrq   rZ   rY   r  )r^   r%   r    r   rs   r&   r&   r'   test_deprecate_bytes_input  s   "z,TestExcelFileRead.test_deprecate_bytes_inputTrT   c                 C  rV   )zH
        Change directory and set engine for ExcelFile objects.
        rW   r:   r;   rX   rp   N)r   rZ   rp   r[   r\   r]   r&   r&   r'   ra     rb   z#TestExcelFileRead.cd_and_set_enginec                 C  sr   dddddd}t d| }|j}W d    n1 sw   Y  |d ur)|}n||dd   }||ks7J d S )Nr   r   r   r   rg   rm   ro   )rZ   rp   r%   )r^   r    r%   rr   rX   rt   rF   r&   r&   r'   ru     s   z"TestExcelFileRead.test_engine_usedc                 C  s  t d| }t j|dddgd}W d    n1 sw   Y  tdgdgdgtjgdggd	gd
}t|| t d| }t j|dddgd}W d    n1 sUw   Y  ttjgdgtjgtjgdggd	gd
}t|| t d| }t j|dddgd}W d    n1 sw   Y  tdgdgdgtjgdggd	gd
}t|| t d| }t j|dddgd}W d    n1 sw   Y  ttjgdgtjgtjgdggd	gd
}t|| d S )Ntest4r|   Fappler}   keep_default_na	na_valuesr?  ro   rabbitr   r   Ttest51.#QNANr   )rZ   rp   rY   r   r   r   r   r   )r^   r    rX   r   rF   r&   r&   r'   test_excel_passes_na  sH   

 

 z&TestExcelFileRead.test_excel_passes_na	na_filter)NTFc                 C  s   i }|d ur
||d< t d| }t j|fdddgd|}W d    n1 s*w   Y  |du r@dgd	gd
gdgdgg}ntjgd	gtjgtjgdgg}t|dgd}t|| d S )Nr}  rz  r|   Tru  rv  Fr{  ro   r   ry  r   r   )rZ   rp   rY   r   r   r   r   r   )r^   r    r}  rd   rX   r   rF   r&   r&   r'   test_excel_passes_na_filter  s&   	z-TestExcelFileRead.test_excel_passes_na_filterc           
      C  s  t || |}t||| td| }tj|ddd}tj|ddgdd}W d    n1 s1w   Y  t|| t|| td| }|jddd}|jddgdd}W d    n1 sdw   Y  t|| t|| td| }tj|dddd}	W d    n1 sw   Y  t|	|jd d	  td| }|jdddd
}	W d    n1 sw   Y  t|	|jd d	  d S )Nrm   r   r   ro   r   )r>   )r   r>   r   r   )r>   r   )	rR   rL   rZ   rp   rY   r   r   rf   r   )
r^   r5   r%   r    rB   rF   rX   r   r   r   r&   r&   r'   test_excel_table_sheet_by_index'  s.   
z1TestExcelFileRead.test_excel_table_sheet_by_indexc                 C  s   t || |}t||| d}d}t|| }|j|dd}	W d    n1 s*w   Y  t|| }|jd|d}
W d    n1 sHw   Y  t|	| t|
| d S rz  )rR   rL   rZ   rp   rf   r   r   )r^   r5   r%   r    rB   rF   r{  r}   rX   	df1_parse	df2_parser&   r&   r'   r|  B  s   
z!TestExcelFileRead.test_sheet_namer}   r   r   r   r|   c              	   C  s   d}t jt|d. td| }|j|d W d    n1 s"w   Y  W d    d S W d    d S 1 s:w   Y  d S r  )r)   r   r   rZ   rp   rf   )r^   r    r}   r   rX   r&   r&   r'   r  T  s   "z+TestExcelFileRead.test_bad_sheetname_raisesc              	   C  s   d| }t j|dd|d}t|d%}t |}t j|ddd}W d    n1 s+w   Y  W d    n1 s:w   Y  t|| d S )Nrm   r|   r   r}   r>   r%   rn   r   )rZ   rY   rq   rp   r   r   )r^   r%   r    r}  rF   rs   rk   r   r&   r&   r'   r~  _  s   z(TestExcelFileRead.test_excel_read_bufferc              	   C  sx   t d| d&}t|}tj|dd|d W d    n1 s!w   Y  W d    n1 s0w   Y  |js:J d S )Nrm   rn   r|   r   r  )rq   rZ   rp   rY   closed)r^   r%   r    rs   rh   r&   r&   r'   test_reader_closes_filei  s   z)TestExcelFileRead.test_reader_closes_filec              	   C  s   d}t d| /}tjt|d t j|dd W d    n1 s#w   Y  W d    d S W d    d S 1 s;w   Y  d S )Nz8Engine should not be specified when passing an ExcelFilerm   rz   rv   rW   )rZ   rp   r)   r   r   rY   )r^   r    r   xlr&   r&   r'   test_conflicting_excel_enginesq  s   "z0TestExcelFileRead.test_conflicting_excel_enginesc                 C  sj   t jd| |d}td| d}| }W d    n1 sw   Y  t jt||d}t|| d S )Nrm   rW   rn   )rZ   rY   rq   r  r   r   r   )r^   r%   r    rF   rs   r;   r   r&   r&   r'   test_excel_read_binaryy  s   
z(TestExcelFileRead.test_excel_read_binaryc                 C  s^   t d| d}tj||d}W d    n1 sw   Y  tjd| |d}t|| d S )Nrm   rn   rW   )rq   rZ   rY   r   r   )r^   r    r%   rs   rt   rF   r&   r&   r'   %test_excel_read_binary_via_read_excel  s
   z7TestExcelFileRead.test_excel_read_binary_via_read_excelc              	   C  s   t dd1}tjtdd tj|ddgd W d    n1 s!w   Y  W d    d S W d    d S 1 s9w   Y  d S )Nzdf_header_oob.xlsxrn   zexceeds maximumrz   r   ro   r(  )rq   r)   r   r   rZ   rY   )r^   r%   rs   r&   r&   r'   )test_read_excel_header_index_out_of_range  s   "z;TestExcelFileRead.test_read_excel_header_index_out_of_ranger{  zdf_empty.xlsxzdf_equals.xlsxc                 C  s`   t dgdd}tjddgddgd}td	d
gg||dd}tj|dddd	gd}t|| d S )NZI2r   r  )r   zB.1I11I12r  ro   r   r  )rH   r   r   r|   r   r  )r   r   r>  r   rZ   rY   r   r   )r^   r{  r@  colsrF   rt   r&   r&   r'   test_header_with_index_col  s   z,TestExcelFileRead.test_header_with_index_colc                 C  s   t || d| }t|}tj|ddgd|d}W d    n1 s$w   Y  t||}tjddgd| dd	}tj|d d |dd  g|d  |d  gd
}	t	g g |	d}
t
|
| d S )Ntest_datetime_mir   ro   )rq  r>   r%   z
2020-02-29z
2020-03-01r   r   r   r  r!  )rR   rZ   rp   rY   rE   DatetimeIndexr   r  to_pydatetimer   r   r   )r^   r5   r%   r    rs   rX   r   rK   dtiexpected_column_indexrF   r&   r&   r'   test_read_datetime_multiindex  s   



z/TestExcelFileRead.test_read_datetime_multiindexc              	   C  sx   t jtdd+ td| dd W d    n1 sw   Y  W d    d S W d    d S 1 s5w   Y  d S )NzValue must be one of *rz   zio.excelz.readerabc)r)   r   r   rZ   rM  rt  r&   r&   r'   test_engine_invalid_option  s   "z,TestExcelFileRead.test_engine_invalid_optionc                 C  sr   |dkr	t d |dkr|t jjdd td| }|jdgks'J W d    d S 1 s2w   Y  d S )Nr   rK  r   rL  rM   rM  r|   )r)   r>  rO   rP   rQ   rZ   rp   sheet_names)r^   r5   r%   r    rX   r&   r&   r'   test_ignore_chartsheets  s   
"z)TestExcelFileRead.test_ignore_chartsheetsc              
   C  s   t f}|d u rtd|  n|dkrdd l}t |jjf}n|dkr,ddlm} |f}t	d| B}t
|jddd td	 z	tj||d
 W n	 |yV   Y nw W d    n1 saw   Y  W d    d S W d    d S 1 syw   Y  d S )NzInvalid test for engine=r   r   r   r  corruptzutf-8)encodingFrW   )r	   r)   r>  r   biffhr  r   r  r   rA  r   
write_textrq  rZ   rp   )r^   r%   r    errorsr   r  filer&   r&   r'   test_corrupt_files_closed  s,   "z+TestExcelFileRead.test_corrupt_files_closedN)rc  rd  re  rs  r)   rf  ra   ru   r|  rP   rg  r~  r  r|  r  r~  r  r  r  r  r  r  r  r  r  r  r&   r&   r&   r'   ro    s6    

&





ro  )r    r!   r"   r#   )r    r!   r%   rC   r"   r!   )rF   r   r    r!   r%   r!   r"   rG   )=
__future__r   r   r   	functoolsr   r:   r   r  pathlibr   r  r   urllib.errorr   zipfiler	   numpyr   r)   pandas._configr
   pandas.compatr   pandas.util._test_decoratorsutil_test_decoratorsrk  pandasrZ   r   r   r   r   r   pandas._testing_testingr   pandas.core.arraysr   r   rP   rj  
pytestmarkr-   r*   rn  engine_paramsr(   r,   rf  r!   r6   r%   r    rB   rE   rL   rR   rS   ro  r&   r&   r&   r'   <module>   s    


	



	
	          )