a
    GGbp                     @   s  d Z ddlmZ ddlmZ ddlZddlZddlmZ ddl	m
Z
mZ ddlmZ ejdZejdeed	d	gd
d Zdd Zdd Zejddddgie
g dg dgg ddfdddgde
g dgg ddfddddgde
dd ggd!d"gdfgd#d$ Zd%d& Zejd'd(g d)g d*gfd+g d,g d-gfd.g d/g d0gfgd1d2 Zejd3g d4d5d6 Zd7d8 Zejd9i e
d:dd;gifdd<gd=e
d<dd;gifgd>d? Zd@dA ZdBdC ZdDdE Z dS )Fzj
Tests that skipped rows are properly handled during
parsing for all of the parsers defined in parsers.py
    )datetime)StringION)EmptyDataError)	DataFrameIndexZpyarrow_skipskiprows   c                 C   sz   | }d}|j t||d ddd}ttdddtdddtdddgdd	}ttd
ddg d|d}t	|| d S )Nzr#foo,a,b,c
#foo,a,b,c
#foo,a,b,c
#foo,a,b,c
#foo,a,b,c
#foo,a,b,c
1/1/2000,1.,2.,3.
1/2/2000,4,5,6
1/3/2000,7,8,9
r   Tr   headerZ	index_colZparse_dates           name      ?      $@r   r   r   r   r   columnsindex
read_csvr   r   r   r   npZarangeZreshapetmassert_frame_equal)all_parsersr   parsertextresultr   expected r"   Clib/python3.9/site-packages/pandas/tests/io/parser/test_skiprows.pytest_skip_rows_bug   s    
"r$   c                 C   sl   | }dd dd tdD  }dd dd dD  }|jt|dd	gd
}|t|}t|| d S )Nza,b,c

c              	   S   s0   g | ](}d  t|t|d t|d gqS ,r   r   joinstr.0ir"   r"   r#   
<listcomp>7       z'test_deep_skip_rows.<locals>.<listcomp>
   c              	   S   s0   g | ](}d  t|t|d t|d gqS r&   r(   r+   r"   r"   r#   r.   :   r/   )r   r   r   r      r      	   r   r2   r   )r)   ranger   r   r   r   )r   r   dataZcondensed_datar    Zcondensed_resultr"   r"   r#   test_deep_skip_rows3   s    r7   c                 C   sz   | }d}|j t|dd ddd}ttdddtdddtddd	gdd
}ttdddg d|d}t	|| d S )Nz^#foo,a,b,c
#foo,a,b,c

#foo,a,b,c
#foo,a,b,c

1/1/2000,1.,2.,3.
1/2/2000,4,5,6
1/3/2000,7,8,9
r   r   Tr	   r   r   r   r   r   r   r   r   r   r   r   )r   r   r   r6   r   r!   r"   r"   r#   test_skip_rows_blankB   s    
"r8   zdata,kwargs,expectedzKid,text,num_lines
1,"line 11
line 12",2
2,"line 21
line 22",2
3,"line 31",1r   )r   zline 21
line 22r   )r   zline 31r   idr   Z	num_linesr   z+a,b,c
~a
 b~,~e
 d~,~f
 f~
1,2,~12
 13
 14~~r   )Z	quotecharr   )za
 bze
 dzf
 f)abczdText,url
~example
 sentence
 one~,url1
~example
 sentence
 two~,url2
~example
 sentence
 three~,url3r   zexample
 sentence
 twoZurl2TextZurlc                 C   s*   | }|j t|fi |}t|| d S )Nr   r   r   r   )r   r6   kwargsr!   r   r    r"   r"   r#   test_skip_row_with_newline\   s    #rC   c                 C   sL   | }d}g dg dg}t |g dd}|jt|dgd}t|| d S )NzYid,text,num_lines
1,"line '11' line 12",2
2,"line '21' line 22",2
3,"line '31' line 32",1)r   zline '21' line 22r   )r   zline '31' line 32r   r9   r;   r   r4   r   r   r   r   r   )r   r   r6   exp_datar!   r    r"   r"   r#   test_skip_row_with_quote   s    rF   zdata,exp_dataz\id,text,num_lines
1,"line 
'11' line 12",2
2,"line 
'21' line 22",2
3,"line 
'31' line 32",1)r   zline 
'21' line 22r   )r   zline 
'31' line 32r   z\id,text,num_lines
1,"line '11
' line 12",2
2,"line '21
' line 22",2
3,"line '31
' line 32",1)r   zline '21
' line 22r   )r   zline '31
' line 32r   zbid,text,num_lines
1,"line '11
' 	line 12",2
2,"line '21
' 	line 22",2
3,"line '31
' 	line 32",1)r   zline '21
' 	line 22r   )r   zline '31
' 	line 32r   c                 C   s8   | }|j t|dgd}t|g dd}t|| d S )Nr   r4   r9   r;   r   r   r   r   r   )r   r6   rE   r   r    r!   r"   r"   r#   $test_skip_row_with_newline_and_quote   s    rH   line_terminator)r%   z
c                 C   s   | }d g d}tg dg dg dgg dd}|jdkr`|d	kr`tjjd
d}|j| |d|}|j	t
|ddg dd}t|| d S )Nr%   )zSMOSMANIA ThetaProbe-ML2X z2007/01/01 01:00   0.2140 U M z2007/01/01 02:00   0.2141 M O z2007/01/01 04:00   0.2142 D M )
2007/01/01z01:00g1Zd?UM)rK   z02:00gk	g?rM   O)rK   z04:00gBfj?DrM   )datetimevarflagZoflagr;   ZpythonrJ   z+'CR' not respect with the Python parser yet)reasonr   T)r   Zdelim_whitespacenames)r)   r   ZenginepytestmarkZxfailZnodeZ
add_markerreplacer   r   r   r   )r   rI   Zrequestr   r6   r!   rW   r    r"   r"   r#   test_skiprows_lineterminator   s,    	rY   c                 C   s8   | }d}t ddgi}|jt|dd}t|| d S )Nz	a"
b"
a
1r=   r   r   r4   rD   )r   r   r6   r!   r    r"   r"   r#   test_skiprows_infield_quote   s
    rZ   zkwargs,expected1   Zfoo)r
   rU   c                 C   s6   | }d}|j t|fddd i|}t|| d S )Na
1
2
3
4
5r   c                 S   s   | d dkS )Nr   r   r"   xr"   r"   r#   <lambda>   r/   z)test_skip_rows_callable.<locals>.<lambda>rA   )r   rB   r!   r   r6   r    r"   r"   r#   test_skip_rows_callable   s    ra   c                 C   sT   | }d}d}t jt|d& |jt|dd d W d    n1 sF0    Y  d S )Nr]   zNo columns to parse from filematchc                 S   s   dS )NTr"   r^   r"   r"   r#   r`      r/   z)test_skip_rows_skip_all.<locals>.<lambda>r4   )rV   raisesr   r   r   )r   r   r6   msgr"   r"   r#   test_skip_rows_skip_all   s
    rf   c                 C   sT   d}| }d}t jt|d& |jt|dd d W d    n1 sF0    Y  d S )Nzby zeror]   rb   c                 S   s   dd S )Nr   r   r"   r^   r"   r"   r#   r`     r/   z-test_skip_rows_bad_callable.<locals>.<lambda>r4   )rV   rd   ZeroDivisionErrorr   r   )r   re   r   r6   r"   r"   r#   test_skip_rows_bad_callable   s
    rh   c                 C   sF   d}| }|j t|dg dd}tg dg dd}t|| d S )Nz$a,b
1,a
2,b
3,c
4,d
5,e
6,f
7,g
8,h
r\   )r   r1   r   )Znrowsr   )r   r   r\      r2   )r=   r?   egh)r=   r>   rG   )r   r6   r   r    r!   r"   r"   r#   test_skip_rows_and_n_rows  s
    
rm   )!__doc__r   ior   Znumpyr   rV   Zpandas.errorsr   Zpandasr   r   Zpandas._testingZ_testingr   rW   ZusefixturesZ
pytestmarkZparametrizelistr5   r$   r7   r8   rC   rF   rH   rY   rZ   ra   rf   rh   rm   r"   r"   r"   r#   <module>   s|   

!

	
"

		