U
    sVc                     @   s   d Z ddlmZ ddlmZ ddlZddlZddlZddlm	  m
Z ddlZddlmZmZmZmZmZmZmZmZ ddlmZ ddlmZ ddlmZ ejdd	 Zejd
d ZG dd dZ dS )z5 test with the TimeGrouper / grouping with datetimes     )datetime)StringION)	DataFrameDatetimeIndexIndex
MultiIndexSeries	Timestamp
date_rangeoffsets)Grouper)
BinGrouperc                  C   sh   t ddddddgtdddddtdddddtdd	dd
dtdd	dd	dtjtdddddgd} | S )z
    DataFrame used by groupby_with_truncated_bingrouper, made into
    a separate fixture for easier re-use in
    test_groupby_apply_timegrouper_with_nat_apply_squeeze
                	        r   
            )QuantityDate)r   r	   pdNaT)df r   I/tmp/pip-unpacked-wheel-xj8nt62q/pandas/tests/groupby/test_timegrouper.pyframe_for_truncated_bingrouper   s    r    c                 C   s:   | }t ddd}||}t|jjt|jjks6t|S )a+  
    GroupBy object such that gb.grouper is a BinGrouper and
    len(gb.grouper.result_index) < len(gb.grouper.group_keys_seq)

    Aggregations on this groupby should have

        dti = date_range("2013-09-01", "2013-10-01", freq="5D", name="Date")

    As either the index or an index level.
    r   5Dkeyfreq)r   groupbylengrouperZresult_indexZgroup_keys_seqAssertionError)r    r   tdggbr   r   r   !groupby_with_truncated_bingrouper3   s
    
r+   c                   @   s  e Zd Zdd Zejdddgdd Zdd	 Zejd
ddddgdd Z	dd Z
dd Zdd Zdd Zdd Zdd Zdd Zdd  Zd!d" Zd#d$ Zd%d& Zd'd( Zd)d* Zd+d, Zd-d. Zd/d0 Zd1d2 Zd3d4 Zd5d6 Zd7d8 Zd9d: Ze d;d<d= Z!d>S )?TestGroupByc           
      C   s  t d ddddddgtddddd	tdddddtdd
ddd	tdd
dd
d	tddddd	tddddd	gd}|jdd}||fD ]}|dg}t dd	itddddddd}tjdddgdd|jd	ddgd	f< d}t	j
t|d |d }W 5 Q R X t	|| | }t	j
t|d |tdd }W 5 Q R X t	|| t	j
t|d |tdd }	W 5 Q R X t	|	| qd S ) NzCarl Carl Carl Carl Joe Carlr   r   r   r   r   r   r   r   r   r      r   r   Buyerr   r   r   byr   Z20130901Z20131205r!   left)r$   nameZ	inclusiveindex      int64dtype!The default value of numeric_onlymatchr$   )r   splitr   sort_values	set_indexr
   nparrayiloctmassert_produces_warningFutureWarningresamplesumassert_frame_equal
sort_indexr%   r   )
selfdf_originaldf_reorderedr   expectedmsgresult1	df_sortedresult2Zresult3r   r   r   test_groupby_with_timegrouperK   sJ        $z)TestGroupBy.test_groupby_with_timegroupershould_sortTFc                 C   s   t d d ddddddgtdddd	d
tdddd	dtddddd
tddddd
tddddd
tddddd
gd}|r|jddd}|jddd}|tdd}|jstt	|j
tst|j}t	|tstt|dkstd S )NzA A A A A BzCarl Mark Carl Joe Joe Carlr   r   r      r   r   r   r   r   r   r   r-   r   ZBranchr/   r   r   r   Fr1   Z	ascendingr   ZdropZ6Mr>   )r   r?   r   r@   rA   r%   r   
group_keysr(   
isinstancer'   r   groupsdictr&   )rL   rU   r   gr\   r   r   r   %test_groupby_with_timegrouper_methodsz   s,    
z1TestGroupBy.test_groupby_with_timegrouper_methodsc                 C   sL  t d d ddddddddgtdddd	d
tdddd	dtddddd
tddddd
tddddd
tddddd
tddddd
tddddd
gdd}|jddd}||fD ]0}t d dddgtdddd
d
tdddd
d
tdddd
d
gdddg}d}tjt|d |t	dddg
 }W 5 Q R X t|| t d ddddgtdddd
d
tdddd
d
tdddd
d
tdddd
d
gdddg}tjt|d |t	d ddg
 }W 5 Q R X t|| qt d d ddddddddgtdddd	d
tdddd	dtddddd
tddddd
tddddd
tddddd
tddddd
tddddd
gdd}|jddd}||fD ]}t d! d"ddd#dgtdddd
d
tdddd
d
tdddd
d
tdddd
d
tdddd
d
gdddg}d}tjt|d |t	d$ddg
 }W 5 Q R X t|| tjt|d |t	d%ddg
 }W 5 Q R X t d dddgtdddd
d
tdddd
d
tdddd
d
gdddg}t|| | }tjt|d  |t	d%dd&dg
 }W 5 Q R X t|| tjtd'd  |t	d%d(d&dg
  W 5 Q R X |d}tjt|d  |t	d%dd)dg
 }W 5 Q R X t|| tjt|d  |t	d%d
d)dg
 }W 5 Q R X t|| tjtd*d  |t	d%d(d)dg
  W 5 Q R X | }|jtd |d< tjt|d  |t	d%dd&dg
 }W 5 Q R X t d dddgtdd+d,d
d
tdd+d,d
d
tdd+d,d
d
gdddg}t|| d-}tjt|d" |t	d%ddd.dg
  W 5 Q R X t dggdgttdddd
d
gt dd/d0}tjt|d |t	d%d
 }W 5 Q R X t|| tjt|d |t	d%dg
 }W 5 Q R X t|| |jd|_|jjt ksttjt|d |t	d%dd&
 }W 5 Q R X t|| tjt|d |t	d%dd&g
 }W 5 Q R X t|| qd S )1NzA A A A A A A Bz$Carl Mark Carl Carl Joe Joe Joe Carlr   r   r   rV   r   r   r   r   r   r   r   r-   r   rW   r   r   FrX   zCarl Joe Markr      r.   r/   r;   r<   Ar>   zCarl Mark Carl Joe   Z6MSzCarl Joe Mark Carl Joer7      Z1DZ1Mr$   r#   z#'The grouper name foo is not found'foo)r$   levelzThe level foo is not valid      z2The Grouper cannot specify both a key and a level!)r$   r#   rf   r$   r3   columnsr5   )r   r?   r   rA   r@   rE   rF   rG   r%   r   rI   rJ   reset_indexpytestZraisesKeyError
ValueErrorcopyr5   r   ZMonthEndr   shiftr$   r(   )rL   rM   rR   r   rO   rP   resultZwarn_msgr   r   r    test_timegrouper_with_reg_groups   s<   
"
"""
$$
$$$$
    "z,TestGroupBy.test_timegrouper_with_reg_groupsr$   DMra   zQ-APRc                 C   s  t tddddddddddddgddddddddd	d	d	d	gd
dddddddddddgddddddddddddgdd}|dd  |jdd! ddg	 
d"}d |_|	 t|d#dgd   }t|| |t|d#dgd   }t|| d S )$NZ20121002Z20121007Z20130130Z20130202Z20130305Z20121207r   r   r   i  il  i  i     io  Z   i8  ig  i-  i!  r-      r   r6   '   r   -   "   )dateuser_id
whole_costZcost1r|   r}   r~   )Z	min_countr8   r>   )r   r   to_datetimerA   r%   rH   rI   dropnaZreorder_levelsrK   Zastyper3   r   rE   assert_series_equal)rL   r$   r   rO   rQ   rS   r   r   r   %test_timegrouper_with_reg_groups_freqU  sf    #&
	z1TestGroupBy.test_timegrouper_with_reg_groups_freqc                 C   s(  t d ddddddgtddddd	tdddddtdd
ddd	tdd
dd
d	tddddd	tddddd	gd}|jdd}|jd	ddg |jddg |jdg g}dddg}||fD ]H}|tddd}t||D ]&\}}t|}	|	|	}
t
|
| qq|jdg |jdg |jdg g}dddg}||fD ]X}|dtdddg}t||D ]0\\}}}t|}	|	||	f}
t
|
| q\q8|d}|jdd}|jd	ddg |jddg |jdg g}||fD ]J}|tdd}t||D ](\}}t|}	|	|	}
t
|
| qqd S )NzCarl Joe Joe Carl Joe Carlr   r   r   r   r   r   r   r   r   r   r-   r   r   r.   r   r0   rc   
2013-09-30
2013-10-31
2013-12-31ru   r   rd   )Joer   )ZCarlr   )r   r   r/   r>   )r   r?   r   r@   rD   r%   r   zipr	   	get_grouprE   rJ   rA   )rL   rM   rN   expected_listZdt_listr   groupedtrO   dtrr   Zg_listbr   r   r   test_timegrouper_get_group  s^    









z&TestGroupBy.test_timegrouper_get_groupc                 C   s   t ddgddgd}| }t|d |d< dd }|tdd	|}|td
dd|}t|j	dd|j	dd d S )N
10/10/2000
11/10/2000r   r   r|   valuer|   c                 S   s   t | d  gdS )Nr   )rI   )r   rI   xr   r   r   sumfunc_series  s    zMTestGroupBy.test_timegrouper_apply_return_type_series.<locals>.sumfunc_seriesr#   ru   rd   TrY   )
r   rp   r   r   r%   r   applyrE   rJ   rl   )rL   r   df_dtr   rO   rr   r   r   r   )test_timegrouper_apply_return_type_series  s    
 
z5TestGroupBy.test_timegrouper_apply_return_type_seriesc                 C   s   t ddgddgd}| }t|d |d< dd }|tdd	|}|td
dd|}t|j	dd|j	dd d S )Nr   r   r   r   r   r|   c                 S   s
   | j  S N)r   rI   r   r   r   r   sumfunc_value  s    zKTestGroupBy.test_timegrouper_apply_return_type_value.<locals>.sumfunc_valuer   ru   rd   TrY   )
r   rp   r   r   r%   r   r   rE   r   rl   )rL   r   r   r   rO   rr   r   r   r   (test_timegrouper_apply_return_type_value  s    
 
z4TestGroupBy.test_timegrouper_apply_return_type_valuec                 C   s8  d}t dd|d}tt|t|d|d}|dd }|j}tt| d	 t	s^t
t d
ddd}tdddddgdddddgd|d}|jddj}dddddg}dd |D }	t||	 |jdd}|D ]Z}
||
}|j|
df |j|
d f gg}t|
gdd!d"}t|td#|d$}	t||	 qd S )%Ni  z2012/1/1Z5min)startr$   periods)highlowr4   c                 S   s   t | j| j| jS r   )r   yearmonthdayr   r   r   r   <lambda>      z?TestGroupBy.test_groupby_groups_datetimeindex.<locals>.<lambda>r   z
2015/01/01r   r|   )r   r3   r7   rb   rV   r   r   r   r   rc   ra   Brf   z
2015-01-05z
2015-01-04z
2015-01-03z
2015-01-02z
2015-01-01c                 S   s    i | ]}t |t|gd dqS )r|   r3   )r	   r   ).0r|   r   r   r   
<dictcomp>  s     zATestGroupBy.test_groupby_groups_datetimeindex.<locals>.<dictcomp>ra   r   rt   )r3   r$   ZABrj   )r
   r   rB   aranger%   r\   r[   listkeysr   r(   rE   Zassert_dict_equalr   locr   rJ   )rL   r   indr   r   r\   r5   rr   datesrO   r|   dataZexpected_indexr   r   r   !test_groupby_groups_datetimeindex  s0     &
z-TestGroupBy.test_groupby_groups_datetimeindexc           	      C   sj  ddddddg}t ddddddg|tjdddd	d
gd d}|d dd |d< tddddddgddd}tddgd dd}t||g}t ddd	dd
dgd	d
d
d	d	d
gd|ddgd}|ddg	 }t
|| t|dd}t tjdddd	d
dd	d
dgd|d}tdddgdd}t dddgd
ddgd|ddgd}|jdd	 }t
|| d S ) N2011-07-19 07:00:002011-07-19 08:00:002011-07-19 09:00:00ar   r7   r8   r9   r   r   r   )labelr   value1value2r   c                 S   s   t | ddS )N
US/Pacifictz)r	   )dr   r   r   r   %  r   zBTestGroupBy.test_groupby_groups_datetimeindex_tz.<locals>.<lambda>r   )r   r3   r   r   r   rc   r   r   r   r   r   r5   rk   z
Asia/Tokyor   r4   rb   r   )r   rB   r   r   r   r   r   from_arraysr%   rI   rE   rJ   	rL   r   r   Zexp_idx1Zexp_idx2Zexp_idxrO   rr   Zdidxr   r   r   $test_groupby_groups_datetimeindex_tz  sf    
 z0TestGroupBy.test_groupby_groups_datetimeindex_tzc                 C   sR   t dtdfdtdfgddgd}|d }|d d tdksNtd S )Nr   z
2012-07-03z
2012-07-04r   r|   )rk   )r   rB   
datetime64r%   firstr	   r(   )rL   r   rr   r   r   r   &test_frame_datetime64_handling_groupbyR  s    z2TestGroupBy.test_frame_datetime64_handling_groupbyc              	   C   s   d}t jt|d dddgd}|jdddjdd	 }ttd
ddtdddtdddtdddtdddgdtd}t	
|| d}|dj|}t |j|}tdddgdddgdd}t |j|}t	
|| d S )Nz0,2000-01-28 16:47:00,America/Chicago
1,2000-01-29 16:48:00,America/Chicago
2,2000-01-30 16:49:00,America/Los_Angeles
3,2000-01-31 16:50:00,America/Chicago
4,2000-01-01 16:50:00,America/New_Yorkr   r|   r   )headernamesF)rZ   c                 S   s   t | j| jS r   )r   r   r   tz_localizer3   r   r   r   r   r   g  r   z9TestGroupBy.test_groupby_multi_timezone.<locals>.<lambda>z2000-01-28 16:47:00-0600zAmerica/Chicagor   z2000-01-29 16:48:00-0600z2000-01-30 16:49:00-0800zAmerica/Los_Angelesz2000-01-31 16:50:00-0600z2000-01-01 16:50:00-0500zAmerica/New_York)r3   r:   z2000-01-28 16:47:00z2000-01-29 16:48:00z2000-01-31 16:50:00r   r   r   r5   r3   )r   Zread_csvr   r%   r|   r   r   r	   objectrE   r   r   r   r   r   )rL   r   r   rr   rO   r   Z
res_valuesZ
exp_valuesr   r   r   test_groupby_multi_timezone[  s4    




z'TestGroupBy.test_groupby_multi_timezonec           	      C   sd  ddddddg}t ddddddgdd |D tjdd	d
ddgd d}tjddddddgddd}tddgd dd}t||g}t ddddddgddddddgd|ddgd}|ddg	 }t
|| tj|dd}t tjdd	d
ddddddgd|d}tjdddgdd}t dddgdddgd|ddgd}|jdd	 }t
|| d S )Nr   r   r   r   r   c                 S   s   g | ]}t j|d dqS )Hr>   )r   ZPeriod)r   r   r   r   r   
<listcomp>  s     z;TestGroupBy.test_groupby_groups_periods.<locals>.<listcomp>r7   r8   r9   r   r   r   )r   periodr   r   r   r   ri   r   r   r   rc   r   r   r   r   r   r>   r4   rb   r   )r   rB   r   r   ZPeriodIndexr   r   r   r%   rI   rE   rJ   r   r   r   r   test_groupby_groups_periods  sd    
	 z'TestGroupBy.test_groupby_groups_periodsc                 C   s   t ddg}|d d|d< t|d jjtjs6t|jdd	 }|d j}t|jtjsbt|d jdd	 }|j}t|jtjstd S )N)r        |>c )r   r   r   zM8[ns]r   r   )
r   view
issubclassr:   typerB   r   r(   r%   r   )rL   r   rr   Zgot_dtr   r   r   test_groupby_first_datetime64  s    
z)TestGroupBy.test_groupby_first_datetime64c                 C   sR   t tdtdd}|dd dd }|dd  }t|| d S )NZ20130101r   r   ra   c                 S   s   |   S r   )maxr   r   r   r   r     r   z9TestGroupBy.test_groupby_max_datetime64.<locals>.<lambda>)	r   r	   rB   r   r%   r   r   rE   r   )rL   r   rO   rr   r   r   r   test_groupby_max_datetime64  s    z'TestGroupBy.test_groupby_max_datetime64c                 C   sV   t tdtdgd d}|dd t}ttdgd dd}t|| d S )Nr   z	2000-01-1r   ra   r   r   )	r   ranger	   r%   Z	transformminr   rE   r   rL   r   rr   rO   r   r   r   test_groupby_datetime64_32_bit  s    z*TestGroupBy.test_groupby_datetime64_32_bitc                 C   sh   t jd tt jjddddtddddd	d
}|d d }|dd  }t	|| d S )N*   r   r   <   )sizez01/01/2000 00:00sUTC)r   r$   r   )factortimer   r   )
rB   randomseedr   randintr
   r%   r   rE   r   )rL   r   Zdf1Zdf2r   r   r   $test_groupby_with_timezone_selection  s    z0TestGroupBy.test_groupby_with_timezone_selectionc                 C   sp   t dgttjgd}|d d jtjks2tt ddddgi}ttj|d< |d d jtjksltd S )Nr   )r   r   r   r   r   r   r   )r   r   nowpytzutctzinfor(   )rL   r   r   r   r   test_timezone_info  s
    zTestGroupBy.test_timezone_infoc                 C   sd   t dddgd tddddd}|d	j }tdddgtdddgd	d
dd}t|| d S )Nr   r   r   r   r7   T)r   r$   )r   r   r   r   r   r   )	r   r
   r%   r   countr   r   rE   r   r   r   r   r   test_datetime_count  s    "zTestGroupBy.test_datetime_countc                 C   s   ddl m} ttjdddtjgtj|dd|dd|d	dtjgd
}t|j|_d|d< ||j  }|	d}|	d}t
| |  t
| |  t
| |  t
| |  d S )Nr   )	timedeltaz2015-07-24 10:10z2015-07-25 11:11z2015-07-23 12:12r   )daysr   r   )r   tdra   group)r   r   r   rB   nanr   r   r   Znotnar%   rE   rJ   r   r   r   last)rL   r   Zdf_testZdf_refZgrouped_testZgrouped_refr   r   r   $test_first_last_max_min_on_time_data  s(    "

z0TestGroupBy.test_first_last_max_min_on_time_datac                 C   s|   t tdtjtdgdddgd}tddd	}||d
  }||j  |d
  }|j	
d |_	t|| d S )Nz2016-06-28 09:35:35z2016-06-28 16:46:28123)r   r   r   hr"   r   )r   r	   r   r   r   r%   Znuniquer   Znotnullr5   
_with_freqrE   r   )rL   testr'   rr   rO   r   r   r   %test_nunique_with_timegrouper_and_nat  s    z1TestGroupBy.test_nunique_with_timegrouper_and_natc                 C   st   dddgt dddgdddd	d
gd}t|d}tdd}||}| }||g}| }t|| d S )NZshanghaiZbeijingz2017-08-09 13:32:23z2017-08-11 23:23:15z2017-08-11 22:23:15zdatetime64[ns]r9   r   r   r   )locationr   r   r   rt   r>   )r   r   rA   r   r%   r   rE   rJ   )rL   Z
data_framer'   r   rr   rO   r   r   r   !test_scalar_call_versus_list_call/  s    

z-TestGroupBy.test_scalar_call_versus_list_callc                 C   sn   d}t jd|ddd}tt||d}||jj }ttd|ttd|d |j	d	d}t
|| d S )
Nr   z2018-01ru   ZMonth)r   r   r$   r3   r4   r   r   r   )r   Zperiod_ranger   r   r%   r5   r   rI   r   r3   rE   r   )rL   r   r5   Zperiod_seriesrr   rO   r   r   r   test_grouper_period_indexC  s        z%TestGroupBy.test_grouper_period_indexc                 C   sj   |}|d  dd }tddddd}t|d	gt| g}td
ddddddg|dd}t|| d S )Nr   c                 S   s   dt | iS )Nre   )r&   r   r   r   r   r   Y  r   zRTestGroupBy.test_groupby_apply_timegrouper_with_nat_dict_returns.<locals>.<lambda>
2013-09-01
2013-10-01r!   r   ri   re   r   r   r   r   )r   r
   r   r   r&   r   rE   r   )rL   r+   r*   resdtimirO   r   r   r   4test_groupby_apply_timegrouper_with_nat_dict_returnsQ  s    z@TestGroupBy.test_groupby_apply_timegrouper_with_nat_dict_returnsc                 C   sb   |}|d  dd }tddddd}td	tjtjtjtjtjd
g|d dd}t|| d S )Nr   c                 S   s   t | r| jd S tjS )Nr   )r&   rD   rB   r   r   r   r   r   r   g  r   zTTestGroupBy.test_groupby_apply_timegrouper_with_nat_scalar_returns.<locals>.<lambda>r   r  r!   r   ri   r   r   r   )r   r
   r   rB   r   r   rE   r   )rL   r+   r*   r  r  rO   r   r   r   6test_groupby_apply_timegrouper_with_nat_scalar_returns`  s    zBTestGroupBy.test_groupby_apply_timegrouper_with_nat_scalar_returnsc              	   C   s   |}t ddd}tjtdd |j|dd}W 5 Q R X |jdksFt|j|j	j
dks^t|d	d
 }td}|d   j}tj|g|gdd gd}|d |jd }	t|	|dd}
t||
 d S )Nr   Z100Yr"   z`squeeze` parameterr<   T)Zsqueezer   c                 S   s   | d d S )Nr   r   r   r   r   r   r   r     r   zSTestGroupBy.test_groupby_apply_timegrouper_with_nat_apply_squeeze.<locals>.<lambda>r   )r   r   r   r   )r   rE   rF   rG   r%   Zngroupsr(   Z_selected_objZ	_get_axisZaxisZnlevelsr   r	   r@   r   r5   r   Zfrom_productZtakevaluesr   r   )rL   r    r   r)   r*   r  r#   Zorderingr  Z	ex_valuesrO   r   r   r   5test_groupby_apply_timegrouper_with_nat_apply_squeezer  s    zATestGroupBy.test_groupby_apply_timegrouper_with_nat_apply_squeezenumbac                 C   sp   |}|d j dd dd}|d  tj}t|| |dg j dd dd}|dg  tj}t|| d S )Nr   c                 S   s
   t | S r   rB   nanmeanr  r5   r   r   r   r     r   zITestGroupBy.test_groupby_agg_numba_timegrouper_with_nat.<locals>.<lambda>r	  )Zenginec                 S   s
   t | S r   r
  r  r   r   r   r     r   )Z	aggregaterB   r  rE   r   rJ   )rL   r+   r*   rr   rO   Z	result_dfZexpected_dfr   r   r   +test_groupby_agg_numba_timegrouper_with_nat  s     
 z7TestGroupBy.test_groupby_agg_numba_timegrouper_with_natN)"__name__
__module____qualname__rT   rm   markZparametrizer_   rs   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r   r  r  r  r   Z
skip_if_nor  r   r   r   r   r,   J   s<   /
  ;
:B?	'=	
r,   )!__doc__r   ior   ZnumpyrB   rm   r   Zpandas.util._test_decoratorsutilZ_test_decoratorsr   Zpandasr   r   r   r   r   r   r	   r
   r   Zpandas._testingZ_testingrE   Zpandas.core.groupby.grouperr   Zpandas.core.groupby.opsr   Zfixturer    r+   r,   r   r   r   r   <module>   s    (


