o
     \iT                     @   s   d Z ddlmZmZ ddlZddlZddlZddlZddlm	Z	m
Z
mZmZmZmZmZmZ ddlmZ ddlmZ ddlmZ ejdd Zejd	d
 ZG dd dZdS )z5
test with the TimeGrouper / grouping with datetimes
    )datetime	timedeltaN)	DataFrameDatetimeIndexIndex
MultiIndexSeries	Timestamp
date_rangeoffsets)Grouper)
BinGrouperc                  C   s`   t g dtdddddtdddddtdddd	dtddd
ddtjtdddddgd} | S )z
    DataFrame used by groupby_with_truncated_bingrouper, made into
    a separate fixture for easier reuse in
    test_groupby_apply_timegrouper_with_nat_apply_squeeze
                	   r     r   r      r   r   
      r         )QuantityDate)r   r	   pdNaT)df r   /var/www/www-root/data/www/176.119.141.140/sports-predictor/venv/lib/python3.10/site-packages/pandas/tests/groupby/test_timegrouper.pyframe_for_truncated_bingrouper   s   r!   c                 C   s:   | }t ddd}||}t|jjt|jjksJ |S )a.  
    GroupBy object such that gb._grouper is a BinGrouper and
    len(gb._grouper.result_index) < len(gb._grouper.group_keys_seq)

    Aggregations on this groupby should have

        dti = date_range("2013-09-01", "2013-10-01", freq="5D", name="Date")

    As either the index or an index level.
    r   5Dkeyfreq)r   groupbylen_grouperresult_indexgroup_keys_seq)r!   r   tdggbr   r   r    !groupby_with_truncated_bingrouper4   s
   
r-   c                   @   s  e Zd Zdd Zejdddgdd Zdd	 Zejd
g ddd Z	dd Z
dd Zdd Zdd Zdd Zdd Zdd Zdd Zdd Zd d! Zd"d# Zd$d% Zd&d' Zd(d) Zd*d+ Zd,d- Zd.d/ Zd0d1 Zd2d3 Zd4d5 Zd6d7 Zd8d9 Zejj d:d; Z!d<S )=TestGroupByc                 C   s  t d g dtdddddtdddddtdd	dd
dtdd	dd	dtdddddtdddddgd}|jdd}||fD ]}|dg}tddddd|jjd}t |rYdnddd|d}|dt	i}|rq|ddi}d|j
d< d|j
d < d!|j
d"< tjg d#d$d%|j
g d&df< |d }t|| | }|tdd' }	t|	| |tdd' }
t|
| q@d S )(NzCarl Carl Carl Carl Joe Carlr   r   r   r   r   r   r   r   r   r      r   r   Buyerr   r   r   byr   2013090120131205r"   left)r%   name	inclusiveunit )r1   r   indexr1   strCarlCarlCarl)r   r   CarlCarl)   r   Joe)r   r   )   r@   r   int64dtype)r   r@   r   r%   )r   splitr   sort_values	set_indexr
   r<   r9   astypeobjectilocnparrayresamplesumtmassert_frame_equal
sort_indexr&   r   )selfusing_infer_stringdf_originaldf_reorderedr   exp_dtiexpectedresult1	df_sortedresult2result3r   r   r    test_groupby_with_timegrouperL   sT   


 z)TestGroupBy.test_groupby_with_timegroupershould_sortTFc                 C   s   t d d g dtdddddtdddddtdd	dd
dtdd	dd	dtdddddtdddddgd}|rB|jddd}|jddd}|tdd}|jsVJ t|j	t
s^J |j}t|tshJ t|dkspJ d S )NzA A A A A BzCarl Mark Carl Joe Joe Carl)r   r   r      r   r   r   r   r   r   r   r   r   r   r/   r   Branchr1   r   r   r   Fr3   	ascendingr   drop6MErF   r   )r   rG   r   rH   rI   r&   r   
group_keys
isinstancer(   r   groupsdictr'   )rT   r_   r   grj   r   r   r    %test_groupby_with_timegrouper_methods   s,   
z1TestGroupBy.test_groupby_with_timegrouper_methodsc                 C   sX  t d d g dtdddddtdddddtdd	dd
dtdd	dd	dtdd	dd
dtdd	dd	dtdddddtdddddgdd}|jddd}||fD ]}t d g dtdddddtdddddtdddddgdddg}d}|tdddgjdd}t	|| t d g dtdddddtdddddtdddddtdddddgdddg}|td ddgjdd}t	|| qUt d d g dtdd	dddtdd	dddtdd	dd
dtdd	dd	dtdd	dd
dtdd	dd	dtdd	dddtdd	dddgdd}|jddd}||fD ]}t d! g d"tdd	dddtdd	dddtdd	dddtdd	dddtdd	dddgdddg}|td#ddgjdd}t	|| |td$ddgjdd}t d g dtdd	dddtdd	dddtdd	dddgdddg}t	|| |
 }|td$dd%dgjdd}t	|| tjtd&d' |td$d(d%dg  W d    n	1 sw   Y  |d}|td$dd)dgjdd}t	|| |td$dd)dgjdd}t	|| tjtd*d' |td$d(d)dg  W d    n	1 s<w   Y  | }|jtd |d< |td$dd%dgjdd}t d g dtdd+d,ddtdd+d,ddtdd+d,ddgdddg}t	|| d-}tjt|d' |td$ddd.dg  W d    n	1 sw   Y  t dggdgttdd	dddgt dd/d0}|td$djdd}t	|| |td$dgjdd}t	|| |jd|_|jjt ksJ |td$dd%jdd}t	|| |td$dd%gjdd}t	|| q*d S )1NzA A A A A A A Bz$Carl Mark Carl Carl Joe Joe Joe Carl)r   r   r   r   r`   r   r   r   r   r   r   r   r   r   r   r   r/   r   ra   r   r   Frc   zCarl Joe Mark)r   r   r      r0   r1   z!The default value of numeric_onlyYErF   T)numeric_onlyzCarl Mark Carl Joe)r   r   r   r      6MSzCarl Joe Mark Carl Joe)r@   r`   r      r   1D1MEr%   r$   z#'The grouper name foo is not found'matchfoo)r%   levelzThe level foo is not valid      z2The Grouper cannot specify both a key and a level!)r%   r$   rz   r%   r7   columnsr<   )r   rG   r   rI   rH   r&   r   rP   rQ   rR   reset_indexpytestraisesKeyError
ValueErrorcopyr<   r   MonthEndr   shiftr%   )rT   rV   r[   r   rY   msgresultr   r   r     test_timegrouper_with_reg_groups   s<  








z,TestGroupBy.test_timegrouper_with_reg_groupsr%   )DMEro   zQE-APRc                 C   s   t tg dg dg dg ddd}|dd |jd	d
 ddg	 
d}d|_|	 t|ddgd  }t|| |t|ddgd  }t|| d S )N)2012100220121007201301302013020220130305r   20121207r   r   r   r   r   )r   r   r   r   r   r   r   r   r   r   r   r   )i  il  i  i     io  Z   i8  g  i-  r   i!  )r/      r   rB   '   r   r   r   -   "   r   r/   )dateuser_id
whole_costcost1r   r   r   r   )	min_countrC   rF   )r   r   to_datetimerI   r&   rO   rP   dropnareorder_levelsrS   rJ   r7   r   rQ   assert_series_equal)rT   r%   r   rY   rZ   r\   r   r   r    %test_timegrouper_with_reg_groups_freqZ  s4   #&
	z1TestGroupBy.test_timegrouper_with_reg_groups_freqc                 C   s  t d g dtdddddtdddddtdd	dd
dtdd	dd	dtdddddtdddddgd}|jdd}|jg d |jddg |jdg g}g d}||fD ]$}|tddd}t||D ]\}}t|}	|	|	}
t
|
| qgqW|jdg |jdg |jdg g}g d}||fD ]*}|dtdddg}t||D ]\\}}}t|}	|	||	f}
t
|
| qq|d}|jdd}|jg d |jddg |jdg g}||fD ]#}|tdd}t||D ]\}}t|}	|	|	}
t
|
| qqd S )NzCarl Joe Joe Carl Joe Carlr   r   r   r   r   r   r   r   r   r   r/   r   r   r0   r   r2   )r   r   r   rs   )
2013-09-30
2013-10-31
2013-12-31r   r   rv   ))rA   r   )Carlr   )rA   r   r1   rF   )r   rG   r   rH   rL   r&   r   zipr	   	get_grouprQ   rR   rI   )rT   rV   rW   expected_listdt_listr   groupedtrY   dtr   g_listbr   r   r    test_timegrouper_get_group  sf   







z&TestGroupBy.test_timegrouper_get_groupc                 C   s   t ddgddgd}| }t|d |d< dd }d	}tjt|d
 |tdd	|}W d    n1 s;w   Y  d	}tjt|d
 |tddd	|}W d    n1 s`w   Y  t
|jdd|jdd d S )N
10/10/2000
11/10/2000r   r   r   valuer   c                 S   s   t | d  gdS )Nr   )rP   )r   rP   xr   r   r    sumfunc_series  s   zMTestGroupBy.test_timegrouper_apply_return_type_series.<locals>.sumfunc_series7DataFrameGroupBy.apply operated on the grouping columnsrw   r$   r   rv   Tre   )r   r   r   r   rQ   assert_produces_warningFutureWarningr&   r   applyrR   r   )rT   r   df_dtr   r   rY   r   r   r   r    )test_timegrouper_apply_return_type_series  s   z5TestGroupBy.test_timegrouper_apply_return_type_seriesc                 C   s   t ddgddgd}| }t|d |d< dd }d	}tjt|d
 |tdd	|}W d    n1 s;w   Y  tjt|d
 |tddd	|}W d    n1 s^w   Y  t
|jdd|jdd d S )Nr   r   r   r   r   r   c                 S   s
   | j  S N)r   rP   r   r   r   r    sumfunc_value  s   
zKTestGroupBy.test_timegrouper_apply_return_type_value.<locals>.sumfunc_valuer   rw   r   r   rv   Tre   )r   r   r   r   rQ   r   r   r&   r   r   r   r   )rT   r   r   r   r   rY   r   r   r   r    (test_timegrouper_apply_return_type_value  s   z4TestGroupBy.test_timegrouper_apply_return_type_valuec                 C   sb   d}t dd|d}tt|t|d|d}|dd }|j}ttt|	 t
s/J d S )	Ni  z2012/1/15min)startr%   periods)highlowr;   c                 S   s   t | j| j| jS r   )r   yearmonthdayr   r   r   r    <lambda>  s    z?TestGroupBy.test_groupby_groups_datetimeindex.<locals>.<lambda>)r
   r   rM   aranger&   rj   ri   nextiterkeysr   )rT   r   indr   r   rj   r   r   r    !test_groupby_groups_datetimeindex   s   z-TestGroupBy.test_groupby_groups_datetimeindexc           
      C   s   t dddd}tg dg dd|d}|jdd	j}g d
}dd |D }t|| |jdd	}|D ]/}||}|j|df |j|df gg}t|gdd|j	d}	t|t
d|	d}t|| q4d S )Nz
2015/01/01r   r   )r   r7   )r   r@   rq   r`   r   )r   r   r   rs   r   ABr;   rz   )z
2015-01-05z
2015-01-04z
2015-01-03z
2015-01-02z
2015-01-01c                 S   s    i | ]}t |t|gd dqS )r   r7   )r	   r   ).0r   r   r   r    
<dictcomp>  s    zBTestGroupBy.test_groupby_groups_datetimeindex2.<locals>.<dictcomp>r   r   r   )r7   r%   rE   ABr~   )r
   r   r&   rj   rQ   assert_dict_equalr   locr   rE   listrR   )
rT   r<   r   r   datesrY   r   r   dataexpected_indexr   r   r    "test_groupby_groups_datetimeindex2  s$   
z.TestGroupBy.test_groupby_groups_datetimeindex2c           	      C   s4  g d}t g d|tjdddddgd d	}|d
 dd |d
< tg ddd
d}tddgd dd}t||g}t g dg dd|ddgd}|d
dg	 }t
|| t|dd}t tjdddg dd|d}tg ddd}t g dg d d|ddgd}|jd!d"	 }t
|| d S )#N2011-07-19 07:00:002011-07-19 08:00:002011-07-19 09:00:00r   r   r   ar   r   r   r   r   r@   rC   rD   r   r   r   )labelr   value1value2r   c                 S   s   t | ddS )N
US/Pacifictz)r	   )dr   r   r    r   4      zBTestGroupBy.test_groupby_groups_datetimeindex_tz.<locals>.<lambda>r   r   r   r   r   r   r   )r   r7   r   r   r   r   r   r   r   rs   r   r   r   r   r   r   r   r   r   r   r   r   r<   r   z
Asia/Tokyor   r   r   r   r   r   r   r;   r   r   r   r   r   rq   r   rs   r@   r   r   )r   rM   r   r   r   r   r   from_arraysr&   rP   rQ   rR   	rT   r   r   exp_idx1exp_idx2exp_idxrY   r   didxr   r   r    $test_groupby_groups_datetimeindex_tz"  sN   
z0TestGroupBy.test_groupby_groups_datetimeindex_tzc                 C   sR   t dtdfdtdfgddgd}|d }|d d tdks'J d S )Nr   z
2012-07-03z
2012-07-04r   r   )r   )r   rM   
datetime64r&   firstr	   )rT   r   r   r   r   r    &test_frame_datetime64_handling_groupbya  s   z2TestGroupBy.test_frame_datetime64_handling_groupbyc              	   C   s   t tdg dg dd}|jdddjdd	 }ttd
ddtdddtdddtdddtdddgdtd}t	|| d}|dj
|}t|j|}tg dg ddd}t|j|}t	|| d S )Nr   )2000-01-28 16:47:002000-01-29 16:48:00z2000-01-30 16:49:002000-01-31 16:50:00z2000-01-01 16:50:00)America/Chicagor  America/Los_Angelesr  America/New_York)r   r   r   r   F)rh   c                 S   s   t | j| jS r   )r   r   r   tz_localizer7   r   r   r   r    r     s    z9TestGroupBy.test_groupby_multi_timezone.<locals>.<lambda>z2000-01-28 16:47:00-0600r  r   z2000-01-29 16:48:00-0600z2000-01-30 16:49:00-0800r  z2000-01-31 16:50:00-0600z2000-01-01 16:50:00-0500r  r   )r7   rE   )r  r  r  )r   r   r   r<   r7   )r   ranger&   r   r   r   r	   rK   rQ   r   r   r   r   r   r  )rT   r   r   rY   r   
res_values
exp_valuesr   r   r    test_groupby_multi_timezonej  s<   




z'TestGroupBy.test_groupby_multi_timezonec           	      C   s.  g d}t g ddd |D tjddddd	gd
 d}tjg dddd}tddgd
 dd}t||g}t g dg dd|ddgd}|ddg	 }t
|| tj|dd}t tjdddg dd|d}tjg ddd}t g dg dd|ddgd}|jd d!	 }t
|| d S )"Nr   r   c                 S   s   g | ]	}t j|d dqS )hrF   )r   Period)r   r   r   r   r    
<listcomp>  s    z;TestGroupBy.test_groupby_groups_periods.<locals>.<listcomp>r@   rC   rD   r   r   r   )r   periodr   r   r   r  r  r}   r   r   r   r   r   r   r   r   r   r   rF   r   r;   r   r   r   r   r   )r   rM   r   r   PeriodIndexr   r   r   r&   rP   rQ   rR   r   r   r   r    test_groupby_groups_periods  sL   
	z'TestGroupBy.test_groupby_groups_periodsc                 C   s   t ddg}|d d|d< t|d jjtjsJ |jdd }|d j}t|jtjs1J |d jdd }|j}t|jtjsGJ d S )N)r        |>c )r   r  r   zM8[ns]r   r   )	r   rJ   
issubclassrE   typerM   r   r&   r   )rT   r   r   got_dtr   r   r    test_groupby_first_datetime64  s   
z)TestGroupBy.test_groupby_first_datetime64c                 C   sX   t tdtdd}|dd dd d}|dd  }t	|| d S )N20130101r   r   r   c                 S   s   |   S r   )maxr   r   r   r    r     s    z9TestGroupBy.test_groupby_max_datetime64.<locals>.<lambda>zM8[s])
r   r	   rM   r   r&   r   rJ   r  rQ   r   )rT   r   rY   r   r   r   r    test_groupby_max_datetime64  s   z'TestGroupBy.test_groupby_max_datetime64c                 C   sV   t tdtdgd d}|dd d}ttdgd dd}t|| d S )Nr   z	2000-01-1r   r   r   minr   )r   r
  r	   r&   	transformr   rQ   r   rT   r   r   rY   r   r   r    test_groupby_datetime64_32_bit  s   z*TestGroupBy.test_groupby_datetime64_32_bitc                 C   sb   t tjdjddddtddddd	d
}|d d }|dd  }t	|| d S )Nr   r   r   <   )sizez01/01/2000 00:00sUTC)r   r%   r   )factortimer$  r%  )
r   rM   randomdefault_rngintegersr
   r&   r  rQ   r   )rT   r   df1df2r   r   r    $test_groupby_with_timezone_selection  s   z0TestGroupBy.test_groupby_with_timezone_selectionc                 C   sn   t dgttjgd}|d d jtjksJ t dg di}ttj|d< |d d jtjks5J d S )Nr   )r   r   r   r   r   r   r   r   )r   r   nowpytzutctzinfo)rT   r   r   r   r    test_timezone_info  s
   zTestGroupBy.test_timezone_infoc                 C   s^   t g dd tddddd}|dj }tg d	tg ddd
dd}t|| d S )Nr,  r   r-  r@   r  )r   r%   )r   r   r   )r   r   r   r   r   r	  )	r   r
   r&   r   countr   r   rQ   r   r  r   r   r    test_datetime_count  s   zTestGroupBy.test_datetime_countc                 C   s   t tjdddtjgtjtddtddtddtjgd}t|j|_d	|d
< ||j  }|d
}|d
}t	
| |  t	
| |  t	
| |  t	
| |  d S )Nz2015-07-24 10:10z2015-07-25 11:11z2015-07-23 12:12r   )daysr   r   )r   tdr   group)r   rM   nanr   r   r   r   notnar&   rQ   rR   r  r  r   last)rT   df_testdf_refgrouped_testgrouped_refr   r   r    $test_first_last_max_min_on_time_data  s0   

z0TestGroupBy.test_first_last_max_min_on_time_datac                 C   sz   t tdtjtdgg dd}tddd}||d  }||j  |d  }|j	
d |_	t|| d S )	Nz2016-06-28 09:35:35z2016-06-28 16:46:28)123)r%  r   r%  r  r#   r   )r   r	   r   r   r   r&   nuniquer%  notnullr<   
_with_freqrQ   r   )rT   testgrouperr   rY   r   r   r    %test_nunique_with_timegrouper_and_nat;  s   z1TestGroupBy.test_nunique_with_timegrouper_and_natc                 C   sn   g dt g dddg dd}t|d}tdd	}||}| }||g}| }t|| d S )
N)shanghaibeijingrH  )z2017-08-09 13:32:23z2017-08-11 23:23:15z2017-08-11 22:23:15zdatetime64[ns]rD   r,  )locationr%  r   r%  r   rF   )r   r   rI   r   r&   r2  rQ   rR   )rT   
data_framerF  r   r   rY   r   r   r    !test_scalar_call_versus_list_callN  s   

z-TestGroupBy.test_scalar_call_versus_list_callc                 C   sl   d}t jd|ddd}tt||d}||jj }tt|ttd|d |j	dd}t
|| d S )	Nr   z2018-01MMonth)r   r   r%   r7   r;   r   r   )r   period_ranger   r
  r&   r<   r   rP   r   r7   rQ   r   )rT   r   r<   period_seriesr   rY   r   r   r    test_grouper_period_indexb  s   z%TestGroupBy.test_grouper_period_indexc           	      C   st   |}|d  dd }|j}|d jj}tdddd|d}t|d	gt| g}tg d
|dd}t	
|| d S )Nr   c                 S   s   dt | iS )Nry   )r'   r   r   r   r    r   x  r   zRTestGroupBy.test_groupby_apply_timegrouper_with_nat_dict_returns.<locals>.<lambda>r   
2013-09-01
2013-10-01r"   r%   r7   r9   ry   )r   r   r   r   r   r   r   r	  )r   obj_valuesr9   r
   r   r   r'   r   rQ   r   )	rT   r-   r,   resr   r9   dtimirY   r   r   r    4test_groupby_apply_timegrouper_with_nat_dict_returnsp  s   z@TestGroupBy.test_groupby_apply_timegrouper_with_nat_dict_returnsc                 C   sv   |}|d  dd }|j}|d jj}tdddd|d}td	tjtjtjtjtjd
g|d dd}t	
|| d S )Nr   c                 S   s   t | r	| jd S tjS )Nr   )r'   rL   rM   r7  r   r   r   r    r     s    zTTestGroupBy.test_groupby_apply_timegrouper_with_nat_scalar_returns.<locals>.<lambda>r   rR  rS  r"   rT  r   r   r	  )r   rU  rV  r9   r
   r   rM   r7  rD  rQ   r   )rT   r-   r,   rW  r   r9   rX  rY   r   r   r    6test_groupby_apply_timegrouper_with_nat_scalar_returns  s   zBTestGroupBy.test_groupby_apply_timegrouper_with_nat_scalar_returnsc           	      C   s   |}t ddd}||}|jdksJ |j|jjdks J d}tjt	|d |
dd }W d    n1 s;w   Y  ttd	g|d jdd
}tg dg|tg dddd}t|| d S )Nr   100YEr#   r   r   rw   c                 S   s   | d d S )Nr   r   r   r   r   r   r    r     r   zSTestGroupBy.test_groupby_apply_timegrouper_with_nat_apply_squeeze.<locals>.<lambda>r   )rE   r7   )$   r@   r@   r   r   )r   r   r   r   r   r   r   r   )r   r&   ngroups_selected_obj	_get_axisaxisnlevelsrQ   r   r   r   r   r	   rE   r   rR   )	rT   r!   r   r+   r,   r   rW  rX  rY   r   r   r    5test_groupby_apply_timegrouper_with_nat_apply_squeeze  s    
zATestGroupBy.test_groupby_apply_timegrouper_with_nat_apply_squeezec                 C   sv   t d |}|d jdd dd}|d d}t|| |dg jdd dd}|dg d}t|| d S )Nnumbar   c                 S   
   t | S r   rM   nanmeanvaluesr<   r   r   r    r        
 zITestGroupBy.test_groupby_agg_numba_timegrouper_with_nat.<locals>.<lambda>)enginemeanc                 S   re  r   rf  rh  r   r   r    r     rj  )r   importorskip	aggregaterQ   r   rR   )rT   r-   r,   r   rY   	result_dfexpected_dfr   r   r    +test_groupby_agg_numba_timegrouper_with_nat  s   

z7TestGroupBy.test_groupby_agg_numba_timegrouper_with_natN)"__name__
__module____qualname__r^   r   markparametrizerm   r   r   r   r   r   r   r   r   r  r  r  r  r  r  r+  r1  r3  r>  rG  rL  rQ  rZ  r[  rc  
single_cpurq  r   r   r   r    r.   K   s@    8
  6
:B?	2=		
"r.   )__doc__r   r   numpyrM   r   r.  pandasr   r   r   r   r   r   r	   r
   r   pandas._testing_testingrQ   pandas.core.groupby.grouperr   pandas.core.groupby.opsr   fixturer!   r-   r.   r   r   r   r    <module>   s    (


