fume-manage-python.git

U  
¬ý°drã@s@ddlmZddlmZmZmZmZmZddlZ    ddl
mZddlm Z mZmZmZddlmZmZddlmZddlmZmZmZmZmZdd    lmZmZddlm m!Z"dd
l#m$Z$ddl%m&Z&ddl'm(Z(m)Z)m*Z*dd l+m,Z,ddl-m.Z.ddl/m0Z0erddl1m2Z2edee$ddddGdddddddddddZ3dddddddddd d!Z4dHd"ddd#d$d%Z5dIddd&d'd(Z6dJdd)d*d+Z7dKddd,d-d.Z8d/d0Z9edee$d1ddej:ej:d2dd3d4d4dd5d6d1Z;dLdddddd7d8d9Z<dMddddd:d;d<Z=dNd>d?d@dAZ>dBdBdCdDdEdFZ?dS)Oé)Úannotations)Ú TYPE_CHECKINGÚCallableÚHashableÚSequenceÚcastN)Úlib)ÚAggFuncTypeÚAggFuncTypeBaseÚAggFuncTypeDictÚ
IndexLabel)ÚAppenderÚSubstitution)Úmaybe_downcast_to_dtype)Úis_extension_array_dtypeÚis_integer_dtypeÚis_list_likeÚis_nested_list_likeÚ    is_scalar)ÚABCDataFrameÚ    ABCSeries)Ú_shared_docs)ÚGrouper)ÚIndexÚ
MultiIndexÚget_objs_combined_axis)Úconcat)Úcartesian_product)ÚSeries©Ú    DataFramez
data : DataFrameÚpivot_tableé)ÚindentsÚmeanFTÚAllr r    Úboolr)ÚdataÚaggfuncÚmarginsÚdropnaÚmargins_nameÚobservedÚsortÚreturncCs¬t|}t|}t|trg}g}|D]>} t|||||| ||||    |
d}| |¡| t| d| ¡q&t||dd}|j|ddSt||||||||||    |
}|j|ddS)N)
ÚvaluesÚindexÚcolumnsÚ
fill_valuer(r)r*r+r,r-Ú__name__r")ÚkeysÚaxisr!)Úmethod)Ú_convert_byÚ
isinstanceÚlistÚ__internal_pivot_tableÚappendÚgetattrrZ__finalize__)r'r/r0r1r(r2r)r*r+r,r-Úpiecesr4ÚfuncZ_tableÚtable©r@úPd:\z\workplace\vscode\pyvenv\venv\Lib\site-packages\pandas/core/reshape/pivot.pyr!8sJ
õ 
õ z!AggFuncTypeBase | AggFuncTypeDictcCs||}|dk    }|r¸t|r*d} t|}n
d} |g}|D]}||kr8t|q8g}||D]@}t|trn|j}z||kr| |¡WqZtk
rYqZXqZt|t|j    krú||}nB|j    }|D].}z| 
|¡}WqÂtttfk
rîYqÂXqÂt|}|j||    |
d}|  |¡}|r¶t|tr¶t|j    r¶|jdd}|D]r}||krBt||rB||krBt||sBt||tsBt||jtjrBt||||j||<qB|}|jjdkr@|r@|jjdt|}g}tt|t|D]<}|jj|}|dks||kr(| |¡n
| |¡qø| |¡}|s²t|jtr|tjt|jj|jjd}|j|d    d
}t|j    tr²tjt|j    j|j    jd}|j|dd
}|
dkrÔt|trÔ|jdd
}|dk    rì|j|dd}|r&|r||  ¡j!dd
}t"|||||||||d     }|rN| sN|j    jdkrN|j#d    dd
}t|d    krpt|d    krp|j$}t|tr|r|jddd}|S)zL
    Helper of :func:`pandas.pivot_table` for any non-list ``aggfunc``.
    NTF)r,r-Úall)Úhowr"©Únamesr©r5Zinfer)Zdowncast)ÚrowsÚcolsr(r,r+r2)rCr5)%rr9ÚKeyErrorr8rÚkeyr;Ú    TypeErrorÚlenr1ZdropÚ
ValueErrorÚgroupbyÚaggrr*rÚdtypeÚnprr0ÚnlevelsrEÚrangeÚunstackrÚfrom_arraysrÚlevelsÚreindexZ
sort_indexÚfillnaZnotnarBÚ_add_marginsZ    droplevelÚT)r'r/r0r1r(r2r)r*r+r,r-r4Z values_passedZvalues_multiÚiZ    to_filterÚxrJZgroupedZaggedÚvr?Zindex_namesZ
to_unstackÚnameÚmr@r@rAr:qs¾
 
 
 
 
ÿ
þý
üÿ
 
ÿ
ÿ
÷ r:zDataFrame | Series)r?r'r+c        Cst|tstdd|d}    |jjD]}
||j |
¡kr&t|    q&t||||}|jdkr|jjddD]}
||j |
¡krlt|    qlt    |dkr®|fdt    |d}n|}|sÖt|t
rÖ| t|||i¡S|rt ||||||||} t| ts| S| \}}}n>t|tstt|||||||} t| tsB| S| \}}}|j|j|d}|D]0}t|tr~||||<n||d||<q`dd    lm}||t|gd
j}|jj}t|jD]:}t|rÖqÄ| |g¡j}||jt|fd||<qÄ| |¡}||j_|S)Nz&margins_name argument must be a stringzConflicting name "z" in marginsér"©Ú)r2rr)r1)Úargs)r8ÚstrrMr0rEÚget_level_valuesÚ_compute_grand_marginÚndimr1rLrÚ_appendrÚ_generate_marginal_resultsÚtuplerÚAssertionErrorÚ)_generate_marginal_results_without_valuesrWÚpandasr rrZÚsetZdtypesrZ select_dtypesÚapplyr)r?r'r/rGrHr(r,r+r2ÚmsgÚlevelÚgrand_marginrJZmarginal_result_setÚresultÚmargin_keysÚ
row_marginÚkr Zmargin_dummyZ    row_namesrPr@r@rArYs|
 
 
 
ÿÿ
 
ÿ
rY)r'r+c    Cs¶|r¤i}|| ¡D]\}}zlt|tr:t||||<nLt|trzt||trht|||||<q|||||<n||||<Wqtk
rYqXq|S|||jiSdS©N)Úitemsr8rdr<ÚdictrKr0)r'r/r(r+rrrvr]r@r@rArfVs
 
rf)r+csøtdkrxg}g}    fdd}
t|dkr|||j||d |¡}d}|jd||dD]8\} }|
| }| ¡}|| ||<| |¡|     |¡q`n²ddlm}d}|jd||dD]\} }tdkrÚ|
| }n}| |¡|| |¡j}t    |j
tr$tj|g|j
j dgd|_
nt|g|j
jd    |_
| |¡|     |¡q¼|sX|St||d
}t|dkr|Sn
|}|j}    tdkrÞ||j|d |¡}| ¡}tgttt}|j
 |¡|_
nttj|jd}||    |fS)Nrcs|fdtdS)Nrar"©rL)rJ©rHr+r@rAÚ_all_keyusz,_generate_marginal_results.<locals>._all_key©r,r"©rqr5r,rrD©r^rF©r0)rLrNrOÚcopyr;rmr rorZr8r0rÚfrom_tuplesrErr^rr1Ústackr9rSZreorder_levelsrrQÚnan)r?r'r/rGrHr(r,r+Ztable_piecesrtr|ÚmarginZcat_axisrJZpieceÚall_keyr Ztransformed_piecersruZ    new_orderr@r{rArimsV
 
 
ÿ
 
ri)r?r+c sÞtdkrg}fdd}t|dkr`||j||d |¡}    |}
|    ||
<|}| |
¡q¢|jdd|d |¡}    |}
|    ||
<|}| |
¡|Sn
|}|j}trÄ|j|d |¡}nttj|jd}|||fS)Nrcs&tdkrSfdtdS)Nr"rarzr@r{r@rAr|Äsz;_generate_marginal_results_without_values.<locals>._all_keyr}r~r)rLrNror;r1rrQr) r?r'rGrHr(r,r+rtr|rrrsrur@r{rArl·s*    
rlcCsF|dkrg}n4t|s2t|tjtttfs2t|r:|g}nt|}|Srw)    rr8rQZndarrayrrrÚcallabler9)Zbyr@r@rAr7ãsÿþýr7Úpivot)r0r/rzIndexLabel | lib.NoDefault)r'r1r0r/r.cstt |¡}jddj ¡_ddjjDj_|tjkrz|tjk    rXt |¡}ng}|tjk}j|||d}nÖ|tjkrÂtjt    r¬fddt
jjD}qÚtjjj dg}nfddt |¡D}fd    d|D}    | |    ¡t     |¡}
t|r<t|ts<ttt|}j|j|
|d
}nj|j|
d}| |¡}dd|jjD|j_|S) NF)ÚdeepcSsg|]}|dk    r|ntjqSrw©rÚ    NoDefault©Ú.0r^r@r@rAÚ
<listcomp>szpivot.<locals>.<listcomp>)r;csg|]}j |¡qSr@)r0re)rr[©r'r@rArsrcsg|]}|qSr@r@)rÚidxrr@rArscsg|]}|qSr@r@)rÚcolrr@rArs)r0r1rcSsg|]}|tjk    r|ndqSrwrrr@r@rAr.s)ÚcomZconvert_to_list_likerr0rErrZ    set_indexr8rrSrRrr^ÚextendrUrrjrrrZ_constructorZ_valuesZ_constructor_slicedrT)r'r1r0r/Zcolumns_listlikerHr;ZindexedZ
index_listZdata_columnsZ
multiindexrsr@rrArñsL    
ÿ
 
 
 
ÿ
 
 
ÿ
 
ÿ
ÿ
)r)r+r*Ú    normalizer.c
CsX|dkr|dk    rtd|dk    r0|dkr0tdt|s>|g}t|sL|g}d}
dd||D}|rtt|ddd}
t||d    d
}t||dd
}t||\}} }}dd lm}tt| |tt||}|||
d}|dkròd|d<t    dd}n||d<d|i}|j
d| ||||d|}|    dk    r8t||    ||d}|j|dd}|j|dd}|S)aº 
    Compute a simple cross tabulation of two (or more) factors.
 
    By default, computes a frequency table of the factors unless an
    array of values and an aggregation function are passed.
 
    Parameters
    ----------
    index : array-like, Series, or list of arrays/Series
        Values to group by in the rows.
    columns : array-like, Series, or list of arrays/Series
        Values to group by in the columns.
    values : array-like, optional
        Array of values to aggregate according to the factors.
        Requires `aggfunc` be specified.
    rownames : sequence, default None
        If passed, must match number of row arrays passed.
    colnames : sequence, default None
        If passed, must match number of column arrays passed.
    aggfunc : function, optional
        If specified, requires `values` be specified as well.
    margins : bool, default False
        Add row/column margins (subtotals).
    margins_name : str, default 'All'
        Name of the row/column that will contain the totals
        when margins is True.
    dropna : bool, default True
        Do not include columns whose entries are all NaN.
    normalize : bool, {'all', 'index', 'columns'}, or {0,1}, default False
        Normalize by dividing all values by the sum of values.
 
        - If passed 'all' or `True`, will normalize over all values.
        - If passed 'index' will normalize over each row.
        - If passed 'columns' will normalize over each column.
        - If margins is `True`, will also normalize margin values.
 
    Returns
    -------
    DataFrame
        Cross tabulation of the data.
 
    See Also
    --------
    DataFrame.pivot : Reshape data based on column values.
    pivot_table : Create a pivot table as a DataFrame.
 
    Notes
    -----
    Any Series passed will have their name attributes used unless row or column
    names for the cross-tabulation are specified.
 
    Any input passed containing Categorical data will have **all** of its
    categories included in the cross-tabulation, even if the actual data does
    not contain any instances of a particular category.
 
    In the event that there aren't overlapping indexes an empty DataFrame will
    be returned.
 
    Reference :ref:`the user guide <reshaping.crosstabulations>` for more examples.
 
    Examples
    --------
    >>> a = np.array(["foo", "foo", "foo", "foo", "bar", "bar",
    ...               "bar", "bar", "foo", "foo", "foo"], dtype=object)
    >>> b = np.array(["one", "one", "one", "two", "one", "one",
    ...               "one", "two", "two", "two", "one"], dtype=object)
    >>> c = np.array(["dull", "dull", "shiny", "dull", "dull", "shiny",
    ...               "shiny", "dull", "shiny", "shiny", "shiny"],
    ...              dtype=object)
    >>> pd.crosstab(a, [b, c], rownames=['a'], colnames=['b', 'c'])
    b   one        two
    c   dull shiny dull shiny
    a
    bar    1     2    1     0
    foo    2     2    1     2
 
    Here 'c' and 'f' are not represented in the data and will not be
    shown in the output because dropna is True by default. Set
    dropna=False to preserve categories with no data.
 
    >>> foo = pd.Categorical(['a', 'b'], categories=['a', 'b', 'c'])
    >>> bar = pd.Categorical(['d', 'e'], categories=['d', 'e', 'f'])
    >>> pd.crosstab(foo, bar)
    col_0  d  e
    row_0
    a      1  0
    b      0  1
    >>> pd.crosstab(foo, bar, dropna=False)
    col_0  d  e  f
    row_0
    a      1  0  0
    b      0  1  0
    c      0  0  0
    Nz&aggfunc cannot be used without values.z)values cannot be used without an aggfunc.cSsg|]}t|ttfr|qSr@)r8rr)rr\r@r@rAr«szcrosstab.<locals>.<listcomp>TF)Z    intersectr-Úrow©ÚprefixrrrrÚ    __dummy__)r(r2r()r0r1r)r+r*)rr)r+)r0r5r")r1r5)r) rMrrÚ
_get_namesÚ_build_names_mapperrmr ryÚziprLr!Ú
_normalizeZrename_axis)r0r1r/ÚrownamesÚcolnamesr(r)r+r*rZ
common_idxZ    pass_objsÚrownames_mapperÚunique_rownamesÚcolnames_mapperÚunique_colnamesr r'ZdfÚkwargsr?r@r@rAÚcrosstab5sfjûþÿúù
ÿr¤)r?r)r+r.c 
CsHt|ttfsRddd}z||}Wn,tk
rP}ztd|W5d}~XYnX|dkrÎddddd    dd
}|d|d<z||}Wn,tk
r¶}ztd|W5d}~XYnX||}| d ¡}nv|dkr<|j}|j}    |jdddfj    }
||
k||
k@rt|d|jdddf}|jdddf}|jddddf}t
||dd}|dkr|| ¡}t||gdd}| d ¡}|    |_n¢|dkrÊ|| ¡}|  |¡}| d ¡}||_np|dksÞ|dkr2|| ¡}|| ¡}d|j|<t||gdd}|  |¡}| d ¡}||_|    |_ntdntd|S)Nr0r1)rr"zNot a valid normalize argumentFcSs||jddjddS©Nr"rFr©Úsum©r\r@r@rAÚ<lambda>îóz_normalize.<locals>.<lambda>cSs|| ¡Srwr¦r¨r@r@rAr©ïrªcSs|j|jddddSr¥)Údivr§r¨r@r@rAr©ðrª)rBr1r0rBTréÿÿÿÿz not in pivoted DataFrame)rr)r"rFzNot a valid margins argument)r8r&rdrIrMrXr0r1Zilocr^rr§rrhÚloc) r?rr)r+Z    axis_subsÚerrZnormalizersÚfZtable_indexZ table_columnsZlast_ind_or_colZ column_marginZindex_marginr@r@rArásd
ý
 
 
 
 
 
 
 
 
 
rrrdrcCs|dkrVg}t|D]>\}}t|tr>|jdk    r>| |j¡q| |d|¡qn*t|t|krntdt|tst|}|S)NÚ_z*arrays and names must have the same length)Ú    enumerater8rr^r;rLrkr9)ZarrsrErr[Zarrr@r@rAr1s
rz    list[str]z;tuple[dict[str, str], list[str], dict[str, str], list[str]])rrr.csdd}t| t|¡}||||B|Bfddt|D}fddt|D}fddt|D}fddt|D}||||fS)    a¤
    Given the names of a DataFrame's rows and columns, returns a set of unique row
    and column names and mappers that convert to original names.
 
    A row or column name is replaced if it is duplicate among the rows of the inputs,
    among the columns of the inputs or between the rows and the columns.
 
    Parameters
    ----------
    rownames: list[str]
    colnames: list[str]
 
    Returns
    -------
    Tuple(Dict[str, str], List[str], Dict[str, str], List[str])
 
    rownames_mapper: dict[str, str]
        a dictionary with new row names as keys and original rownames as values
    unique_rownames: list[str]
        a list of rownames with duplicate names replaced by dummy names
    colnames_mapper: dict[str, str]
        a dictionary with new column names as keys and original column names as values
    unique_colnames: list[str]
        a list of column names with duplicate names replaced by dummy names
 
    cstfdd|DS)Ncsh|]}|kr|qSr@r@r©Úseenr@rAÚ    <setcomp>bsz>_build_names_mapper.<locals>.get_duplicates.<locals>.<setcomp>)rnrDr@r²rAÚget_duplicates`sz+_build_names_mapper.<locals>.get_duplicatescs$i|]\}}|krd||qS©Zrow_r@©rr[r^©Z    dup_namesr@rAÚ
<dictcomp>gsz'_build_names_mapper.<locals>.<dictcomp>cs&g|]\}}|krd|n|qSr¶r@r·r¸r@rArjsz'_build_names_mapper.<locals>.<listcomp>cs$i|]\}}|krd||qS©Zcol_r@r·r¸r@rAr¹nscs&g|]\}}|krd|n|qSrºr@r·r¸r@rArqs)rnÚintersectionr±)rrrµZshared_namesrr r¡r¢r@r¸rArBs 
ÿ
ÿ
ÿ
ÿr)
NNNr$NFTr%FT)Nr%N)r%)r%)r%)NNNNFr%TF)r%)r)@Ú
__future__rÚtypingrrrrrÚnumpyrQZpandas._libsrZpandas._typingr    r
rrZpandas.util._decoratorsr rZpandas.core.dtypes.castrZpandas.core.dtypes.commonrrrrrZpandas.core.dtypes.genericrrZpandas.core.commonÚcoreÚcommonrZpandas.core.framerZpandas.core.groupbyrZpandas.core.indexes.apirrrZpandas.core.reshape.concatrZpandas.core.reshape.utilrZpandas.core.seriesrrmr r!r:rYrfrirlr7rrr¤rrrr@r@r@rAÚ<module>s|õ"7÷UÿÿQù,ûEö.ÿP