fume-manage-python.git

U  
¬ý°dÿDã@sþddlmZddlmZmZddlZddlZddlmZm    Z    m
Z
ddlZddl mZddlmZmZddlZddlmZddd    d
dZd)dddddddZddddddddZddddddZd*ddddddZd+dd!d"d#d#d$ddd%d&    d'd(ZdS),é)Úannotations)ÚabcÚdefaultdictN)ÚAnyÚDefaultDictÚIterable©Úconvert_json_to_lines)ÚIgnoreRaiseÚScalar)Ú    DataFrameÚstr)ÚsÚreturncCs0|ddks|ddkr|S|dd}t|S)zJ
    Helper function that converts JSON lists to line delimited JSON.
    rú[éÿÿÿÿú]ér)r©rúPd:\z\workplace\vscode\pyvenv\venv\Lib\site-packages\pandas/io/json/_normalize.pyÚconvert_to_line_delimitssrÚÚ.Úintz
int | None)ÚprefixÚsepÚlevelÚ    max_levelc
Csâd}t|tr|g}d}g}|D]°}t |¡}| ¡D]\}    }
t|    tsPt|    }    |dkr^|    }n|||    }t|
tr|dk    r ||kr |dkr6| |    ¡}
|
||<q6| |    ¡}
| t|
|||d|¡q6|     |¡q |rÞ|dS|S)a
    A simplified json_normalize
 
    Converts a nested dict into a flat dict ("record"), unlike json_normalize,
    it does not attempt to extract a subset of the data.
 
    Parameters
    ----------
    ds : dict or list of dicts
    prefix: the prefix, optional, default: ""
    sep : str, default '.'
        Nested records will generate names separated by sep,
        e.g., for sep='.', { 'foo' : { 'bar' : 0 } } -> foo.bar
    level: int, optional, default: 0
        The number of levels in the json string.
 
    max_level: int, optional, default: None
        The max depth to normalize.
 
    Returns
    -------
    d - dict or list of dicts, matching `ds`
 
    Examples
    --------
    >>> nested_to_record(
    ...     dict(flat1=1, dict1=dict(c=1, d=2), nested=dict(e=dict(c=1, d=2), d=2))
    ... )
    {'flat1': 1, 'dict1.c': 1, 'dict1.d': 2, 'nested.e.c': 1, 'nested.e.d': 2, 'nested.d': 2}
    FTrNr)
Ú
isinstanceÚdictÚcopyÚdeepcopyÚitemsr ÚpopÚupdateÚnested_to_recordÚappend)ÚdsrrrrZ    singletonZnew_dsÚdZnew_dÚkÚvZnewkeyrrrr%*s8,
 
 
 
ÿÿ
 
r%rúdict[str, Any])ÚdataÚ
key_stringÚnormalized_dictÚ    separatorrcCszt|trn| ¡D]X\}}|||}|sZtjdkrPddlm}|||}n
| |¡}t||||dqn|||<|S)a3
    Main recursive function
    Designed for the most basic use case of pd.json_normalize(data)
    intended as a performance improvement, see #15621
 
    Parameters
    ----------
    data : Any
        Type dependent on types contained within nested Json
    key_string : str
        New key (with separator(s) in) for data
    normalized_dict : dict
        The new normalized/flattened Json dict
    separator : str, default '.'
        Nested records will generate names separated by sep,
        e.g., for sep='.', { 'foo' : { 'bar' : 0 } } -> foo.bar
    )éé    r)Úremoveprefix©r,r-r.r/)rrr"ÚsysÚversion_infoZpandas.util._str_methodsr2Ú_normalise_json)r,r-r.r/ÚkeyÚvalueZnew_keyr2rrrr6{s 
 
 
ü
r6)r,r/rcCs8dd| ¡D}tdd| ¡Ddi|d}||S)aw
    Order the top level keys and then recursively go to depth
 
    Parameters
    ----------
    data : dict or list of dicts
    separator : str, default '.'
        Nested records will generate names separated by sep,
        e.g., for sep='.', { 'foo' : { 'bar' : 0 } } -> foo.bar
 
    Returns
    -------
    dict or list of dicts, matching `normalised_json_object`
    cSs i|]\}}t|ts||qSr©rr©Ú.0r)r*rrrÚ
<dictcomp>¸s
z+_normalise_json_ordered.<locals>.<dictcomp>cSs i|]\}}t|tr||qSrr9r:rrrr<ºs
rr3)r"r6)r,r/Z    top_dict_Znested_dict_rrrÚ_normalise_json_ordered©sür=zdict | list[dict]zdict | list[dict] | Any)r'rrcs@i}t|trt|d}n t|tr<fdd|D}|S|S)a
    A optimized basic json_normalize
 
    Converts a nested dict into a flat dict ("record"), unlike
    json_normalize and nested_to_record it doesn't do anything clever.
    But for the most basic use cases it enhances performance.
    E.g. pd.json_normalize(data)
 
    Parameters
    ----------
    ds : dict or list of dicts
    sep : str, default '.'
        Nested records will generate names separated by sep,
        e.g., for sep='.', { 'foo' : { 'bar' : 0 } } -> foo.bar
 
    Returns
    -------
    frame : DataFrame
    d - dict or list of dicts, matching `normalised_json_object`
 
    Examples
    --------
    >>> _simple_json_normalize(
    ...     {
    ...         "flat1": 1,
    ...         "dict1": {"c": 1, "d": 2},
    ...         "nested": {"e": {"c": 1, "d": 2}, "d": 2},
    ...     }
    ... )
    {'flat1': 1, 'dict1.c': 1, 'dict1.d': 2, 'nested.e.c': 1, 'nested.e.d': 2, 'nested.d': 2}
 
    )r,r/csg|]}t|dqS)©r)Ú_simple_json_normalize)r;Úrowr>rrÚ
<listcomp>òsz*_simple_json_normalize.<locals>.<listcomp>)rrr=Úlist)r'rZnormalised_json_objectZnormalised_json_listrr>rr?Âs+
 
r?Úraisezstr | list | Nonez"str | list[str | list[str]] | Nonez
str | Noner
r)    r,Úrecord_pathÚmetaÚmeta_prefixÚ record_prefixÚerrorsrrrcsþd"dddddfdd ddd    d
fddt|trD|sDtSt|trV|g}n$t|tjrvt|tsvt|}nt|d kr²|d kr²|d kr²    d kr²d kr²tt|dS|d krât    dd|DrÚt
|d}t|St|tsò|g}|d krg}nt|ts|g}dd|Dg
gttfddDd#ddd
f
dd ||iddt
}    d k    r¢|j    fddd}  ¡D]N\}    }
|d k    rÄ||    }    |    |krÞtd|    d tj|
td! ¡||    <qª|S)$a´
    Normalize semi-structured JSON data into a flat table.
 
    Parameters
    ----------
    data : dict or list of dicts
        Unserialized JSON objects.
    record_path : str or list of str, default None
        Path in each object to list of records. If not passed, data will be
        assumed to be an array of records.
    meta : list of paths (str or list of str), default None
        Fields to use as metadata for each record in resulting table.
    meta_prefix : str, default None
        If True, prefix records with dotted (?) path, e.g. foo.bar.field if
        meta is ['foo', 'bar'].
    record_prefix : str, default None
        If True, prefix records with dotted (?) path, e.g. foo.bar.field if
        path to records is ['foo', 'bar'].
    errors : {'raise', 'ignore'}, default 'raise'
        Configures error handling.
 
        * 'ignore' : will ignore KeyError if keys listed in meta are not
          always present.
        * 'raise' : will raise KeyError if keys listed in meta are not
          always present.
    sep : str, default '.'
        Nested records will generate names separated by sep.
        e.g., for sep='.', {'foo': {'bar': 0}} -> foo.bar.
    max_level : int, default None
        Max number of levels(depth of dict) to normalize.
        if None, normalizes all levels.
 
    Returns
    -------
    frame : DataFrame
    Normalize semi-structured JSON data into a flat table.
 
    Examples
    --------
    >>> data = [
    ...     {"id": 1, "name": {"first": "Coleen", "last": "Volk"}},
    ...     {"name": {"given": "Mark", "family": "Regner"}},
    ...     {"id": 2, "name": "Faye Raker"},
    ... ]
    >>> pd.json_normalize(data)
        id name.first name.last name.given name.family        name
    0  1.0     Coleen      Volk        NaN         NaN         NaN
    1  NaN        NaN       NaN       Mark      Regner         NaN
    2  2.0        NaN       NaN        NaN         NaN  Faye Raker
 
    >>> data = [
    ...     {
    ...         "id": 1,
    ...         "name": "Cole Volk",
    ...         "fitness": {"height": 130, "weight": 60},
    ...     },
    ...     {"name": "Mark Reg", "fitness": {"height": 130, "weight": 60}},
    ...     {
    ...         "id": 2,
    ...         "name": "Faye Raker",
    ...         "fitness": {"height": 130, "weight": 60},
    ...     },
    ... ]
    >>> pd.json_normalize(data, max_level=0)
        id        name                        fitness
    0  1.0   Cole Volk  {'height': 130, 'weight': 60}
    1  NaN    Mark Reg  {'height': 130, 'weight': 60}
    2  2.0  Faye Raker  {'height': 130, 'weight': 60}
 
    Normalizes nested data up to level 1.
 
    >>> data = [
    ...     {
    ...         "id": 1,
    ...         "name": "Cole Volk",
    ...         "fitness": {"height": 130, "weight": 60},
    ...     },
    ...     {"name": "Mark Reg", "fitness": {"height": 130, "weight": 60}},
    ...     {
    ...         "id": 2,
    ...         "name": "Faye Raker",
    ...         "fitness": {"height": 130, "weight": 60},
    ...     },
    ... ]
    >>> pd.json_normalize(data, max_level=1)
        id        name  fitness.height  fitness.weight
    0  1.0   Cole Volk             130              60
    1  NaN    Mark Reg             130              60
    2  2.0  Faye Raker             130              60
 
    >>> data = [
    ...     {
    ...         "state": "Florida",
    ...         "shortname": "FL",
    ...         "info": {"governor": "Rick Scott"},
    ...         "counties": [
    ...             {"name": "Dade", "population": 12345},
    ...             {"name": "Broward", "population": 40000},
    ...             {"name": "Palm Beach", "population": 60000},
    ...         ],
    ...     },
    ...     {
    ...         "state": "Ohio",
    ...         "shortname": "OH",
    ...         "info": {"governor": "John Kasich"},
    ...         "counties": [
    ...             {"name": "Summit", "population": 1234},
    ...             {"name": "Cuyahoga", "population": 1337},
    ...         ],
    ...     },
    ... ]
    >>> result = pd.json_normalize(
    ...     data, "counties", ["state", "shortname", ["info", "governor"]]
    ... )
    >>> result
             name  population    state shortname info.governor
    0        Dade       12345   Florida    FL    Rick Scott
    1     Broward       40000   Florida    FL    Rick Scott
    2  Palm Beach       60000   Florida    FL    Rick Scott
    3      Summit        1234   Ohio       OH    John Kasich
    4    Cuyahoga        1337   Ohio       OH    John Kasich
 
    >>> data = {"A": [1, 2]}
    >>> pd.json_normalize(data, "A", record_prefix="Prefix.")
        Prefix.0
    0          1
    1          2
 
    Returns normalized data with columns prefixed with the given string.
    Fr+z
list | strÚboolzScalar | Iterable)ÚjsÚspecÚextract_recordrc
sª|}z:t|tr4|D]}|dkr(t|||}qn||}Wnftk
r¤}zH|rftd|d|dkr|tjWY¢Std|d|d|W5d}~XYnX|S)zInternal function to pull fieldNzKey zS not found. If specifying a record_path, all elements of data should have the path.Úignorez) not found. To replace missing values of z% with np.nan, pass in errors='ignore')rrBÚKeyErrorÚnpÚnan)rJrKrLÚresultÚfieldÚe)rHrrÚ_pull_fields.
 
ÿýÿýz#json_normalize.<locals>._pull_fieldrB)rJrKrcsF||dd}t|tsBt |¡r(g}nt|d|d|d|S)z¶
        Internal function to pull field for records, and similar to
        _pull_field, but require to return list. And will raise error
        if has non iterable value.
        T)rLz has non list value z
 for path z. Must be list or null.)rrBÚpdZisnullÚ    TypeError)rJrKrQ)rTrrÚ _pull_records¡s
 
ÿz%json_normalize.<locals>._pull_recordsNr>css |]}dd| ¡DVqdS)cSsg|]}t|tqSrr9)r;ÚxrrrrAÎsz,json_normalize.<locals>.<genexpr>.<listcomp>N)Úvalues)r;ÚyrrrÚ    <genexpr>Îsz!json_normalize.<locals>.<genexpr>©rrcSs g|]}t|tr|n|gqSr)rrB)r;ÚmrrrrAàsz"json_normalize.<locals>.<listcomp>csg|]} |¡qSr)Újoin)r;Úvalr>rrrAçsrrÚNone)rrc    st|tr|g}t|dkr|D]^}tD]*\}}|dt|kr.||d||<q.||d|dd||ddq n|D]}||d}    fdd|D} t|¡tD]B\}}|dt|kræ||}n|||d}| |¡qÄ |¡qdS)Nrrr©rcs(g|] }t|tr t|dn|qS)r\)rrr%)r;Úr)rrrrrAösþÿz>json_normalize.<locals>._recursive_extract.<locals>.<listcomp>)rrÚlenÚzipr&Úextend)    r,ÚpathZ    seen_metarÚobjr_r7ZrecsZmeta_val)
Ú_metarTrWÚ_recursive_extractÚlengthsrÚ    meta_keysÚ    meta_valsÚrecordsrrrriés(
(ü
z*json_normalize.<locals>._recursive_extractracs|S)Nr)rX)rGrrÚ<lambda>óz json_normalize.<locals>.<lambda>)ÚcolumnszConflicting metadata name z, need distinguishing prefix )Zdtype)F)r)rrBrrrrr ÚNotImplementedErrorr?Úanyr%rÚrenamer"Ú
ValueErrorrOÚarrayÚobjectÚrepeat)r,rDrErFrGrHrrrQr)r*r)rhrTrWrirHrjrrkrlrGrmrrÚjson_normalize÷sfÿ
 
ÿþýüû
 
(
 
 
 
ÿrx)rrrN)r)NNNNrCrN)Ú
__future__rÚcollectionsrrr r4ÚtypingrrrÚnumpyrOZpandas._libs.writersr    Zpandas._typingr
rZpandasrUrrr%r6r=r?rxrrrrÚ<module>s6ûQ.þ7ø