
    PiD/                    :   d Z ddlmZ ddlmZmZmZ ddlZddlm	Z	 ddl
mZ ddlmZ ddlmZ dd	lmZ dd
lmZ ddlmZmZmZmZ ddlmZmZmZmZ ddlm Z  ddl!m"c m#Z$ ddl%m&Z& erddl'm(Z(m)Z) ddlm*Z* ddl+m,Z, dZ-d)dZ.d Z/d*dZ0d+dZ1	 	 	 d,d-d%Z2d.d(Z3dS )/zH
Table Schema builders

https://specs.frictionlessdata.io/table-schema/
    )annotations)TYPE_CHECKINGAnycastN)option_context)lib)ujson_loads)	timezones)find_stack_level)	_registry)is_bool_dtypeis_integer_dtypeis_numeric_dtypeis_string_dtype)CategoricalDtypeDatetimeTZDtypeExtensionDtypePeriodDtype)	DataFrame)	to_offset)DtypeObjJSONSerializable)Series)
MultiIndexz1.4.0xr   returnstrc                "   t          |           rdS t          |           rdS t          |           rdS t          j        | d          st          | t          t          f          rdS t          j        | d          rdS t          |           rdS d	S )
a  
    Convert a NumPy / pandas type to its corresponding json_table.

    Parameters
    ----------
    x : np.dtype or ExtensionDtype

    Returns
    -------
    str
        the Table Schema data types

    Notes
    -----
    This table shows the relationship between NumPy / pandas dtypes,
    and Table Schema dtypes.

    ==============  =================
    Pandas type     Table Schema type
    ==============  =================
    int64           integer
    float64         number
    bool            boolean
    datetime64[ns]  datetime
    timedelta64[ns] duration
    object          str
    categorical     any
    =============== =================
    integerbooleannumberMdatetimemdurationstringany)	r   r   r   r   is_np_dtype
isinstancer   r   r   )r   s    p/home/jaya/work/projects/VOICE-AGENT/VIET/agent-env/lib/python3.11/site-packages/pandas/io/json/_table_schema.pyas_json_table_typer+   7   s    <  y	q		 y	!		 	x	C	 	  Jq?K2P$Q$Q z	C	 	  z			 xu    c                H   t          j        | j        j         r| j        j        }t	          |          dk    r3| j        j        dk    r#t          j        dt                                 nNt	          |          dk    r;t          d |D                       r"t          j        dt                                 | S | 
                    d          } | j        j        dk    r)t          j        | j        j                  | j        _        n| j        j        pd| j        _        | S )	z?Sets index names to 'index' for regular, or 'level_x' for Multi   indexz-Index name of 'index' is not round-trippable.)
stacklevelc              3  @   K   | ]}|                     d           V  dS level_N
startswith.0r   s     r*   	<genexpr>z$set_default_names.<locals>.<genexpr>n   s.      !F!FQ!,,x"8"8!F!F!F!F!F!Fr,   z<Index names beginning with 'level_' are not round-trippable.F)deep)comall_not_noner/   nameslennamewarningswarnr   r'   copynlevelsfill_missing_names)datanmss     r*   set_default_namesrF   e   s   
)* js88q==TZ_77M?+--     XX\\c!F!F#!F!F!FFF\MN+--    99%9  DzA1$*2BCC
*/4W
Kr,   dict[str, JSONSerializable]c                ,   | j         }| j        d}n| j        }|t          |          d}t          |t                    r(|j        }|j        }dt          |          i|d<   ||d<   nt          |t                    r|j	        j
        |d<   nt          |t                    rSt          j        |j                  rd|d<   nSt          j        |j                  }t          |t                     r||d<   nt          |t"                    r
|j        |d	<   |S )
Nvalues)r>   typeenumconstraintsorderedfreqUTCtzextDtype)dtyper>   r+   r)   r   
categoriesrM   listr   rN   freqstrr   r
   is_utcrP   get_timezoner   r   )arrrR   r>   fieldcatsrM   zones          r*   !convert_pandas_type_to_json_fieldr\   }   s$   IE
xx"5))* *E
 %)** '- &T

3m"i	E;	'	' 
'
*f	E?	+	+ 'EH%% 	#E$KK)%(33D$$$ #"d	E>	*	* '!JjLr,   str | CategoricalDtypec                   | d         }|dk    r|                      dd          S |dk    r|                      dd          S |dk    r|                      dd          S |d	k    r|                      dd
          S |dk    rdS |dk    rg|                      d          rd| d          dS |                      d          r/t          | d                   }t          |          j        }d| dS dS |dk    rKd| v r'd| v r#t	          | d         d         | d                   S d| v rt          j        | d                   S dS t          d|           )a  
    Converts a JSON field descriptor into its corresponding NumPy / pandas type

    Parameters
    ----------
    field
        A JSON field descriptor

    Returns
    -------
    dtype

    Raises
    ------
    ValueError
        If the type of the provided field is unknown or currently unsupported

    Examples
    --------
    >>> convert_json_field_to_pandas_type({"name": "an_int", "type": "integer"})
    'int64'

    >>> convert_json_field_to_pandas_type(
    ...     {
    ...         "name": "a_categorical",
    ...         "type": "any",
    ...         "constraints": {"enum": ["a", "b", "c"]},
    ...         "ordered": True,
    ...     }
    ... )
    CategoricalDtype(categories=['a', 'b', 'c'], ordered=True, categories_dtype=str)

    >>> convert_json_field_to_pandas_type({"name": "a_datetime", "type": "datetime"})
    'datetime64[ns]'

    >>> convert_json_field_to_pandas_type(
    ...     {"name": "a_datetime_with_tz", "type": "datetime", "tz": "US/Central"}
    ... )
    'datetime64[ns, US/Central]'
    rJ   r&   rQ   Nr   int64r!   float64r    boolr%   timedelta64r#   rP   zdatetime64[ns, ]rN   zperiod[zdatetime64[ns]r'   rL   rM   rK   )rS   rM   objectz#Unsupported or invalid field type: )getr   r   _freqstrr   registryfind
ValueError)rY   typoffsetrN   s       r*   !convert_json_field_to_pandas_typerl      s   R -C
hyyT***				yyW---	yyY///				yyV,,,	
		}	
		99T?? 		$3U4[3333YYv 	$uV}--Fv&&/D$T$$$$##	E!!i5&8&8# /7yAQ    5  =z!23338
@3@@
A
AAr,   TrD   DataFrame | Seriesr/   ra   primary_keybool | Noneversionc                   |du rt          |           } i }g }|r| j        j        dk    rpt          d| j                  | _        t	          | j        j        | j        j        d          D ].\  }}t          |          }||d<   |                    |           /n'|                    t          | j                             | j	        dk    r=| 
                                D ]'\  }	}
|                    t          |
                     (n"|                    t          |                      ||d<   |r?| j        j        r3|1| j        j        dk    r| j        j        g|d<   n| j        j        |d<   n|||d<   |r
t          |d	<   |S )
a  
    Create a Table schema from ``data``.

    This method is a utility to generate a JSON-serializable schema
    representation of a pandas Series or DataFrame, compatible with the
    Table Schema specification. It enables structured data to be shared
    and validated in various applications, ensuring consistency and
    interoperability.

    Parameters
    ----------
    data : Series or DataFrame
        The input data for which the table schema is to be created.
    index : bool, default True
        Whether to include ``data.index`` in the schema.
    primary_key : bool or None, default True
        Column names to designate as the primary key.
        The default `None` will set `'primaryKey'` to the index
        level or levels if the index is unique.
    version : bool, default True
        Whether to include a field `pandas_version` with the version
        of pandas that last revised the table schema. This version
        can be different from the installed pandas version.

    Returns
    -------
    dict
        A dictionary representing the Table schema.

    See Also
    --------
    DataFrame.to_json : Convert the object to a JSON string.
    read_json : Convert a JSON string to pandas object.

    Notes
    -----
    See `Table Schema
    <https://pandas.pydata.org/docs/user_guide/io.html#table-schema>`__ for
    conversion types.
    Timedeltas as converted to ISO8601 duration format with
    9 decimal places after the seconds field for nanosecond precision.

    Categoricals are converted to the `any` dtype, and use the `enum` field
    constraint to list the allowed values. The `ordered` attribute is included
    in an `ordered` field.

    Examples
    --------
    >>> from pandas.io.json._table_schema import build_table_schema
    >>> df = pd.DataFrame(
    ...     {'A': [1, 2, 3],
    ...      'B': ['a', 'b', 'c'],
    ...      'C': pd.date_range('2016-01-01', freq='D', periods=3),
    ...      }, index=pd.Index(range(3), name='idx'))
    >>> build_table_schema(df)
    {'fields': [{'name': 'idx', 'type': 'integer'}, {'name': 'A', 'type': 'integer'}, {'name': 'B', 'type': 'string', 'extDtype': 'str'}, {'name': 'C', 'type': 'datetime'}], 'primaryKey': ['idx'], 'pandas_version': '1.4.0'}
    Tr.   r   )strictr>   fieldsN
primaryKeypandas_version)rF   r/   rB   r   ziplevelsr<   r\   appendndimitems	is_uniquer>   TABLE_SCHEMA_VERSION)rD   r/   rn   rp   schemars   levelr>   	new_fieldcolumnss              r*   build_table_schemar      s   J }} &&FF I:!!lDJ77DJ"4:#4dj6FtTTT ) )t=eDD	$(	&!i(((()
 MM;DJGGHHHy1}} 	@ 	@IFAMM;A>>????	@ 	7==>>>F8 +% ++*=:""$(JO#4F<  #':#3F<  		 *| 8#7 Mr,   precise_floatr   c                   t          | |          }d |d         d         D             }t          |d         |          |         }d |d         d         D             }d|                                v rt          d	          t	          d
d          5  |                    |          }ddd           n# 1 swxY w Y   d|d         v r{|                    |d         d                   }t          |j        j	                  dk    r|j        j
        dk    rd|j        _
        n d |j        j	        D             |j        _	        |S )a  
    Builds a DataFrame from a given schema

    Parameters
    ----------
    json :
        A JSON table schema
    precise_float : bool
        Flag controlling precision when decoding string to double values, as
        dictated by ``read_json``

    Returns
    -------
    df : DataFrame

    Raises
    ------
    NotImplementedError
        If the JSON table schema contains either timezone or timedelta data

    Notes
    -----
        Because :func:`DataFrame.to_json` uses the string 'index' to denote a
        name-less :class:`Index`, this function sets the name of the returned
        :class:`DataFrame` to ``None`` when said string is encountered with a
        normal :class:`Index`. For a :class:`MultiIndex`, the same limitation
        applies to any strings beginning with 'level_'. Therefore, an
        :class:`Index` name of 'index'  and :class:`MultiIndex` names starting
        with 'level_' are not supported.

    See Also
    --------
    build_table_schema : Inverse function.
    pandas.read_json
    )r   c                    g | ]
}|d          S r>    r7   rY   s     r*   
<listcomp>z&parse_table_schema.<locals>.<listcomp>w  s    FFF5vFFFr,   r}   rs   rD   )columnsc                :    i | ]}|d          t          |          S r   )rl   r   s     r*   
<dictcomp>z&parse_table_schema.<locals>.<dictcomp>z  s7        	f8??  r,   rb   z<table="orient" can not yet read ISO-formatted Timedelta datazfuture.distinguish_nan_and_naFNrt   r.   r/   c                @    g | ]}|                     d           rdn|S r2   r4   r6   s     r*   r   z&parse_table_schema.<locals>.<listcomp>  s:       :;X..5A  r,   )r	   r   rI   NotImplementedErrorr   astype	set_indexr=   r/   r<   r>   )jsonr   table	col_orderdfdtypess         r*   parse_table_schemar   R  s   H M:::EFFE(OH,EFFFI	5=)	4	4	4Y	?B 8_X.  F ''!J
 
 	
 
7	?	?  YYv               uX&&\\%/,788rx~!##x}'' $ ?Ax~  BHN Is   B66B:=B:)r   r   r   r   )r   rG   )r   r]   )TNT)
rD   rm   r/   ra   rn   ro   rp   ra   r   rG   )r   ra   r   r   )4__doc__
__future__r   typingr   r   r   r?   pandas._configr   pandas._libsr   pandas._libs.jsonr	   pandas._libs.tslibsr
   pandas.util._exceptionsr   pandas.core.dtypes.baser   rg   pandas.core.dtypes.commonr   r   r   r   pandas.core.dtypes.dtypesr   r   r   r   pandasr   pandas.core.commoncorecommonr:   pandas.tseries.frequenciesr   pandas._typingr   r   r   pandas.core.indexes.multir   r|   r+   rF   r\   rl   r   r   r   r,   r*   <module>r      s    # " " " " "         
  ) ) ) ) ) )       ) ) ) ) ) ) ) ) ) ) ) ) 4 4 4 4 4 4 9 9 9 9 9 9                                               0 0 0 0 0 0 5       
 444444  + + + +\  0   @IB IB IB IB\ #	f f f f fR@ @ @ @ @ @r,   