
    .`i2                         d dl mZ d dlmZmZ d dlmZ d dlmZm	Z	 d dl
mZ d dlmZ  G d de          Z G d	 d
e          Z G d de          ZdS )    )Any)	BaseModelField)ChatCompletionLogProbs)SamplingParamsStreamOptions)Logprobrandom_uuidc                   4   e Zd ZU  ed d          Zeed<   ee         ed<   	 dZ	edz  ed<   	 e
ed<   	 dZedz  ed	<   d
Zedz  ed<   dZedz  ed<    edd          Zedz  ed<    edd          Zeed<    edd          Zeeef         dz  ed<   dS )GenerateRequestc                       t                       S Nr
        z/home/jaya/work/projects/VOICE-AGENT/VIET/agent-env/lib/python3.11/site-packages/vllm/entrypoints/serve/disagg/protocol.py<lambda>zGenerateRequest.<lambda>       ;== 2 r   The request_id related to this request. If the caller does not set it, a random_uuid will be generated. This id is used through out the inference process and return in response.default_factorydescription
request_id	token_idsNfeaturessampling_paramsmodelFstreamstream_optionsa/  If specified, the prefix cache will be salted with the provided string to prevent an attacker to guess prompts in multi-user environments. The salt should be random, protected from access by 3rd parties, and long enough to be unpredictable (e.g., 43 characters base64-encoded, corresponding to 256 bit).defaultr   
cache_saltr   zThe priority of the request (lower means earlier handling; default: 0). Any priority other than 0 will raise an error if the served model does not use priority scheduling.priority5KVTransfer parameters used for disaggregated serving.kv_transfer_params)__name__
__module____qualname__r   r   str__annotations__listintr   r   r   r   boolr   r   r"   r#   r%   dictr   r   r   r   r   r      se        e22H  J    Cy.  HcDj0####0E3:FD4K+/NMD(///"U
 
 
Jd
 
 
 
 ED  Hc    16K1 1 1S#X-     r   r   c                   b    e Zd ZU eed<   dZedz  ed<   dZedz  ed<   dZ	e
e         dz  ed<   dS )GenerateResponseChoiceindexNlogprobsstopfinish_reasonr   )r&   r'   r(   r,   r*   r2   r   r4   r)   r   r+   r   r   r   r0   r0   B   s^         JJJ.2H$t+222 &M3:&&&"&ItCy4&&&&&r   r0   c                       e Zd ZU  ed d          Zeed<   ee         ed<   dZ	ee
eef         dz           dz  ed<    edd	          Ze
eef         dz  ed
<   dS )GenerateResponsec                       t                       S r   r
   r   r   r   r   zGenerateResponse.<lambda>L   r   r   r   r   r   choicesNprompt_logprobsr$   r    r%   )r&   r'   r(   r   r   r)   r*   r+   r0   r9   r.   r,   r	   r%   r   r   r   r   r6   r6   J   s         e22H  J    ())))>BOT$sG|,t34t;BBB05K1 1 1S#X-     r   r6   N)typingr   pydanticr   r   0vllm.entrypoints.openai.chat_completion.protocolr   'vllm.entrypoints.openai.engine.protocolr   r   vllm.logprobsr	   
vllm.utilsr   r   r0   r6   r   r   r   <module>r@      s         % % % % % % % % S S S S S S        " ! ! ! ! ! " " " " " ". . . . .i . . .b' ' ' ' 'Y ' ' '    y     r   