from __future__ import annotations

from typing import Union, Iterable, Optional
from typing_extensions import Literal

import httpx

from ... import _legacy_response
from ..._types import Body, Omit, Query, Headers, NotGiven, omit, not_given
from ..._utils import maybe_transform, async_maybe_transform
from ..._compat import cached_property
from ..._resource import SyncAPIResource, AsyncAPIResource
from ..._response import to_streamed_response_wrapper, async_to_streamed_response_wrapper
from ...pagination import SyncCursorPage, AsyncCursorPage
from ...types.beta import assistant_list_params, assistant_create_params, assistant_update_params
from ..._base_client import AsyncPaginator, make_request_options
from ...types.beta.assistant import Assistant
from ...types.shared.chat_model import ChatModel
from ...types.beta.assistant_deleted import AssistantDeleted
from ...types.shared_params.metadata import Metadata
from ...types.shared.reasoning_effort import ReasoningEffort
from ...types.beta.assistant_tool_param import AssistantToolParam
from ...types.beta.assistant_response_format_option_param import AssistantResponseFormatOptionParam

__all__ = ["Assistants", "AsyncAssistants"]


class Assistants(SyncAPIResource):
    """Build Assistants that can call models and use tools."""

    @cached_property
    def with_raw_response(self) -> AssistantsWithRawResponse:
        """
        This property can be used as a prefix for any HTTP method call to return
        the raw response object instead of the parsed content.

        For more information, see https://www.github.com/openai/openai-python#accessing-raw-response-data-eg-headers
        """
        return AssistantsWithRawResponse(self)

    @cached_property
    def with_streaming_response(self) -> AssistantsWithStreamingResponse:
        """
        An alternative to `.with_raw_response` that doesn't eagerly read the response body.

        For more information, see https://www.github.com/openai/openai-python#with_streaming_response
        """
        return AssistantsWithStreamingResponse(self)

    def create(
        self,
        *,
        model: Union[str, ChatModel],
        description: Optional[str] | Omit = omit,
        instructions: Optional[str] | Omit = omit,
        metadata: Optional[Metadata] | Omit = omit,
        name: Optional[str] | Omit = omit,
        reasoning_effort: Optional[ReasoningEffort] | Omit = omit,
        response_format: Optional[AssistantResponseFormatOptionParam] | Omit = omit,
        temperature: Optional[float] | Omit = omit,
        tool_resources: Optional[assistant_create_params.ToolResources] | Omit = omit,
        tools: Iterable[AssistantToolParam] | Omit = omit,
        top_p: Optional[float] | Omit = omit,
        # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
        # The extra values given here take precedence over values defined on the client or passed to this method.
        extra_headers: Headers | None = None,
        extra_query: Query | None = None,
        extra_body: Body | None = None,
        timeout: float | httpx.Timeout | None | NotGiven = not_given,
    ) -> Assistant:
        """
        Create an assistant with a model and instructions.

        Args:
          model: ID of the model to use. You can use the
              [List models](https://platform.openai.com/docs/api-reference/models/list) API to
              see all of your available models, or see our
              [Model overview](https://platform.openai.com/docs/models) for descriptions of
              them.

          description: The description of the assistant. The maximum length is 512 characters.

          instructions: The system instructions that the assistant uses. The maximum length is 256,000
              characters.

          metadata: Set of 16 key-value pairs that can be attached to an object. This can be useful
              for storing additional information about the object in a structured format, and
              querying for objects via API or the dashboard.

              Keys are strings with a maximum length of 64 characters. Values are strings with
              a maximum length of 512 characters.

          name: The name of the assistant. The maximum length is 256 characters.

          reasoning_effort: Constrains effort on reasoning for
              [reasoning models](https://platform.openai.com/docs/guides/reasoning). Currently
              supported values are `none`, `minimal`, `low`, `medium`, `high`, and `xhigh`.
              Reducing reasoning effort can result in faster responses and fewer tokens used
              on reasoning in a response.

              - `gpt-5.1` defaults to `none`, which does not perform reasoning. The supported
                reasoning values for `gpt-5.1` are `none`, `low`, `medium`, and `high`. Tool
                calls are supported for all reasoning values in gpt-5.1.
              - All models before `gpt-5.1` default to `medium` reasoning effort, and do not
                support `none`.
              - The `gpt-5-pro` model defaults to (and only supports) `high` reasoning effort.
              - `xhigh` is supported for all models after `gpt-5.1-codex-max`.

          response_format: Specifies the format that the model must output. Compatible with
              [GPT-4o](https://platform.openai.com/docs/models#gpt-4o),
              [GPT-4 Turbo](https://platform.openai.com/docs/models#gpt-4-turbo-and-gpt-4),
              and all GPT-3.5 Turbo models since `gpt-3.5-turbo-1106`.

              Setting to `{ "type": "json_schema", "json_schema": {...} }` enables Structured
              Outputs which ensures the model will match your supplied JSON schema. Learn more
              in the
              [Structured Outputs guide](https://platform.openai.com/docs/guides/structured-outputs).

              Setting to `{ "type": "json_object" }` enables JSON mode, which ensures the
              message the model generates is valid JSON.

              **Important:** when using JSON mode, you **must** also instruct the model to
              produce JSON yourself via a system or user message. Without this, the model may
              generate an unending stream of whitespace until the generation reaches the token
              limit, resulting in a long-running and seemingly "stuck" request. Also note that
              the message content may be partially cut off if `finish_reason="length"`, which
              indicates the generation exceeded `max_tokens` or the conversation exceeded the
              max context length.

          temperature: What sampling temperature to use, between 0 and 2. Higher values like 0.8 will
              make the output more random, while lower values like 0.2 will make it more
              focused and deterministic.

          tool_resources: A set of resources that are used by the assistant's tools. The resources are
              specific to the type of tool. For example, the `code_interpreter` tool requires
              a list of file IDs, while the `file_search` tool requires a list of vector store
              IDs.

          tools: A list of tool enabled on the assistant. There can be a maximum of 128 tools per
              assistant. Tools can be of types `code_interpreter`, `file_search`, or
              `function`.

          top_p: An alternative to sampling with temperature, called nucleus sampling, where the
              model considers the results of the tokens with top_p probability mass. So 0.1
              means only the tokens comprising the top 10% probability mass are considered.

              We generally recommend altering this or temperature but not both.

          extra_headers: Send extra headers

          extra_query: Add additional query parameters to the request

          extra_body: Add additional JSON properties to the request

          timeout: Override the client-level default timeout for this request, in seconds
        """
        extra_headers = {"OpenAI-Beta": "assistants=v2", **(extra_headers or {})}
        return self._post(
            "/assistants",
            body=maybe_transform(
                {
                    "model": model,
                    "description": description,
                    "instructions": instructions,
                    "metadata": metadata,
                    "name": name,
                    "reasoning_effort": reasoning_effort,
                    "response_format": response_format,
                    "temperature": temperature,
                    "tool_resources": tool_resources,
                    "tools": tools,
                    "top_p": top_p,
                },
                assistant_create_params.AssistantCreateParams,
            ),
            options=make_request_options(
                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
            ),
            cast_to=Assistant,
        )

    def retrieve(
        self,
        assistant_id: str,
        *,
        extra_headers: Headers | None = None,
        extra_query: Query | None = None,
        extra_body: Body | None = None,
        timeout: float | httpx.Timeout | None | NotGiven = not_given,
    ) -> Assistant:
        """
        Retrieves an assistant.

        Args:
          extra_headers: Send extra headers

          extra_query: Add additional query parameters to the request

          extra_body: Add additional JSON properties to the request

          timeout: Override the client-level default timeout for this request, in seconds
        """
        if not assistant_id:
            raise ValueError(f"Expected a non-empty value for `assistant_id` but received {assistant_id!r}")
        extra_headers = {"OpenAI-Beta": "assistants=v2", **(extra_headers or {})}
        return self._get(
            f"/assistants/{assistant_id}",
            options=make_request_options(
                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
            ),
            cast_to=Assistant,
        )

    def update(
        self,
        assistant_id: str,
        *,
        description: Optional[str] | Omit = omit,
        instructions: Optional[str] | Omit = omit,
        metadata: Optional[Metadata] | Omit = omit,
        model: Union[
            str,
            Literal[
                "gpt-5", "gpt-5-mini", "gpt-5-nano", "gpt-5-2025-08-07", "gpt-5-mini-2025-08-07",
                "gpt-5-nano-2025-08-07", "gpt-4.1", "gpt-4.1-mini", "gpt-4.1-nano", "gpt-4.1-2025-04-14",
                "gpt-4.1-mini-2025-04-14", "gpt-4.1-nano-2025-04-14", "o3-mini", "o3-mini-2025-01-31", "o1",
                "o1-2024-12-17", "gpt-4o", "gpt-4o-2024-11-20", "gpt-4o-2024-08-06", "gpt-4o-2024-05-13",
                "gpt-4o-mini", "gpt-4o-mini-2024-07-18", "gpt-4.5-preview", "gpt-4.5-preview-2025-02-27",
                "gpt-4-turbo", "gpt-4-turbo-2024-04-09", "gpt-4-0125-preview", "gpt-4-turbo-preview",
                "gpt-4-1106-preview", "gpt-4-vision-preview", "gpt-4", "gpt-4-0314", "gpt-4-0613",
                "gpt-4-32k", "gpt-4-32k-0314", "gpt-4-32k-0613", "gpt-3.5-turbo", "gpt-3.5-turbo-16k",
                "gpt-3.5-turbo-0613", "gpt-3.5-turbo-1106", "gpt-3.5-turbo-0125", "gpt-3.5-turbo-16k-0613",
            ],
        ]
        | Omit = omit,
        name: Optional[str] | Omit = omit,
        reasoning_effort: Optional[ReasoningEffort] | Omit = omit,
        response_format: Optional[AssistantResponseFormatOptionParam] | Omit = omit,
        temperature: Optional[float] | Omit = omit,
        tool_resources: Optional[assistant_update_params.ToolResources] | Omit = omit,
        tools: Iterable[AssistantToolParam] | Omit = omit,
        top_p: Optional[float] | Omit = omit,
        # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
        # The extra values given here take precedence over values defined on the client or passed to this method.
        extra_headers: Headers | None = None,
        extra_query: Query | None = None,
        extra_body: Body | None = None,
        timeout: float | httpx.Timeout | None | NotGiven = not_given,
    ) -> Assistant:
        """Modifies an assistant.

        Args:
          description: The description of the assistant. The maximum length is 512
              characters.

          instructions: The system instructions that the assistant uses. The maximum length is 256,000
              characters.

          metadata: Set of 16 key-value pairs that can be attached to an object. This can be useful
              for storing additional information about the object in a structured format, and
              querying for objects via API or the dashboard.

              Keys are strings with a maximum length of 64 characters. Values are strings with
              a maximum length of 512 characters.

          model: ID of the model to use. You can use the
              [List models](https://platform.openai.com/docs/api-reference/models/list) API to
              see all of your available models, or see our
              [Model overview](https://platform.openai.com/docs/models) for descriptions of
              them.

          name: The name of the assistant. The maximum length is 256 characters.

          reasoning_effort: Constrains effort on reasoning for
              [reasoning models](https://platform.openai.com/docs/guides/reasoning). Currently
              supported values are `none`, `minimal`, `low`, `medium`, `high`, and `xhigh`.
              Reducing reasoning effort can result in faster responses and fewer tokens used
              on reasoning in a response.

              - `gpt-5.1` defaults to `none`, which does not perform reasoning. The supported
                reasoning values for `gpt-5.1` are `none`, `low`, `medium`, and `high`. Tool
                calls are supported for all reasoning values in gpt-5.1.
              - All models before `gpt-5.1` default to `medium` reasoning effort, and do not
                support `none`.
              - The `gpt-5-pro` model defaults to (and only supports) `high` reasoning effort.
              - `xhigh` is supported for all models after `gpt-5.1-codex-max`.

          response_format: Specifies the format that the model must output. Compatible with
              [GPT-4o](https://platform.openai.com/docs/models#gpt-4o),
              [GPT-4 Turbo](https://platform.openai.com/docs/models#gpt-4-turbo-and-gpt-4),
              and all GPT-3.5 Turbo models since `gpt-3.5-turbo-1106`.

              Setting to `{ "type": "json_schema", "json_schema": {...} }` enables Structured
              Outputs which ensures the model will match your supplied JSON schema. Learn more
              in the
              [Structured Outputs guide](https://platform.openai.com/docs/guides/structured-outputs).

              Setting to `{ "type": "json_object" }` enables JSON mode, which ensures the
              message the model generates is valid JSON.

              **Important:** when using JSON mode, you **must** also instruct the model to
              produce JSON yourself via a system or user message. Without this, the model may
              generate an unending stream of whitespace until the generation reaches the token
              limit, resulting in a long-running and seemingly "stuck" request. Also note that
              the message content may be partially cut off if `finish_reason="length"`, which
              indicates the generation exceeded `max_tokens` or the conversation exceeded the
              max context length.

          temperature: What sampling temperature to use, between 0 and 2. Higher values like 0.8 will
              make the output more random, while lower values like 0.2 will make it more
              focused and deterministic.

          tool_resources: A set of resources that are used by the assistant's tools. The resources are
              specific to the type of tool. For example, the `code_interpreter` tool requires
              a list of file IDs, while the `file_search` tool requires a list of vector store
              IDs.

          tools: A list of tool enabled on the assistant. There can be a maximum of 128 tools per
              assistant. Tools can be of types `code_interpreter`, `file_search`, or
              `function`.

          top_p: An alternative to sampling with temperature, called nucleus sampling, where the
              model considers the results of the tokens with top_p probability mass. So 0.1
              means only the tokens comprising the top 10% probability mass are considered.

              We generally recommend altering this or temperature but not both.

          extra_headers: Send extra headers

          extra_query: Add additional query parameters to the request

          extra_body: Add additional JSON properties to the request

          timeout: Override the client-level default timeout for this request, in seconds
        """
        if not assistant_id:
            raise ValueError(f"Expected a non-empty value for `assistant_id` but received {assistant_id!r}")
        extra_headers = {"OpenAI-Beta": "assistants=v2", **(extra_headers or {})}
        return self._post(
            f"/assistants/{assistant_id}",
            body=maybe_transform(
                {
                    "description": description,
                    "instructions": instructions,
                    "metadata": metadata,
                    "model": model,
                    "name": name,
                    "reasoning_effort": reasoning_effort,
                    "response_format": response_format,
                    "temperature": temperature,
                    "tool_resources": tool_resources,
                    "tools": tools,
                    "top_p": top_p,
                },
                assistant_update_params.AssistantUpdateParams,
            ),
            options=make_request_options(
                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
            ),
            cast_to=Assistant,
        )

    def list(
        self,
        *,
        after: str | Omit = omit,
        before: str | Omit = omit,
        limit: int | Omit = omit,
        order: Literal["asc", "desc"] | Omit = omit,
        extra_headers: Headers | None = None,
        extra_query: Query | None = None,
        extra_body: Body | None = None,
        timeout: float | httpx.Timeout | None | NotGiven = not_given,
    ) -> SyncCursorPage[Assistant]:
        """Returns a list of assistants.

        Args:
          after: A cursor for use in pagination. `after` is an object ID that defines your place
              in the list. For instance, if you make a list request and receive 100 objects,
              ending with obj_foo, your subsequent call can include after=obj_foo in order to
              fetch the next page of the list.

          before: A cursor for use in pagination. `before` is an object ID that defines your place
              in the list. For instance, if you make a list request and receive 100 objects,
              starting with obj_foo, your subsequent call can include before=obj_foo in order
              to fetch the previous page of the list.

          limit: A limit on the number of objects to be returned. Limit can range between 1 and
              100, and the default is 20.

          order: Sort order by the `created_at` timestamp of the objects. `asc` for ascending
              order and `desc` for descending order.

          extra_headers: Send extra headers

          extra_query: Add additional query parameters to the request

          extra_body: Add additional JSON properties to the request

          timeout: Override the client-level default timeout for this request, in seconds
        """
        extra_headers = {"OpenAI-Beta": "assistants=v2", **(extra_headers or {})}
        return self._get_api_list(
            "/assistants",
            page=SyncCursorPage[Assistant],
            options=make_request_options(
                extra_headers=extra_headers,
                extra_query=extra_query,
                extra_body=extra_body,
                timeout=timeout,
                query=maybe_transform(
                    {
                        "after": after,
                        "before": before,
                        "limit": limit,
                        "order": order,
                    },
                    assistant_list_params.AssistantListParams,
                ),
            ),
            model=Assistant,
        )

    def delete(
        self,
        assistant_id: str,
        *,
        extra_headers: Headers | None = None,
        extra_query: Query | None = None,
        extra_body: Body | None = None,
        timeout: float | httpx.Timeout | None | NotGiven = not_given,
    ) -> AssistantDeleted:
        """
        Delete an assistant.

        Args:
          extra_headers: Send extra headers

          extra_query: Add additional query parameters to the request

          extra_body: Add additional JSON properties to the request

          timeout: Override the client-level default timeout for this request, in seconds
        """
        if not assistant_id:
            raise ValueError(f"Expected a non-empty value for `assistant_id` but received {assistant_id!r}")
        extra_headers = {"OpenAI-Beta": "assistants=v2", **(extra_headers or {})}
        return self._delete(
            f"/assistants/{assistant_id}",
            options=make_request_options(
                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
            ),
            cast_to=AssistantDeleted,
        )


class AsyncAssistants(AsyncAPIResource):
    """Build Assistants that can call models and use tools."""

    @cached_property
    def with_raw_response(self) -> AsyncAssistantsWithRawResponse:
        """
        This property can be used as a prefix for any HTTP method call to return
        the raw response object instead of the parsed content.

        For more information, see https://www.github.com/openai/openai-python#accessing-raw-response-data-eg-headers
        """
        return AsyncAssistantsWithRawResponse(self)

    @cached_property
    def with_streaming_response(self) -> AsyncAssistantsWithStreamingResponse:
        """
        An alternative to `.with_raw_response` that doesn't eagerly read the response body.

        For more information, see https://www.github.com/openai/openai-python#with_streaming_response
        """
        return AsyncAssistantsWithStreamingResponse(self)

    async def create(
        self,
        *,
        model: Union[str, ChatModel],
        description: Optional[str] | Omit = omit,
        instructions: Optional[str] | Omit = omit,
        metadata: Optional[Metadata] | Omit = omit,
        name: Optional[str] | Omit = omit,
        reasoning_effort: Optional[ReasoningEffort] | Omit = omit,
        response_format: Optional[AssistantResponseFormatOptionParam] | Omit = omit,
        temperature: Optional[float] | Omit = omit,
        tool_resources: Optional[assistant_create_params.ToolResources] | Omit = omit,
        tools: Iterable[AssistantToolParam] | Omit = omit,
        top_p: Optional[float] | Omit = omit,
        # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
        # The extra values given here take precedence over values defined on the client or passed to this method.
        extra_headers: Headers | None = None,
        extra_query: Query | None = None,
        extra_body: Body | None = None,
        timeout: float | httpx.Timeout | None | NotGiven = not_given,
    ) -> Assistant:
        """Create an assistant with a model and instructions.

        Arguments are documented on `Assistants.create`; this async variant behaves
        identically apart from awaiting the request.
        """
        extra_headers = {"OpenAI-Beta": "assistants=v2", **(extra_headers or {})}
        return await self._post(
            "/assistants",
            body=await async_maybe_transform(
                {
                    "model": model,
                    "description": description,
                    "instructions": instructions,
                    "metadata": metadata,
                    "name": name,
                    "reasoning_effort": reasoning_effort,
                    "response_format": response_format,
                    "temperature": temperature,
                    "tool_resources": tool_resources,
                    "tools": tools,
                    "top_p": top_p,
                },
                assistant_create_params.AssistantCreateParams,
            ),
            options=make_request_options(
                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
            ),
            cast_to=Assistant,
        )

    async def retrieve(
        self,
        assistant_id: str,
        *,
        extra_headers: Headers | None = None,
        extra_query: Query | None = None,
        extra_body: Body | None = None,
        timeout: float | httpx.Timeout | None | NotGiven = not_given,
    ) -> Assistant:
        """Retrieves an assistant.

        Arguments are documented on `Assistants.retrieve`.
        """
        if not assistant_id:
            raise ValueError(f"Expected a non-empty value for `assistant_id` but received {assistant_id!r}")
        extra_headers = {"OpenAI-Beta": "assistants=v2", **(extra_headers or {})}
        return await self._get(
            f"/assistants/{assistant_id}",
            options=make_request_options(
                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
            ),
            cast_to=Assistant,
        )

    async def update(
        self,
        assistant_id: str,
        *,
        description: Optional[str] | Omit = omit,
        instructions: Optional[str] | Omit = omit,
        metadata: Optional[Metadata] | Omit = omit,
        model: Union[
            str,
            Literal[
                "gpt-5", "gpt-5-mini", "gpt-5-nano", "gpt-5-2025-08-07", "gpt-5-mini-2025-08-07",
                "gpt-5-nano-2025-08-07", "gpt-4.1", "gpt-4.1-mini", "gpt-4.1-nano", "gpt-4.1-2025-04-14",
                "gpt-4.1-mini-2025-04-14", "gpt-4.1-nano-2025-04-14", "o3-mini", "o3-mini-2025-01-31", "o1",
                "o1-2024-12-17", "gpt-4o", "gpt-4o-2024-11-20", "gpt-4o-2024-08-06", "gpt-4o-2024-05-13",
                "gpt-4o-mini", "gpt-4o-mini-2024-07-18", "gpt-4.5-preview", "gpt-4.5-preview-2025-02-27",
                "gpt-4-turbo", "gpt-4-turbo-2024-04-09", "gpt-4-0125-preview", "gpt-4-turbo-preview",
                "gpt-4-1106-preview", "gpt-4-vision-preview", "gpt-4", "gpt-4-0314", "gpt-4-0613",
                "gpt-4-32k", "gpt-4-32k-0314", "gpt-4-32k-0613", "gpt-3.5-turbo", "gpt-3.5-turbo-16k",
                "gpt-3.5-turbo-0613", "gpt-3.5-turbo-1106", "gpt-3.5-turbo-0125", "gpt-3.5-turbo-16k-0613",
            ],
        ]
        | Omit = omit,
        name: Optional[str] | Omit = omit,
        reasoning_effort: Optional[ReasoningEffort] | Omit = omit,
        response_format: Optional[AssistantResponseFormatOptionParam] | Omit = omit,
        temperature: Optional[float] | Omit = omit,
        tool_resources: Optional[assistant_update_params.ToolResources] | Omit = omit,
        tools: Iterable[AssistantToolParam] | Omit = omit,
        top_p: Optional[float] | Omit = omit,
        # Use the following arguments if you need to pass additional parameters to the API that aren't available via kwargs.
        # The extra values given here take precedence over values defined on the client or passed to this method.
        extra_headers: Headers | None = None,
        extra_query: Query | None = None,
        extra_body: Body | None = None,
        timeout: float | httpx.Timeout | None | NotGiven = not_given,
    ) -> Assistant:
        """Modifies an assistant.

        Arguments are documented on `Assistants.update`.
        """
        if not assistant_id:
            raise ValueError(f"Expected a non-empty value for `assistant_id` but received {assistant_id!r}")
        extra_headers = {"OpenAI-Beta": "assistants=v2", **(extra_headers or {})}
        return await self._post(
            f"/assistants/{assistant_id}",
            body=await async_maybe_transform(
                {
                    "description": description,
                    "instructions": instructions,
                    "metadata": metadata,
                    "model": model,
                    "name": name,
                    "reasoning_effort": reasoning_effort,
                    "response_format": response_format,
                    "temperature": temperature,
                    "tool_resources": tool_resources,
                    "tools": tools,
                    "top_p": top_p,
                },
                assistant_update_params.AssistantUpdateParams,
            ),
            options=make_request_options(
                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
            ),
            cast_to=Assistant,
        )

    def list(
        self,
        *,
        after: str | Omit = omit,
        before: str | Omit = omit,
        limit: int | Omit = omit,
        order: Literal["asc", "desc"] | Omit = omit,
        extra_headers: Headers | None = None,
        extra_query: Query | None = None,
        extra_body: Body | None = None,
        timeout: float | httpx.Timeout | None | NotGiven = not_given,
    ) -> AsyncPaginator[Assistant, AsyncCursorPage[Assistant]]:
        """Returns a list of assistants.

        Arguments are documented on `Assistants.list`.
        """
        extra_headers = {"OpenAI-Beta": "assistants=v2", **(extra_headers or {})}
        return self._get_api_list(
            "/assistants",
            page=AsyncCursorPage[Assistant],
            options=make_request_options(
                extra_headers=extra_headers,
                extra_query=extra_query,
                extra_body=extra_body,
                timeout=timeout,
                query=maybe_transform(
                    {
                        "after": after,
                        "before": before,
                        "limit": limit,
                        "order": order,
                    },
                    assistant_list_params.AssistantListParams,
                ),
            ),
            model=Assistant,
        )

    async def delete(
        self,
        assistant_id: str,
        *,
        extra_headers: Headers | None = None,
        extra_query: Query | None = None,
        extra_body: Body | None = None,
        timeout: float | httpx.Timeout | None | NotGiven = not_given,
    ) -> AssistantDeleted:
        """Delete an assistant.

        Arguments are documented on `Assistants.delete`.
        """
        if not assistant_id:
            raise ValueError(f"Expected a non-empty value for `assistant_id` but received {assistant_id!r}")
        extra_headers = {"OpenAI-Beta": "assistants=v2", **(extra_headers or {})}
        return await self._delete(
            f"/assistants/{assistant_id}",
            options=make_request_options(
                extra_headers=extra_headers, extra_query=extra_query, extra_body=extra_body, timeout=timeout
            ),
            cast_to=AssistantDeleted,
        )


class AssistantsWithRawResponse:
    def __init__(self, assistants: Assistants) -> None:
        self._assistants = assistants

        self.create = _legacy_response.to_raw_response_wrapper(assistants.create)
        self.retrieve = _legacy_response.to_raw_response_wrapper(assistants.retrieve)
        self.update = _legacy_response.to_raw_response_wrapper(assistants.update)
        self.list = _legacy_response.to_raw_response_wrapper(assistants.list)
        self.delete = _legacy_response.to_raw_response_wrapper(assistants.delete)


class AsyncAssistantsWithRawResponse:
    def __init__(self, assistants: AsyncAssistants) -> None:
        self._assistants = assistants

        self.create = _legacy_response.async_to_raw_response_wrapper(assistants.create)
        self.retrieve = _legacy_response.async_to_raw_response_wrapper(assistants.retrieve)
        self.update = _legacy_response.async_to_raw_response_wrapper(assistants.update)
        self.list = _legacy_response.async_to_raw_response_wrapper(assistants.list)
        self.delete = _legacy_response.async_to_raw_response_wrapper(assistants.delete)


class AssistantsWithStreamingResponse:
    def __init__(self, assistants: Assistants) -> None:
        self._assistants = assistants

        self.create = to_streamed_response_wrapper(assistants.create)
        self.retrieve = to_streamed_response_wrapper(assistants.retrieve)
        self.update = to_streamed_response_wrapper(assistants.update)
        self.list = to_streamed_response_wrapper(assistants.list)
        self.delete = to_streamed_response_wrapper(assistants.delete)


class AsyncAssistantsWithStreamingResponse:
    def __init__(self, assistants: AsyncAssistants) -> None:
        self._assistants = assistants

        self.create = async_to_streamed_response_wrapper(assistants.create)
        self.retrieve = async_to_streamed_response_wrapper(assistants.retrieve)
        self.update = async_to_streamed_response_wrapper(assistants.update)
        self.list = async_to_streamed_response_wrapper(assistants.list)
        self.delete = async_to_streamed_response_wrapper(assistants.delete)
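
# Example: reaching this resource through a configured client. A minimal,
# illustrative sketch (assumes the `OPENAI_API_KEY` environment variable is
# set); the resource itself is mounted at `client.beta.assistants`.
#
#     from openai import OpenAI
#
#     client = OpenAI()
#     assistant = client.beta.assistants.create(
#         model="gpt-4o",
#         name="Math Tutor",
#         instructions="You answer math questions, showing your work.",
#         tools=[{"type": "code_interpreter"}],
#     )
#     for a in client.beta.assistants.list(limit=20):  # pages are auto-iterated
#         print(a.id, a.name)
#     client.beta.assistants.delete(assistant.id)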