
    Ig}}                      d dl mZ d dlZd dlmZmZmZmZmZ d dl	m
Z
mZ d dlZd dlZddlmZ ddlmZmZmZmZmZ ddlmZmZmZ dd	lmZ dd
lmZmZ ddlm Z m!Z! ddl"m#Z#m$Z$ ddl%m&Z&m'Z' ddl(m)Z) ddl*m+Z+ ddl,m-Z- ddl.m/Z/ ddl0m1Z1 ddl2m3Z3 ddl4m&Z& ddl5m6Z6 ddl7m8Z8 ddl9m:Z: ddl;m<Z< ddgZ= G d de      Z> G d de      Z? G d d      Z@ G d d       ZA G d! d"      ZB G d# d$      ZCd&d%ZDy)'    )annotationsN)DictListUnionIterableOptional)Literaloverload   )_legacy_response)	NOT_GIVENBodyQueryHeadersNotGiven)required_argsmaybe_transformasync_maybe_transform)cached_property)SyncAPIResourceAsyncAPIResource)to_streamed_response_wrapper"async_to_streamed_response_wrapper)StreamAsyncStream)ChatCompletionAudioParamcompletion_create_params)make_request_options)	ChatModel)ChatCompletion)ChatCompletionChunk)ChatCompletionModality)ChatCompletionToolParam)r   )ChatCompletionMessageParam) ChatCompletionStreamOptionsParam)$ChatCompletionPredictionContentParam)#ChatCompletionToolChoiceOptionParamCompletionsAsyncCompletionsc            !         e Zd Zedd       Zedd       Zeeeeeeeeeeeeeeeeeeeeeeeeeeeeddded	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 dd       Zeeeeeeeeeeeeeeeeeeeeeeeeeeeddded	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 dd	       Zeeeeeeeeeeeeeeeeeeeeeeeeeeeddded	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 dd
       Z e	ddgg d      eeeeeeeeeeeeeeeeeeeeeeeeeeeddded	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 dd       Zy)r(   c                    t        |       S a  
        This property can be used as a prefix for any HTTP method call to return the
        the raw response object instead of the parsed content.

        For more information, see https://www.github.com/openai/openai-python#accessing-raw-response-data-eg-headers
        )CompletionsWithRawResponseselfs    ^/var/www/html/answerous/venv/lib/python3.12/site-packages/openai/resources/chat/completions.pywith_raw_responsezCompletions.with_raw_response+   s     *$//    c                    t        |       S z
        An alternative to `.with_raw_response` that doesn't eagerly read the response body.

        For more information, see https://www.github.com/openai/openai-python#with_streaming_response
        ) CompletionsWithStreamingResponser.   s    r0   with_streaming_responsez#Completions.with_streaming_response5   s     055r2   Naudiofrequency_penaltyfunction_call	functions
logit_biaslogprobsmax_completion_tokens
max_tokensmetadata
modalitiesnparallel_tool_calls
predictionpresence_penaltyresponse_formatseedservice_tierstopstorestreamstream_optionstemperaturetool_choicetoolstop_logprobstop_puserextra_headersextra_query
extra_bodytimeoutmessagesmodelc       !             ya-  Creates a model response for the given chat conversation.

        Learn more in the
        [text generation](https://platform.openai.com/docs/guides/text-generation),
        [vision](https://platform.openai.com/docs/guides/vision), and
        [audio](https://platform.openai.com/docs/guides/audio) guides.

        Args:
          messages: A list of messages comprising the conversation so far. Depending on the
              [model](https://platform.openai.com/docs/models) you use, different message
              types (modalities) are supported, like
              [text](https://platform.openai.com/docs/guides/text-generation),
              [images](https://platform.openai.com/docs/guides/vision), and
              [audio](https://platform.openai.com/docs/guides/audio).

          model: ID of the model to use. See the
              [model endpoint compatibility](https://platform.openai.com/docs/models#model-endpoint-compatibility)
              table for details on which models work with the Chat API.

          audio: Parameters for audio output. Required when audio output is requested with
              `modalities: ["audio"]`.
              [Learn more](https://platform.openai.com/docs/guides/audio).

          frequency_penalty: Number between -2.0 and 2.0. Positive values penalize new tokens based on their
              existing frequency in the text so far, decreasing the model's likelihood to
              repeat the same line verbatim.

              [See more information about frequency and presence penalties.](https://platform.openai.com/docs/guides/text-generation)

          function_call: Deprecated in favor of `tool_choice`.

              Controls which (if any) function is called by the model. `none` means the model
              will not call a function and instead generates a message. `auto` means the model
              can pick between generating a message or calling a function. Specifying a
              particular function via `{"name": "my_function"}` forces the model to call that
              function.

              `none` is the default when no functions are present. `auto` is the default if
              functions are present.

          functions: Deprecated in favor of `tools`.

              A list of functions the model may generate JSON inputs for.

          logit_bias: Modify the likelihood of specified tokens appearing in the completion.

              Accepts a JSON object that maps tokens (specified by their token ID in the
              tokenizer) to an associated bias value from -100 to 100. Mathematically, the
              bias is added to the logits generated by the model prior to sampling. The exact
              effect will vary per model, but values between -1 and 1 should decrease or
              increase likelihood of selection; values like -100 or 100 should result in a ban
              or exclusive selection of the relevant token.

          logprobs: Whether to return log probabilities of the output tokens or not. If true,
              returns the log probabilities of each output token returned in the `content` of
              `message`.

          max_completion_tokens: An upper bound for the number of tokens that can be generated for a completion,
              including visible output tokens and
              [reasoning tokens](https://platform.openai.com/docs/guides/reasoning).

          max_tokens: The maximum number of [tokens](/tokenizer) that can be generated in the chat
              completion. This value can be used to control
              [costs](https://openai.com/api/pricing/) for text generated via API.

              This value is now deprecated in favor of `max_completion_tokens`, and is not
              compatible with
              [o1 series models](https://platform.openai.com/docs/guides/reasoning).

          metadata: Developer-defined tags and values used for filtering completions in the
              [dashboard](https://platform.openai.com/chat-completions).

          modalities: Output types that you would like the model to generate for this request. Most
              models are capable of generating text, which is the default:

              `["text"]`

              The `gpt-4o-audio-preview` model can also be used to
              [generate audio](https://platform.openai.com/docs/guides/audio). To request that
              this model generate both text and audio responses, you can use:

              `["text", "audio"]`

          n: How many chat completion choices to generate for each input message. Note that
              you will be charged based on the number of generated tokens across all of the
              choices. Keep `n` as `1` to minimize costs.

          parallel_tool_calls: Whether to enable
              [parallel function calling](https://platform.openai.com/docs/guides/function-calling#configuring-parallel-function-calling)
              during tool use.

          prediction: Static predicted output content, such as the content of a text file that is
              being regenerated.

          presence_penalty: Number between -2.0 and 2.0. Positive values penalize new tokens based on
              whether they appear in the text so far, increasing the model's likelihood to
              talk about new topics.

              [See more information about frequency and presence penalties.](https://platform.openai.com/docs/guides/text-generation)

          response_format: An object specifying the format that the model must output. Compatible with
              [GPT-4o](https://platform.openai.com/docs/models#gpt-4o),
              [GPT-4o mini](https://platform.openai.com/docs/models#gpt-4o-mini),
              [GPT-4 Turbo](https://platform.openai.com/docs/models#gpt-4-turbo-and-gpt-4) and
              all GPT-3.5 Turbo models newer than `gpt-3.5-turbo-1106`.

              Setting to `{ "type": "json_schema", "json_schema": {...} }` enables Structured
              Outputs which ensures the model will match your supplied JSON schema. Learn more
              in the
              [Structured Outputs guide](https://platform.openai.com/docs/guides/structured-outputs).

              Setting to `{ "type": "json_object" }` enables JSON mode, which ensures the
              message the model generates is valid JSON.

              **Important:** when using JSON mode, you **must** also instruct the model to
              produce JSON yourself via a system or user message. Without this, the model may
              generate an unending stream of whitespace until the generation reaches the token
              limit, resulting in a long-running and seemingly "stuck" request. Also note that
              the message content may be partially cut off if `finish_reason="length"`, which
              indicates the generation exceeded `max_tokens` or the conversation exceeded the
              max context length.

          seed: This feature is in Beta. If specified, our system will make a best effort to
              sample deterministically, such that repeated requests with the same `seed` and
              parameters should return the same result. Determinism is not guaranteed, and you
              should refer to the `system_fingerprint` response parameter to monitor changes
              in the backend.

          service_tier: Specifies the latency tier to use for processing the request. This parameter is
              relevant for customers subscribed to the scale tier service:

              - If set to 'auto', and the Project is Scale tier enabled, the system will
                utilize scale tier credits until they are exhausted.
              - If set to 'auto', and the Project is not Scale tier enabled, the request will
                be processed using the default service tier with a lower uptime SLA and no
                latency guarentee.
              - If set to 'default', the request will be processed using the default service
                tier with a lower uptime SLA and no latency guarentee.
              - When not set, the default behavior is 'auto'.

              When this parameter is set, the response body will include the `service_tier`
              utilized.

          stop: Up to 4 sequences where the API will stop generating further tokens.

          store: Whether or not to store the output of this chat completion request for use in
              our [model distillation](https://platform.openai.com/docs/guides/distillation)
              or [evals](https://platform.openai.com/docs/guides/evals) products.

          stream: If set, partial message deltas will be sent, like in ChatGPT. Tokens will be
              sent as data-only
              [server-sent events](https://developer.mozilla.org/en-US/docs/Web/API/Server-sent_events/Using_server-sent_events#Event_stream_format)
              as they become available, with the stream terminated by a `data: [DONE]`
              message.
              [Example Python code](https://cookbook.openai.com/examples/how_to_stream_completions).

          stream_options: Options for streaming response. Only set this when you set `stream: true`.

          temperature: What sampling temperature to use, between 0 and 2. Higher values like 0.8 will
              make the output more random, while lower values like 0.2 will make it more
              focused and deterministic.

              We generally recommend altering this or `top_p` but not both.

          tool_choice: Controls which (if any) tool is called by the model. `none` means the model will
              not call any tool and instead generates a message. `auto` means the model can
              pick between generating a message or calling one or more tools. `required` means
              the model must call one or more tools. Specifying a particular tool via
              `{"type": "function", "function": {"name": "my_function"}}` forces the model to
              call that tool.

              `none` is the default when no tools are present. `auto` is the default if tools
              are present.

          tools: A list of tools the model may call. Currently, only functions are supported as a
              tool. Use this to provide a list of functions the model may generate JSON inputs
              for. A max of 128 functions are supported.

          top_logprobs: An integer between 0 and 20 specifying the number of most likely tokens to
              return at each token position, each with an associated log probability.
              `logprobs` must be set to `true` if this parameter is used.

          top_p: An alternative to sampling with temperature, called nucleus sampling, where the
              model considers the results of the tokens with top_p probability mass. So 0.1
              means only the tokens comprising the top 10% probability mass are considered.

              We generally recommend altering this or `temperature` but not both.

          user: A unique identifier representing your end-user, which can help OpenAI to monitor
              and detect abuse.
              [Learn more](https://platform.openai.com/docs/guides/safety-best-practices#end-user-ids).

          extra_headers: Send extra headers

          extra_query: Add additional query parameters to the request

          extra_body: Add additional JSON properties to the request

          timeout: Override the client-level default timeout for this request, in seconds
        N "r/   rW   rX   r8   r9   r:   r;   r<   r=   r>   r?   r@   rA   rB   rC   rD   rE   rF   rG   rH   rI   rJ   rK   rL   rM   rN   rO   rP   rQ   rR   rS   rT   rU   rV   s"                                     r0   createzCompletions.create>       ` 	r2   r8   r9   r:   r;   r<   r=   r>   r?   r@   rA   rB   rC   rD   rE   rF   rG   rH   rI   rJ   rL   rM   rN   rO   rP   rQ   rR   rS   rT   rU   rV   c       !             ya-  Creates a model response for the given chat conversation.

        Learn more in the
        [text generation](https://platform.openai.com/docs/guides/text-generation),
        [vision](https://platform.openai.com/docs/guides/vision), and
        [audio](https://platform.openai.com/docs/guides/audio) guides.

        Args:
          messages: A list of messages comprising the conversation so far. Depending on the
              [model](https://platform.openai.com/docs/models) you use, different message
              types (modalities) are supported, like
              [text](https://platform.openai.com/docs/guides/text-generation),
              [images](https://platform.openai.com/docs/guides/vision), and
              [audio](https://platform.openai.com/docs/guides/audio).

          model: ID of the model to use. See the
              [model endpoint compatibility](https://platform.openai.com/docs/models#model-endpoint-compatibility)
              table for details on which models work with the Chat API.

          stream: If set, partial message deltas will be sent, like in ChatGPT. Tokens will be
              sent as data-only
              [server-sent events](https://developer.mozilla.org/en-US/docs/Web/API/Server-sent_events/Using_server-sent_events#Event_stream_format)
              as they become available, with the stream terminated by a `data: [DONE]`
              message.
              [Example Python code](https://cookbook.openai.com/examples/how_to_stream_completions).

          audio: Parameters for audio output. Required when audio output is requested with
              `modalities: ["audio"]`.
              [Learn more](https://platform.openai.com/docs/guides/audio).

          frequency_penalty: Number between -2.0 and 2.0. Positive values penalize new tokens based on their
              existing frequency in the text so far, decreasing the model's likelihood to
              repeat the same line verbatim.

              [See more information about frequency and presence penalties.](https://platform.openai.com/docs/guides/text-generation)

          function_call: Deprecated in favor of `tool_choice`.

              Controls which (if any) function is called by the model. `none` means the model
              will not call a function and instead generates a message. `auto` means the model
              can pick between generating a message or calling a function. Specifying a
              particular function via `{"name": "my_function"}` forces the model to call that
              function.

              `none` is the default when no functions are present. `auto` is the default if
              functions are present.

          functions: Deprecated in favor of `tools`.

              A list of functions the model may generate JSON inputs for.

          logit_bias: Modify the likelihood of specified tokens appearing in the completion.

              Accepts a JSON object that maps tokens (specified by their token ID in the
              tokenizer) to an associated bias value from -100 to 100. Mathematically, the
              bias is added to the logits generated by the model prior to sampling. The exact
              effect will vary per model, but values between -1 and 1 should decrease or
              increase likelihood of selection; values like -100 or 100 should result in a ban
              or exclusive selection of the relevant token.

          logprobs: Whether to return log probabilities of the output tokens or not. If true,
              returns the log probabilities of each output token returned in the `content` of
              `message`.

          max_completion_tokens: An upper bound for the number of tokens that can be generated for a completion,
              including visible output tokens and
              [reasoning tokens](https://platform.openai.com/docs/guides/reasoning).

          max_tokens: The maximum number of [tokens](/tokenizer) that can be generated in the chat
              completion. This value can be used to control
              [costs](https://openai.com/api/pricing/) for text generated via API.

              This value is now deprecated in favor of `max_completion_tokens`, and is not
              compatible with
              [o1 series models](https://platform.openai.com/docs/guides/reasoning).

          metadata: Developer-defined tags and values used for filtering completions in the
              [dashboard](https://platform.openai.com/chat-completions).

          modalities: Output types that you would like the model to generate for this request. Most
              models are capable of generating text, which is the default:

              `["text"]`

              The `gpt-4o-audio-preview` model can also be used to
              [generate audio](https://platform.openai.com/docs/guides/audio). To request that
              this model generate both text and audio responses, you can use:

              `["text", "audio"]`

          n: How many chat completion choices to generate for each input message. Note that
              you will be charged based on the number of generated tokens across all of the
              choices. Keep `n` as `1` to minimize costs.

          parallel_tool_calls: Whether to enable
              [parallel function calling](https://platform.openai.com/docs/guides/function-calling#configuring-parallel-function-calling)
              during tool use.

          prediction: Static predicted output content, such as the content of a text file that is
              being regenerated.

          presence_penalty: Number between -2.0 and 2.0. Positive values penalize new tokens based on
              whether they appear in the text so far, increasing the model's likelihood to
              talk about new topics.

              [See more information about frequency and presence penalties.](https://platform.openai.com/docs/guides/text-generation)

          response_format: An object specifying the format that the model must output. Compatible with
              [GPT-4o](https://platform.openai.com/docs/models#gpt-4o),
              [GPT-4o mini](https://platform.openai.com/docs/models#gpt-4o-mini),
              [GPT-4 Turbo](https://platform.openai.com/docs/models#gpt-4-turbo-and-gpt-4) and
              all GPT-3.5 Turbo models newer than `gpt-3.5-turbo-1106`.

              Setting to `{ "type": "json_schema", "json_schema": {...} }` enables Structured
              Outputs which ensures the model will match your supplied JSON schema. Learn more
              in the
              [Structured Outputs guide](https://platform.openai.com/docs/guides/structured-outputs).

              Setting to `{ "type": "json_object" }` enables JSON mode, which ensures the
              message the model generates is valid JSON.

              **Important:** when using JSON mode, you **must** also instruct the model to
              produce JSON yourself via a system or user message. Without this, the model may
              generate an unending stream of whitespace until the generation reaches the token
              limit, resulting in a long-running and seemingly "stuck" request. Also note that
              the message content may be partially cut off if `finish_reason="length"`, which
              indicates the generation exceeded `max_tokens` or the conversation exceeded the
              max context length.

          seed: This feature is in Beta. If specified, our system will make a best effort to
              sample deterministically, such that repeated requests with the same `seed` and
              parameters should return the same result. Determinism is not guaranteed, and you
              should refer to the `system_fingerprint` response parameter to monitor changes
              in the backend.

          service_tier: Specifies the latency tier to use for processing the request. This parameter is
              relevant for customers subscribed to the scale tier service:

              - If set to 'auto', and the Project is Scale tier enabled, the system will
                utilize scale tier credits until they are exhausted.
              - If set to 'auto', and the Project is not Scale tier enabled, the request will
                be processed using the default service tier with a lower uptime SLA and no
                latency guarentee.
              - If set to 'default', the request will be processed using the default service
                tier with a lower uptime SLA and no latency guarentee.
              - When not set, the default behavior is 'auto'.

              When this parameter is set, the response body will include the `service_tier`
              utilized.

          stop: Up to 4 sequences where the API will stop generating further tokens.

          store: Whether or not to store the output of this chat completion request for use in
              our [model distillation](https://platform.openai.com/docs/guides/distillation)
              or [evals](https://platform.openai.com/docs/guides/evals) products.

          stream_options: Options for streaming response. Only set this when you set `stream: true`.

          temperature: What sampling temperature to use, between 0 and 2. Higher values like 0.8 will
              make the output more random, while lower values like 0.2 will make it more
              focused and deterministic.

              We generally recommend altering this or `top_p` but not both.

          tool_choice: Controls which (if any) tool is called by the model. `none` means the model will
              not call any tool and instead generates a message. `auto` means the model can
              pick between generating a message or calling one or more tools. `required` means
              the model must call one or more tools. Specifying a particular tool via
              `{"type": "function", "function": {"name": "my_function"}}` forces the model to
              call that tool.

              `none` is the default when no tools are present. `auto` is the default if tools
              are present.

          tools: A list of tools the model may call. Currently, only functions are supported as a
              tool. Use this to provide a list of functions the model may generate JSON inputs
              for. A max of 128 functions are supported.

          top_logprobs: An integer between 0 and 20 specifying the number of most likely tokens to
              return at each token position, each with an associated log probability.
              `logprobs` must be set to `true` if this parameter is used.

          top_p: An alternative to sampling with temperature, called nucleus sampling, where the
              model considers the results of the tokens with top_p probability mass. So 0.1
              means only the tokens comprising the top 10% probability mass are considered.

              We generally recommend altering this or `temperature` but not both.

          user: A unique identifier representing your end-user, which can help OpenAI to monitor
              and detect abuse.
              [Learn more](https://platform.openai.com/docs/guides/safety-best-practices#end-user-ids).

          extra_headers: Send extra headers

          extra_query: Add additional query parameters to the request

          extra_body: Add additional JSON properties to the request

          timeout: Override the client-level default timeout for this request, in seconds
        Nr[   "r/   rW   rX   rK   r8   r9   r:   r;   r<   r=   r>   r?   r@   rA   rB   rC   rD   rE   rF   rG   rH   rI   rJ   rL   rM   rN   rO   rP   rQ   rR   rS   rT   rU   rV   s"                                     r0   r]   zCompletions.create0  r^   r2   c       !             yra   r[   rb   s"                                     r0   r]   zCompletions.create"  r^   r2   rW   rX   rK   c       !        :   t        |       | j                  dt        i d|d|d|d|d|d|d|d	|d
|	d|
d|d|d|d|d|d|d|||||||||||||dt        j                        t        ||| |!      t        |xs dt        t                 S Nz/chat/completionsrW   rX   r8   r9   r:   r;   r<   r=   r>   r?   r@   rA   rB   rC   rD   rE   rF   )rG   rH   rI   rJ   rK   rL   rM   rN   rO   rP   rQ   rR   )rS   rT   rU   rV   F)bodyoptionscast_torK   
stream_cls)	validate_response_format_postr   r   CompletionCreateParamsr   r    r   r!   r\   s"                                     r0   r]   zCompletions.create  sb   P 	!1zz U U ():	
 $]   !*  ,-B !*  !*  *+> !*  '(8!" &#$ !$0 "$&4#.#."$0" ;> )??A!D )+Q[el #?U12S  *
 *	
r2   )returnr-   )rn   r5   DrW   $Iterable[ChatCompletionMessageParam]rX   Union[str, ChatModel]r8   -Optional[ChatCompletionAudioParam] | NotGivenr9   Optional[float] | NotGivenr:   0completion_create_params.FunctionCall | NotGivenr;   6Iterable[completion_create_params.Function] | NotGivenr<   #Optional[Dict[str, int]] | NotGivenr=   Optional[bool] | NotGivenr>   Optional[int] | NotGivenr?   rx   r@   #Optional[Dict[str, str]] | NotGivenrA   1Optional[List[ChatCompletionModality]] | NotGivenrB   rx   rC   bool | NotGivenrD   9Optional[ChatCompletionPredictionContentParam] | NotGivenrE   rs   rF   2completion_create_params.ResponseFormat | NotGivenrG   rx   rH   /Optional[Literal['auto', 'default']] | NotGivenrI   *Union[Optional[str], List[str]] | NotGivenrJ   rw   rK   z#Optional[Literal[False]] | NotGivenrL   5Optional[ChatCompletionStreamOptionsParam] | NotGivenrM   rs   rN   .ChatCompletionToolChoiceOptionParam | NotGivenrO   ,Iterable[ChatCompletionToolParam] | NotGivenrP   rx   rQ   rs   rR   str | NotGivenrS   Headers | NonerT   Query | NonerU   Body | NonerV   'float | httpx.Timeout | None | NotGivenrn   r    )DrW   rp   rX   rq   rK   Literal[True]r8   rr   r9   rs   r:   rt   r;   ru   r<   rv   r=   rw   r>   rx   r?   rx   r@   ry   rA   rz   rB   rx   rC   r{   rD   r|   rE   rs   rF   r}   rG   rx   rH   r~   rI   r   rJ   rw   rL   r   rM   rs   rN   r   rO   r   rP   rx   rQ   rs   rR   r   rS   r   rT   r   rU   r   rV   r   rn   zStream[ChatCompletionChunk])DrW   rp   rX   rq   rK   boolr8   rr   r9   rs   r:   rt   r;   ru   r<   rv   r=   rw   r>   rx   r?   rx   r@   ry   rA   rz   rB   rx   rC   r{   rD   r|   rE   rs   rF   r}   rG   rx   rH   r~   rI   r   rJ   rw   rL   r   rM   rs   rN   r   rO   r   rP   rx   rQ   rs   rR   r   rS   r   rT   r   rU   r   rV   r   rn   ,ChatCompletion | Stream[ChatCompletionChunk])DrW   rp   rX   rq   r8   rr   r9   rs   r:   rt   r;   ru   r<   rv   r=   rw   r>   rx   r?   rx   r@   ry   rA   rz   rB   rx   rC   r{   rD   r|   rE   rs   rF   r}   rG   rx   rH   r~   rI   r   rJ   rw   rK   3Optional[Literal[False]] | Literal[True] | NotGivenrL   r   rM   rs   rN   r   rO   r   rP   rx   rQ   rs   rR   r   rS   r   rT   r   rU   r   rV   r   rn   r   
__name__
__module____qualname__r   r1   r6   r
   r   r]   r   r[   r2   r0   r(   r(   *   s<   0 0 6 6  @I8AJSLU:C.7:C/88AHQ&//8PY7@NW)2HQ;D+46?PY2;FO>G1:,5( )-$("&;DKo 7o %	o
 =o 6o Ho Jo 8o ,o  8o -o 6o Fo $o  -!o" N#o$ 5%o& L'o( ')o* F+o, 9-o. )/o0 41o2 N3o4 05o6 D7o8 <9o: /;o< *=o> ?oD &EoF "GoH  IoJ 9KoL 
Mo ob  @I8AJSLU:C.7:C/88AHQ&//8PY7@NW)2HQ;D+4PY2;FO>G1:,5( )-$("&;DKo 7o %	o
 o =o 6o Ho Jo 8o ,o  8o -o 6o Fo  $!o" -#o$ N%o& 5'o( L)o* '+o, F-o. 9/o0 )1o2 N3o4 05o6 D7o8 <9o: /;o< *=o> ?oD &EoF "GoH  IoJ 9KoL 
%Mo ob  @I8AJSLU:C.7:C/88AHQ&//8PY7@NW)2HQ;D+4PY2;FO>G1:,5( )-$("&;DKo 7o %	o
 o =o 6o Ho Jo 8o ,o  8o -o 6o Fo  $!o" -#o$ N%o& 5'o( L)o* '+o, F-o. 9/o0 )1o2 N3o4 05o6 D7o8 <9o: /;o< *=o> ?oD &EoF "GoH  IoJ 9KoL 
6Mo ob J(*IJ @I8AJSLU:C.7:C/88AHQ&//8PY7@NW)2HQ;D+4FOPY2;FO>G1:,5( )-$("&;DKR
 7R
 %	R

 =R
 6R
 HR
 JR
 8R
 ,R
  8R
 -R
 6R
 FR
 $R
  -!R
" N#R
$ 5%R
& L'R
( ')R
* F+R
, 9-R
. )/R
0 D1R
2 N3R
4 05R
6 D7R
8 <9R
: /;R
< *=R
> ?R
D &ER
F "GR
H  IR
J 9KR
L 
6MR
 KR
r2   c            !         e Zd Zedd       Zedd       Zeeeeeeeeeeeeeeeeeeeeeeeeeeeeddded	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 dd       Zeeeeeeeeeeeeeeeeeeeeeeeeeeeddded	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 dd	       Zeeeeeeeeeeeeeeeeeeeeeeeeeeeddded	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 dd
       Z e	ddgg d      eeeeeeeeeeeeeeeeeeeeeeeeeeeddded	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 	 dd       Zy)r)   c                    t        |       S r,   )AsyncCompletionsWithRawResponser.   s    r0   r1   z"AsyncCompletions.with_raw_responsek  s     /t44r2   c                    t        |       S r4   )%AsyncCompletionsWithStreamingResponser.   s    r0   r6   z(AsyncCompletions.with_streaming_responseu  s     5T::r2   Nr7   rW   rX   c       !           K   ywrZ   r[   r\   s"                                     r0   r]   zAsyncCompletions.create~       ` 	   r_   c       !           K   ywra   r[   rb   s"                                     r0   r]   zAsyncCompletions.createp  r   r   c       !           K   ywra   r[   rb   s"                                     r0   r]   zAsyncCompletions.createb  r   r   rd   c       !        j  K   t        |       | j                  dt        i d|d|d|d|d|d|d|d	|d
|	d|
d|d|d|d|d|d|d|||||||||||||dt        j                         d {   t        ||| |!      t        |xs dt        t                  d {   S 7 57 wrf   )	rk   rl   r   r   rm   r   r    r   r!   r\   s"                                     r0   r]   zAsyncCompletions.createT  s{    P 	!1ZZ,U U ():	
 $]   !*  ,-B !*  !*  *+> !*  '(8!" &#$ !$0 "$&4#.#."$0" ;> )??A! !D )+Q[el #?U"#67S   *
 *
 *	
!*
s$   A7B39B/
:0B3*B1+B31B3)rn   r   )rn   r   ro   )DrW   rp   rX   rq   rK   r   r8   rr   r9   rs   r:   rt   r;   ru   r<   rv   r=   rw   r>   rx   r?   rx   r@   ry   rA   rz   rB   rx   rC   r{   rD   r|   rE   rs   rF   r}   rG   rx   rH   r~   rI   r   rJ   rw   rL   r   rM   rs   rN   r   rO   r   rP   rx   rQ   rs   rR   r   rS   r   rT   r   rU   r   rV   r   rn   z AsyncStream[ChatCompletionChunk])DrW   rp   rX   rq   rK   r   r8   rr   r9   rs   r:   rt   r;   ru   r<   rv   r=   rw   r>   rx   r?   rx   r@   ry   rA   rz   rB   rx   rC   r{   rD   r|   rE   rs   rF   r}   rG   rx   rH   r~   rI   r   rJ   rw   rL   r   rM   rs   rN   r   rO   r   rP   rx   rQ   rs   rR   r   rS   r   rT   r   rU   r   rV   r   rn   1ChatCompletion | AsyncStream[ChatCompletionChunk])DrW   rp   rX   rq   r8   rr   r9   rs   r:   rt   r;   ru   r<   rv   r=   rw   r>   rx   r?   rx   r@   ry   rA   rz   rB   rx   rC   r{   rD   r|   rE   rs   rF   r}   rG   rx   rH   r~   rI   r   rJ   rw   rK   r   rL   r   rM   rs   rN   r   rO   r   rP   rx   rQ   rs   rR   r   rS   r   rT   r   rU   r   rV   r   rn   r   r   r[   r2   r0   r)   r)   j  s<   5 5 ; ;  @I8AJSLU:C.7:C/88AHQ&//8PY7@NW)2HQ;D+46?PY2;FO>G1:,5( )-$("&;DKo 7o %	o
 =o 6o Ho Jo 8o ,o  8o -o 6o Fo $o  -!o" N#o$ 5%o& L'o( ')o* F+o, 9-o. )/o0 41o2 N3o4 05o6 D7o8 <9o: /;o< *=o> ?oD &EoF "GoH  IoJ 9KoL 
Mo ob  @I8AJSLU:C.7:C/88AHQ&//8PY7@NW)2HQ;D+4PY2;FO>G1:,5( )-$("&;DKo 7o %	o
 o =o 6o Ho Jo 8o ,o  8o -o 6o Fo  $!o" -#o$ N%o& 5'o( L)o* '+o, F-o. 9/o0 )1o2 N3o4 05o6 D7o8 <9o: /;o< *=o> ?oD &EoF "GoH  IoJ 9KoL 
*Mo ob  @I8AJSLU:C.7:C/88AHQ&//8PY7@NW)2HQ;D+4PY2;FO>G1:,5( )-$("&;DKo 7o %	o
 o =o 6o Ho Jo 8o ,o  8o -o 6o Fo  $!o" -#o$ N%o& 5'o( L)o* '+o, F-o. 9/o0 )1o2 N3o4 05o6 D7o8 <9o: /;o< *=o> ?oD &EoF "GoH  IoJ 9KoL 
;Mo ob J(*IJ @I8AJSLU:C.7:C/88AHQ&//8PY7@NW)2HQ;D+4FOPY2;FO>G1:,5( )-$("&;DKR
 7R
 %	R

 =R
 6R
 HR
 JR
 8R
 ,R
  8R
 -R
 6R
 FR
 $R
  -!R
" N#R
$ 5%R
& L'R
( ')R
* F+R
, 9-R
. )/R
0 D1R
2 N3R
4 05R
6 D7R
8 <9R
: /;R
< *=R
> ?R
D &ER
F "GR
H  IR
J 9KR
L 
;MR
 KR
r2   c                      e Zd ZddZy)r-   c                Z    || _         t        j                  |j                        | _        y N)_completionsr   to_raw_response_wrapperr]   r/   completionss     r0   __init__z#CompletionsWithRawResponse.__init__  s%    '&>>
r2   Nr   r(   rn   Noner   r   r   r   r[   r2   r0   r-   r-         
r2   r-   c                      e Zd ZddZy)r   c                Z    || _         t        j                  |j                        | _        y r   )r   r   async_to_raw_response_wrapperr]   r   s     r0   r   z(AsyncCompletionsWithRawResponse.__init__  s%    '&DD
r2   Nr   r)   rn   r   r   r[   r2   r0   r   r     r   r2   r   c                      e Zd ZddZy)r5   c                F    || _         t        |j                        | _        y r   )r   r   r]   r   s     r0   r   z)CompletionsWithStreamingResponse.__init__  s    '2
r2   Nr   r   r[   r2   r0   r5   r5     r   r2   r5   c                      e Zd ZddZy)r   c                F    || _         t        |j                        | _        y r   )r   r   r]   r   s     r0   r   z.AsyncCompletionsWithStreamingResponse.__init__  s    '8
r2   Nr   r   r[   r2   r0   r   r     r   r2   r   c                z    t        j                  |       r&t        | t        j                        rt        d      y y )NzzYou tried to pass a `BaseModel` class to `chat.completions.create()`; You must use `beta.chat.completions.parse()` instead)inspectisclass
issubclasspydantic	BaseModel	TypeError)rF   s    r0   rk   rk     s9    'JHZHZ,[ I
 	
 -\'r2   )rF   objectrn   r   )E
__future__r   r   typingr   r   r   r   r   typing_extensionsr	   r
   httpxr    r   _typesr   r   r   r   r   _utilsr   r   r   _compatr   	_resourcer   r   	_responser   r   
_streamingr   r   
types.chatr   r   _base_clientr   types.chat_modelr   types.chat.chat_completionr     types.chat.chat_completion_chunkr!   #types.chat.chat_completion_modalityr"   %types.chat.chat_completion_tool_paramr#   &types.chat.chat_completion_audio_param(types.chat.chat_completion_message_paramr$   /types.chat.chat_completion_stream_options_paramr%   3types.chat.chat_completion_prediction_content_paramr&   3types.chat.chat_completion_tool_choice_option_paramr'   __all__r(   r)   r-   r   r5   r   rk   r[   r2   r0   <module>r      s    #  8 8 /     ? ? 
 ' : Y - 1 ) 8 C I L N R _ g f,
-}
/ }
@}
' }
@
 

 

 

 

r2   