/**
 * Input fields for configuring a DeepSeek chat model.
 *
 * The rendered hierarchy lists this interface under `ChatOpenAIFields`, so
 * several member descriptions still refer to OpenAI.
 */
interface ChatDeepSeekInput {
    /**
     * The Deepseek API key to use for requests.
     * @default process.env.DEEPSEEK_API_KEY
     */
    apiKey?: string;
    /**
     * Parameters for audio output. Required when audio output is requested
     * with `modalities: ["audio"]`.
     */
    audio?: ChatCompletionAudioParam;
    cache?: boolean | BaseCache<Generation[]>;
    /** @deprecated Use `callbacks` instead. */
    callbackManager?: CallbackManager;
    callbacks?: Callbacks;
    configuration?: ClientOptions;
    /**
     * Whether to disable streaming. If streaming is bypassed, `stream()`
     * defers to `invoke()`.
     * - `true`: always bypass the streaming case.
     * - `false` (default): always use the streaming case if available.
     */
    disableStreaming?: boolean;
    /** Penalizes repeated tokens according to frequency. */
    frequencyPenalty?: number;
    /** Dictionary used to adjust the probability of specific tokens being generated. */
    logitBias?: Record<string, number>;
    /**
     * Whether to return log probabilities of the output tokens. If true,
     * returns the log probabilities of each output token returned in the
     * content of the message.
     */
    logprobs?: boolean;
    /**
     * Maximum number of tokens to generate in the completion. -1 returns as
     * many tokens as possible given the prompt and the model's maximum
     * context size. Alias for `maxTokens` for reasoning models.
     */
    maxCompletionTokens?: number;
    /**
     * The maximum number of concurrent calls that can be made.
     * Defaults to `Infinity`, which means no limit.
     */
    maxConcurrency?: number;
    /**
     * The maximum number of retries that can be made for a single call, with
     * an exponential backoff between each attempt. Defaults to 6.
     */
    maxRetries?: number;
    /** The maximum number of tokens that the model can process in a single response. */
    maxTokens?: number;
    metadata?: Record<string, unknown>;
    /**
     * Output types the model should generate for this request. Text
     * (`["text"]`) is the default; `["text", "audio"]` requests both text and
     * audio from models that can generate audio.
     */
    modalities?: ChatCompletionModality[];
    /** The name of the model to use. */
    model?: string;
    /**
     * Holds any additional parameters that are valid to pass to
     * `openai.createCompletion` but are not explicitly specified on this class.
     */
    modelKwargs?: Record<string, any>;
    /**
     * Model name to use. Alias for `model`.
     * @deprecated Use `model` instead.
     */
    modelName?: string;
    /** Number of completions to generate for each prompt. */
    n?: number;
    /**
     * Custom handler for failed attempts. Receives the originally thrown
     * error object and should itself throw if that error is not retryable.
     */
    onFailedAttempt?: FailedAttemptHandler;
    /**
     * API key to use when making requests to OpenAI. Defaults to the value of
     * the `OPENAI_API_KEY` environment variable. Alias for `apiKey`.
     */
    openAIApiKey?: string;
    /** ChatGPT messages to pass as a prefix to the prompt. */
    prefixMessages?: ChatCompletionMessageParam[];
    /** Penalizes repeated tokens. */
    presencePenalty?: number;
    /**
     * Constrains effort on reasoning for reasoning models. Currently
     * supported values are `low`, `medium`, and `high`. Reducing reasoning
     * effort can result in faster responses and fewer reasoning tokens.
     */
    reasoningEffort?: ChatCompletionReasoningEffort;
    /**
     * Up to 4 sequences where the API will stop generating further tokens.
     * The returned text will not contain the stop sequence.
     * Alias for `stopSequences`.
     */
    stop?: string[];
    /**
     * Up to 4 sequences where the API will stop generating further tokens.
     * The returned text will not contain the stop sequence.
     */
    stopSequences?: string[];
    /**
     * Whether or not to include token usage data in streamed chunks.
     * @default true
     */
    streamUsage?: boolean;
    /** Whether or not to stream responses. */
    streaming?: boolean;
    /**
     * Whether the model supports the `strict` argument when passing in tools.
     * If undefined, the `strict` argument is not passed to OpenAI.
     */
    supportsStrictToolCalling?: boolean;
    tags?: string[];
    /** The temperature to use for sampling. */
    temperature?: number;
    /** Timeout to use when making requests to OpenAI. */
    timeout?: number;
    /**
     * An integer between 0 and 5 specifying the number of most likely tokens
     * to return at each token position, each with an associated log
     * probability. `logprobs` must be set to true if this parameter is used.
     */
    topLogprobs?: number;
    /** Total probability mass of tokens to consider at each step. */
    topP?: number;
    /**
     * Unique string identifier representing your end-user, which can help
     * OpenAI to monitor and detect abuse.
     */
    user?: string;
    verbose?: boolean;
}

Hierarchy

  • ChatOpenAIFields
    • ChatDeepSeekInput

Properties

apiKey?: string

The Deepseek API key to use for requests.

Default: process.env.DEEPSEEK_API_KEY

audio?: ChatCompletionAudioParam

Parameters for audio output. Required when audio output is requested with modalities: ["audio"]. Learn more.

cache?: boolean | BaseCache<Generation[]>
callbackManager?: CallbackManager

Deprecated: use callbacks instead.

callbacks?: Callbacks
configuration?: ClientOptions
disableStreaming?: boolean

Whether to disable streaming.

If streaming is bypassed, then stream() will defer to invoke().

  • If true, will always bypass streaming case.
  • If false (default), will always use streaming case if available.
frequencyPenalty?: number

Penalizes repeated tokens according to frequency

logitBias?: Record<string, number>

Dictionary used to adjust the probability of specific tokens being generated

logprobs?: boolean

Whether to return log probabilities of the output tokens or not. If true, returns the log probabilities of each output token returned in the content of message.

maxCompletionTokens?: number

Maximum number of tokens to generate in the completion. -1 returns as many tokens as possible given the prompt and the model's maximum context size. Alias for maxTokens for reasoning models.

maxConcurrency?: number

The maximum number of concurrent calls that can be made. Defaults to Infinity, which means no limit.

maxRetries?: number

The maximum number of retries that can be made for a single call, with an exponential backoff between each attempt. Defaults to 6.

maxTokens?: number

The maximum number of tokens that the model can process in a single response. This limit ensures computational efficiency and resource management.

metadata?: Record<string, unknown>
modalities?: ChatCompletionModality[]

Output types that you would like the model to generate for this request. Most models are capable of generating text, which is the default:

["text"]

The gpt-4o-audio-preview model can also be used to generate audio. To request that this model generate both text and audio responses, you can use:

["text", "audio"]

model?: string

The name of the model to use.

modelKwargs?: Record<string, any>

Holds any additional parameters that are valid to pass to openai.createCompletion that are not explicitly specified on this class.

modelName?: string

Model name to use. Alias for model.

Deprecated: use "model" instead.

n?: number

Number of completions to generate for each prompt

onFailedAttempt?: FailedAttemptHandler

Custom handler to handle failed attempts. Takes the originally thrown error object as input, and should itself throw an error if the input error is not retryable.

openAIApiKey?: string

API key to use when making requests to OpenAI. Defaults to the value of the OPENAI_API_KEY environment variable. Alias for apiKey.

prefixMessages?: ChatCompletionMessageParam[]

ChatGPT messages to pass as a prefix to the prompt

presencePenalty?: number

Penalizes repeated tokens

reasoningEffort?: ChatCompletionReasoningEffort

Constrains effort on reasoning for reasoning models. Currently supported values are low, medium, and high. Reducing reasoning effort can result in faster responses and fewer tokens used on reasoning in a response.

stop?: string[]

Up to 4 sequences where the API will stop generating further tokens. The returned text will not contain the stop sequence. Alias for stopSequences.

stopSequences?: string[]

Up to 4 sequences where the API will stop generating further tokens. The returned text will not contain the stop sequence.

streamUsage?: boolean

Whether or not to include token usage data in streamed chunks.

Default: true
streaming?: boolean

Whether or not to stream responses.

supportsStrictToolCalling?: boolean

Whether the model supports the strict argument when passing in tools. If undefined the strict argument will not be passed to OpenAI.

tags?: string[]
temperature?: number

The temperature to use for sampling.

timeout?: number

Timeout to use when making requests to OpenAI.

topLogprobs?: number

An integer between 0 and 5 specifying the number of most likely tokens to return at each token position, each with an associated log probability. logprobs must be set to true if this parameter is used.

topP?: number

Total probability mass of tokens to consider at each step

user?: string

Unique string identifier representing your end-user, which can help OpenAI to monitor and detect abuse.

verbose?: boolean