/**
 * Option bag describing the fields accepted by `WatsonxDeployedInputLLM`.
 *
 * Only `serviceUrl` and `version` are required; every other member is
 * optional. A number of members are typed as `undefined` (for example
 * `model`, `temperature`, `topK`), which means that on this shape they can
 * only be omitted or explicitly left `undefined`.
 *
 * NOTE(review): presumably this is the constructor input for an LLM backed by
 * an existing watsonx deployment, with the `undefined`-typed members being
 * generation parameters that are fixed by the deployment — confirm against
 * the consuming class.
 */
interface WatsonxDeployedInputLLM {
    authenticator?: string;
    cache?: boolean | BaseCache<Generation[]>;
    /**
     * Use `callbacks` instead.
     * NOTE(review): reads like a deprecation notice — confirm before relying on it.
     */
    callbackManager?: CallbackManager;
    callbacks?: Callbacks;
    /**
     * Use `maxConcurrency` instead.
     * NOTE(review): reads like a deprecation notice — confirm before relying on it.
     */
    concurrency?: number;
    decodingMethod?: undefined;
    idOrName?: string;
    includeStopSequence?: undefined;
    lengthPenalty?: undefined;
    maxConcurrency?: number;
    maxNewTokens?: undefined;
    maxRetries?: number;
    metadata?: Record<string, unknown>;
    minNewTokens?: undefined;
    model?: undefined;
    /**
     * Custom handler to handle failed attempts. Takes the originally thrown
     * error object as input, and should itself throw an error if the input
     * error is not retryable.
     */
    onFailedAttempt?: FailedAttemptHandler;
    randomSeed?: undefined;
    repetitionPenalty?: undefined;
    returnOptions?: undefined;
    /** Required. */
    serviceUrl: string;
    stopSequence?: undefined;
    streaming?: boolean;
    tags?: string[];
    temperature?: undefined;
    timeLimit?: undefined;
    topK?: undefined;
    topP?: undefined;
    // NOTE(review): the name looks like a misspelling of "truncateInputTokens".
    // It is part of the public property name, so it is left untouched here.
    truncateInpuTokens?: undefined;
    verbose?: boolean;
    /** Required. */
    version: string;
    // NOTE(review): `any` disables checking of the callback type argument;
    // a narrower argument may be possible — confirm against RequestCallbacks.
    watsonxCallbacks?: RequestCallbacks<any>;
}

Hierarchy

  • WatsonxDeployedParams
  • BaseLLMParams
  • Neverify<WatsonxLLMParams>
    • WatsonxDeployedInputLLM

Properties

authenticator?: string
cache?: boolean | BaseCache<Generation[]>
callbackManager?: CallbackManager

Use `callbacks` instead of `callbackManager`.

callbacks?: Callbacks
concurrency?: number

Use `maxConcurrency` instead of `concurrency`.

decodingMethod?: undefined
idOrName?: string
includeStopSequence?: undefined
lengthPenalty?: undefined
maxConcurrency?: number
maxNewTokens?: undefined
maxRetries?: number
metadata?: Record<string, unknown>
minNewTokens?: undefined
model?: undefined
onFailedAttempt?: FailedAttemptHandler

Custom handler to handle failed attempts. Takes the originally thrown error object as input, and should itself throw an error if the input error is not retryable.

randomSeed?: undefined
repetitionPenalty?: undefined
returnOptions?: undefined
serviceUrl: string
stopSequence?: undefined
streaming?: boolean
tags?: string[]
temperature?: undefined
timeLimit?: undefined
topK?: undefined
topP?: undefined
truncateInpuTokens?: undefined
verbose?: boolean
version: string
watsonxCallbacks?: RequestCallbacks<any>