Optional baseUrl
baseUrl?: string
Optional checkOrPullModel
checkOrPullModel?: boolean
Optional embeddingOnly
embeddingOnly?: boolean
Optional f16Kv
f16Kv?: boolean
Optional fetch
fetch?: {
(input: RequestInfo | URL, init?: RequestInit): Promise<Response>;
(input: string | Request | URL, init?: RequestInit): Promise<Response>;
}
Type Declaration
- (input: RequestInfo | URL, init?: RequestInit): Promise<Response>
Parameters
- input: RequestInfo | URL
- Optional init: RequestInit
Returns Promise<Response>
- (input: string | Request | URL, init?: RequestInit): Promise<Response>
Parameters
- input: string | Request | URL
- Optional init: RequestInit
Returns Promise<Response>
format?: string | Record<string, any>
Optional frequencyPenalty
frequencyPenalty?: number
headers?: Headers | Record<string, string>
Optional keepAlive
keepAlive?: string | number
Optional logitsAll
logitsAll?: boolean
Optional lowVram
lowVram?: boolean
Optional mainGpu
mainGpu?: number
Optional mirostat
mirostat?: number
Optional mirostatEta
mirostatEta?: number
Optional mirostatTau
mirostatTau?: number
Optional model
model?: string
Optional numa
numa?: boolean
Optional numBatch
numBatch?: number
Optional numCtx
numCtx?: number
Optional numGpu
numGpu?: number
Optional numKeep
numKeep?: number
Optional numPredict
numPredict?: number
Optional numThread
numThread?: number
Optional penalizeNewline
penalizeNewline?: boolean
Optional presencePenalty
presencePenalty?: number
Optional repeatLastN
repeatLastN?: number
Optional repeatPenalty
repeatPenalty?: number
Optional seed
seed?: number
Optional stop
stop?: string[]
Optional streaming
streaming?: boolean
Optional temperature
temperature?: number
Optional tfsZ
tfsZ?: number
Optional think
think?: boolean
Optional topK
topK?: number
Optional topP
topP?: number
Optional typicalP
typicalP?: number
Optional useMlock
useMlock?: boolean
Optional useMmap
useMmap?: boolean
Optional vocabOnly
vocabOnly?: boolean
Input to chat model class.