Class: LlamaDeuce
Llama2 LLM implementation
Hierarchy
- BaseLLM
  ↳ LlamaDeuce
Constructors
constructor
• new LlamaDeuce(init?): LlamaDeuce
Parameters
Name | Type |
---|---|
init? | Partial<LlamaDeuce> |
Returns
LlamaDeuce
Overrides
BaseLLM.constructor
Defined in
packages/core/src/llm/LLM.ts:83
Properties
chatStrategy
• chatStrategy: DeuceChatStrategy
Defined in
packages/core/src/llm/LLM.ts:77
maxTokens
• Optional maxTokens: number
Defined in
packages/core/src/llm/LLM.ts:80
model
• model: "Llama-2-70b-chat-old"
| "Llama-2-70b-chat-4bit"
| "Llama-2-13b-chat-old"
| "Llama-2-13b-chat-4bit"
| "Llama-2-7b-chat-old"
| "Llama-2-7b-chat-4bit"
Defined in
packages/core/src/llm/LLM.ts:76
replicateSession
• replicateSession: ReplicateSession
Defined in
packages/core/src/llm/LLM.ts:81
temperature
• temperature: number
Defined in
packages/core/src/llm/LLM.ts:78
topP
• topP: number
Defined in
packages/core/src/llm/LLM.ts:79
Accessors
metadata
• get metadata(): Object
Returns
Object
Name | Type |
---|---|
contextWindow | number |
maxTokens | undefined \| number |
model | "Llama-2-70b-chat-old" \| "Llama-2-70b-chat-4bit" \| "Llama-2-13b-chat-old" \| "Llama-2-13b-chat-4bit" \| "Llama-2-7b-chat-old" \| "Llama-2-7b-chat-4bit" |
temperature | number |
tokenizer | undefined |
topP | number |
Overrides
BaseLLM.metadata
Defined in
packages/core/src/llm/LLM.ts:99
Methods
chat
▸ chat(params): Promise<AsyncIterable<{ delta: string; options?: Record<string, unknown> }>>
Parameters
Name | Type |
---|---|
params | LLMChatParamsStreaming<Record<string, unknown>> |
Returns
Promise<AsyncIterable<{ delta: string; options?: Record<string, unknown> }>>
Overrides
BaseLLM.chat
Defined in
packages/core/src/llm/LLM.ts:236
▸ chat(params): Promise<ChatResponse<Record<string, unknown>>>
Parameters
Name | Type |
---|---|
params | LLMChatParamsNonStreaming<Record<string, unknown>> |
Returns
Promise<ChatResponse<Record<string, unknown>>>