Commit 5e6b917

add keep_alive (#36)
1 parent: b7a6839

File tree: 2 files changed (+11, −2 lines)

- README.md (+8, −2)
- src/interfaces.ts (+3, −0)

README.md

Lines changed: 8 additions & 2 deletions
````diff
@@ -21,6 +21,7 @@ console.log(response.message.content)
 ```
 
 ## Streaming responses
+
 Response streaming can be enabled by setting `stream: true`, modifying function calls to return an `AsyncGenerator` where each part is an object in the stream.
 
 ```javascript
@@ -34,6 +35,7 @@ for await (const part of response) {
 ```
 
 ## Create
+
 ```javascript
 import ollama from 'ollama'
 
@@ -45,6 +47,7 @@ await ollama.create({ model: 'example', modelfile: modelfile })
 ```
 
 ## API
+
 The Ollama JavaScript library's API is designed around the [Ollama REST API](https://github.com/jmorganca/ollama/blob/main/docs/api.md)
 
 ### chat
@@ -61,8 +64,9 @@ ollama.chat(request)
     - `content` `<string>`: The content of the message.
     - `images` `<Uint8Array[] | string[]>`: (Optional) Images to be included in the message, either as Uint8Array or base64 encoded strings.
   - `format` `<string>`: (Optional) Set the expected format of the response (`json`).
-  - `options` `<Options>`: (Optional) Options to configure the runtime.
   - `stream` `<boolean>`: (Optional) When true an `AsyncGenerator` is returned.
+  - `keep_alive` `<string | number>`: (Optional) How long to keep the model loaded.
+  - `options` `<Options>`: (Optional) Options to configure the runtime.
 
 - Returns: `<ChatResponse>`
 
@@ -80,8 +84,9 @@ ollama.generate(request)
   - `raw` `<boolean>`: (Optional) Bypass the prompt template and pass the prompt directly to the model.
   - `images` `<Uint8Array[] | string[]>`: (Optional) Images to be included, either as Uint8Array or base64 encoded strings.
   - `format` `<string>`: (Optional) Set the expected format of the response (`json`).
-  - `options` `<Options>`: (Optional) Options to configure the runtime.
   - `stream` `<boolean>`: (Optional) When true an `AsyncGenerator` is returned.
+  - `keep_alive` `<string | number>`: (Optional) How long to keep the model loaded.
+  - `options` `<Options>`: (Optional) Options to configure the runtime.
 - Returns: `<GenerateResponse>`
 
 ### pull
@@ -176,6 +181,7 @@ ollama.embeddings(request)
 - `request` `<Object>`: The request object containing embedding parameters.
   - `model` `<string>` The name of the model used to generate the embeddings.
   - `prompt` `<string>`: The prompt used to generate the embedding.
+  - `keep_alive` `<string | number>`: (Optional) How long to keep the model loaded.
   - `options` `<Options>`: (Optional) Options to configure the runtime.
 - Returns: `<EmbeddingsResponse>`
````
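The new `keep_alive` field travels on the request object itself. A minimal sketch of the resulting request shape, assuming the Ollama REST API's documented semantics (a duration string such as `'10m'`, or a number of seconds); `buildChatRequest` is a hypothetical helper for illustration, not part of the library:

```typescript
// Hypothetical helper showing the request shape; with the real library you
// would pass the same object straight to `ollama.chat(request)`.
function buildChatRequest(
  model: string,
  content: string,
  keepAlive: string | number,
) {
  return {
    model,
    messages: [{ role: 'user', content }],
    // A duration string (e.g. '10m') or a number of seconds to keep the
    // model loaded after the request completes.
    keep_alive: keepAlive,
  }
}

const request = buildChatRequest('llama2', 'Why is the sky blue?', '10m')
console.log(request.keep_alive) // -> '10m'
```

Omitting `keep_alive` leaves the server's default in place; both forms are accepted because the field is typed `string | number`.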

src/interfaces.ts

Lines changed: 3 additions & 0 deletions
````diff
@@ -51,6 +51,7 @@ export interface GenerateRequest {
   raw?: boolean
   format?: string
   images?: Uint8Array[] | string[]
+  keep_alive?: string | number
 
   options?: Partial<Options>
 }
@@ -66,6 +67,7 @@ export interface ChatRequest {
   messages?: Message[]
   stream?: boolean
   format?: string
+  keep_alive?: string | number
 
   options?: Partial<Options>
 }
@@ -112,6 +114,7 @@ export interface ShowRequest {
 export interface EmbeddingsRequest {
   model: string
   prompt: string
+  keep_alive?: string | number
 
   options?: Partial<Options>
 }
````
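The interface change can be exercised directly. Below is a self-contained mirror of the updated `EmbeddingsRequest` (the real definition lives in `src/interfaces.ts`; `Partial<Record<string, unknown>>` stands in for the library's `Partial<Options>` in this sketch):

```typescript
// Local mirror of the updated interface from src/interfaces.ts; the options
// type is a stand-in for the library's `Partial<Options>`.
interface EmbeddingsRequest {
  model: string
  prompt: string
  keep_alive?: string | number
  options?: Partial<Record<string, unknown>>
}

// Both forms type-check against `string | number`.
const byDuration: EmbeddingsRequest = {
  model: 'llama2',
  prompt: 'Why is the sky blue?',
  keep_alive: '5m',
}

const bySeconds: EmbeddingsRequest = {
  model: 'llama2',
  prompt: 'Why is the sky blue?',
  keep_alive: 300,
}

console.log(byDuration.keep_alive, bySeconds.keep_alive)
```

Making the field optional (`keep_alive?`) keeps every existing call site compiling unchanged, which is why all three request interfaces gain it without a breaking change.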
