├── .gitignore ├── LICENSE ├── README.md ├── anthropic.js ├── anthropic_test.js ├── gemini.js ├── gemini_test.js ├── index.d.ts ├── index.js ├── package-lock.json ├── package.json ├── samples ├── anthropic-tools.txt ├── anthropic-tools2.txt ├── anthropic.txt ├── errors.txt ├── gemini-tools.txt ├── gemini-tools2.txt ├── gemini.txt ├── openai-tools.txt ├── openai-tools2.txt ├── openai.txt ├── openrouter.txt └── output.txt └── test.js /.gitignore: -------------------------------------------------------------------------------- 1 | dist/ 2 | node_modules/ 3 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | Copyright 2024 Anand S 2 | 3 | Permission is hereby granted, free of charge, to any person obtaining 4 | a copy of this software and associated documentation files (the 5 | "Software"), to deal in the Software without restriction, including 6 | without limitation the rights to use, copy, modify, merge, publish, 7 | distribute, sublicense, and/or sell copies of the Software, and to 8 | permit persons to whom the Software is furnished to do so, subject to 9 | the following conditions: 10 | 11 | The above copyright notice and this permission notice shall be 12 | included in all copies or substantial portions of the Software. 13 | 14 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, 15 | EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF 16 | MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND 17 | NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE 18 | LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION 19 | OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION 20 | WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. 21 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # asyncLLM 2 | 3 | [![npm version](https://img.shields.io/npm/v/asyncllm.svg)](https://www.npmjs.com/package/asyncllm) 4 | [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT) 5 | 6 | Fetch LLM responses across multiple providers as an async iterable. 7 | 8 | ## Features 9 | 10 | - 🚀 Lightweight (~2KB) and dependency-free 11 | - 🔄 Works with multiple LLM providers (OpenAI, Anthropic, Gemini, and more) 12 | - 🌐 Browser and Node.js compatible 13 | - 📦 Easy to use with ES modules 14 | 15 | ## Installation 16 | 17 | ```bash 18 | npm install asyncllm 19 | ``` 20 | 21 | ## Anthropic and Gemini Adapters 22 | 23 | Adapters convert OpenAI-style request bodies to the [Anthropic](https://docs.anthropic.com/en/api/messages) or [Gemini](https://ai.google.dev/gemini-api/docs/text-generation?lang=rest) formats. For example: 24 | 25 | ```javascript 26 | import { anthropic } from "https://cdn.jsdelivr.net/npm/asyncllm@2/dist/anthropic.js"; 27 | import { gemini } from "https://cdn.jsdelivr.net/npm/asyncllm@2/dist/gemini.js"; 28 | 29 | // Create an OpenAI-style request 30 | const body = { 31 | messages: [{ role: "user", content: "Hello, world!" }], 32 | temperature: 0.5, 33 | }; 34 | 35 | // Fetch request with the Anthropic API 36 | const anthropicResponse = await fetch("https://api.anthropic.com/v1/messages", { 37 | method: "POST", 38 | headers: { "Content-Type": "application/json", "x-api-key": "YOUR_API_KEY" }, 39 | // anthropic() converts the OpenAI-style request to Anthropic's format 40 | body: JSON.stringify(anthropic({ ...body, model: "claude-3-haiku-20240307" })), 41 | }).then((r) => r.json()); 42 | 43 | // Fetch request with the Gemini API 44 | const geminiResponse = await fetch( 45 | "https://generativelanguage.googleapis.com/v1beta/models/gemini-1.5-flash-8b:generateContent", 46 | { 47 | method: "POST", 48 | headers: { "Content-Type": "application/json", Authorization: `Bearer YOUR_API_KEY` }, 49 | // gemini() converts the OpenAI-style request to Gemini's format 50 | body: JSON.stringify(gemini(body)), 51 | }, 52 | ).then((r) => r.json()); 53 | ``` 54 | 55 | Here are the parameters supported by each provider. 56 | 57 | | OpenAI Parameter | Anthropic | Gemini | 58 | | ----------------------------------- | --------- | ------ | 59 | | messages | Y | Y | 60 | | system message | Y | Y | 61 | | temperature | Y | Y | 62 | | max_tokens | Y | Y | 63 | | top_p | Y | Y | 64 | | stop sequences | Y | Y | 65 | | stream | Y | Y | 66 | | presence_penalty | | Y | 67 | | frequency_penalty | | Y | 68 | | logprobs | | Y | 69 | | top_logprobs | | Y | 70 | | n (multiple candidates) | | Y | 71 | | metadata.user_id | Y | | 72 | | tools/functions | Y | Y | 73 | | tool_choice | Y | Y | 74 | | parallel_tool_calls | Y | | 75 | | response_format.type: "json_object" | | Y | 76 | | response_format.type: "json_schema" | | Y | 77 | 78 | Content types: 79 | 80 | | OpenAI | Anthropic | Gemini | 81 | | ------ | --------- | ------ | 82 | | Text | Y | Y | 83 | | Images | Y | Y | 84 | | Audio | | Y | 85 | 86 | Image Sources 87 | 88 | | OpenAI Parameter | Anthropic | Gemini | 89 | | ---------------- | --------- | ------ | 90 | | Data URI | Y | Y | 91 | | External URLs | | Y | 92 | 93 | ## Streaming 94 | 95 | Call `asyncLLM()` just like you would use `fetch` with any LLM provider with streaming responses. 96 | 97 | - [OpenAI Streaming](https://platform.openai.com/docs/api-reference/chat/streaming). Many providers like Azure, Groq, OpenRouter, etc. follow the OpenAI API. 98 | - [Anthropic Streaming](https://docs.anthropic.com/en/api/messages-streaming) 99 | - [Gemini Streaming](https://ai.google.dev/gemini-api/docs/text-generation?lang=rest#generate-a-text-stream) 100 | 101 | The result is an async generator that yields objects with `content`, `tool`, and `args` properties. 102 | 103 | For example, to update the DOM with the LLM's response: 104 | 105 | ```html 106 | 107 | 108 | 109 |
110 | 111 | 112 | 135 | 136 | ``` 137 | 138 | ### Node.js or bundled projects 139 | 140 | ```javascript 141 | import { asyncLLM } from "asyncllm"; 142 | 143 | // Usage is the same as in the browser example 144 | ``` 145 | 146 | ## Examples 147 | 148 | ### OpenAI streaming 149 | 150 | ```javascript 151 | import { asyncLLM } from "https://cdn.jsdelivr.net/npm/asyncllm@2"; 152 | 153 | const body = { 154 | model: "gpt-4o-mini", 155 | // You MUST enable streaming, else the API will return an {error} 156 | stream: true, 157 | messages: [{ role: "user", content: "Hello, world!" }], 158 | }; 159 | 160 | for await (const data of asyncLLM("https://api.openai.com/v1/chat/completions", { 161 | method: "POST", 162 | headers: { "Content-Type": "application/json", Authorization: `Bearer ${apiKey}` }, 163 | body: JSON.stringify(body), 164 | })) { 165 | console.log(data); 166 | } 167 | ``` 168 | 169 | This will log something like this on the console: 170 | 171 | ```js 172 | { content: "", tool: undefined, args: undefined, message: { "id": "chatcmpl-...", ...} } 173 | { content: "Hello", tool: undefined, args: undefined, message: { "id": "chatcmpl-...", ...} } 174 | { content: "Hello!", tool: undefined, args: undefined, message: { "id": "chatcmpl-...", ...} } 175 | { content: "Hello! How", tool: undefined, args: undefined, message: { "id": "chatcmpl-...", ...} } 176 | ... 177 | { content: "Hello! How can I assist you today?", tool: undefined, args: undefined, message: { "id": "chatcmpl-...", ...} } 178 | ``` 179 | 180 | ### Anthropic streaming 181 | 182 | The package includes an Anthropic adapter that converts OpenAI-style requests to Anthropic's format, 183 | allowing you to use the same code structure across providers. 184 | 185 | ```javascript 186 | import { asyncLLM } from "https://cdn.jsdelivr.net/npm/asyncllm@2"; 187 | import { anthropic } from "https://cdn.jsdelivr.net/npm/asyncllm@2/dist/anthropic.js"; 188 | 189 | // You can use the anthropic() adapter to convert OpenAI-style requests to Anthropic's format. 190 | const body = anthropic({ 191 | // Same as OpenAI example above 192 | }); 193 | 194 | // Or you can use the asyncLLM() function directly with the Anthropic API endpoint. 195 | const body = { 196 | model: "claude-3-haiku-20240307", 197 | // You MUST enable streaming, else the API will return an {error} 198 | stream: true, 199 | max_tokens: 10, 200 | messages: [{ role: "user", content: "What is 2 + 2" }], 201 | }; 202 | 203 | for await (const data of asyncLLM("https://api.anthropic.com/v1/messages", { 204 | headers: { "Content-Type": "application/json", "x-api-key": apiKey }, 205 | body: JSON.stringify(body), 206 | })) { 207 | console.log(data); 208 | } 209 | ``` 210 | 211 | ### Gemini streaming 212 | 213 | The package includes a Gemini adapter that converts OpenAI-style requests to Gemini's format, 214 | allowing you to use the same code structure across providers. 215 | 216 | ```javascript 217 | import { asyncLLM } from "https://cdn.jsdelivr.net/npm/asyncllm@2"; 218 | import { gemini } from "https://cdn.jsdelivr.net/npm/asyncllm@2/dist/gemini.js"; 219 | 220 | // You can use the gemini() adapter to convert OpenAI-style requests to Gemini's format. 221 | const body = gemini({ 222 | // Same as OpenAI example above 223 | }); 224 | 225 | // Or you can use the asyncLLM() function directly with the Gemini API endpoint. 226 | const body = { 227 | contents: [{ role: "user", parts: [{ text: "What is 2+2?" }] }], 228 | }; 229 | 230 | for await (const data of asyncLLM( 231 | // You MUST use a streaming endpoint, else the API will return an {error} 232 | "https://generativelanguage.googleapis.com/v1beta/models/gemini-1.5-flash-8b:streamGenerateContent?alt=sse", 233 | { 234 | method: "POST", 235 | headers: { 236 | "Content-Type": "application/json", 237 | Authorization: `Bearer ${apiKey}`, 238 | }, 239 | body: JSON.stringify(body), 240 | }, 241 | )) { 242 | console.log(data); 243 | } 244 | ``` 245 | 246 | ### Function Calling 247 | 248 | asyncLLM supports function calling (aka tools). Here's an example with OpenAI: 249 | 250 | ```javascript 251 | for await (const { tools } of asyncLLM("https://api.openai.com/v1/chat/completions", { 252 | method: "POST", 253 | headers: { 254 | "Content-Type": "application/json", 255 | Authorization: `Bearer ${apiKey}`, 256 | }, 257 | body: JSON.stringify({ 258 | model: "gpt-4o-mini", 259 | stream: true, 260 | messages: [ 261 | { role: "system", content: "Get delivery date for order" }, 262 | { role: "user", content: "Order ID: 123456" }, 263 | ], 264 | tool_choice: "required", 265 | tools: [ 266 | { 267 | type: "function", 268 | function: { 269 | name: "get_delivery_date", 270 | parameters: { type: "object", properties: { order_id: { type: "string" } }, required: ["order_id"] }, 271 | }, 272 | }, 273 | ], 274 | }), 275 | })) { 276 | console.log(JSON.stringify(tools)); 277 | } 278 | ``` 279 | 280 | `tools` is an array of objects with `name`, `id` (for Anthropic and OpenAI, not Gemini), and `args` properties. It streams like this: 281 | 282 | ```json 283 | [{"name":"get_delivery_date","id":"call_F8YHCjnzrrTjfE4YSSpVW2Bc","args":""}] 284 | [{"name":"get_delivery_date","id":"call_F8YHCjnzrrTjfE4YSSpVW2Bc","args":"{\""}] 285 | [{"name":"get_delivery_date","id":"call_F8YHCjnzrrTjfE4YSSpVW2Bc","args":"{\"order"}] 286 | [{"name":"get_delivery_date","id":"call_F8YHCjnzrrTjfE4YSSpVW2Bc","args":"{\"order_id"}] 287 | [{"name":"get_delivery_date","id":"call_F8YHCjnzrrTjfE4YSSpVW2Bc","args":"{\"order_id\":\""}] 288 | [{"name":"get_delivery_date","id":"call_F8YHCjnzrrTjfE4YSSpVW2Bc","args":"{\"order_id\":\"123"}] 289 | [{"name":"get_delivery_date","id":"call_F8YHCjnzrrTjfE4YSSpVW2Bc","args":"{\"order_id\":\"123456"}] 290 | [{"name":"get_delivery_date","id":"call_F8YHCjnzrrTjfE4YSSpVW2Bc","args":"{\"order_id\":\"123456\"}"}] 291 | ``` 292 | 293 | Use a library like [partial-json](https://www.npmjs.com/package/partial-json) to parse the `args` incrementally. 294 | 295 | ### Streaming Config 296 | 297 | asyncLLM accepts a `config` object with the following properties: 298 | 299 | - `fetch`: Custom fetch implementation (defaults to global `fetch`). 300 | - `onResponse`: Async callback function that receives the Response object before streaming begins. If the callback returns a promise, it will be awaited before continuing the stream. 301 | 302 | Here's how you can use a custom fetch implementation: 303 | 304 | ```javascript 305 | import { asyncLLM } from "https://cdn.jsdelivr.net/npm/asyncllm@2"; 306 | 307 | const body = { 308 | // Same as OpenAI example above 309 | }; 310 | 311 | // Optional configuration. You can ignore it for most use cases. 312 | const config = { 313 | onResponse: async (response) => { 314 | console.log(response.status, response.headers); 315 | }, 316 | // You can use a custom fetch implementation if needed 317 | fetch: fetch, 318 | }; 319 | 320 | for await (const { content } of asyncLLM( 321 | "https://api.openai.com/v1/chat/completions", 322 | { 323 | method: "POST", 324 | headers: { "Content-Type": "application/json", Authorization: `Bearer ${apiKey}` }, 325 | body: JSON.stringify(body), 326 | }, 327 | config, 328 | )) { 329 | console.log(content); 330 | } 331 | ``` 332 | 333 | ## Streaming from text 334 | 335 | You can parse streamed SSE events from a text string (e.g. from a cached response) using the provided `fetchText` helper: 336 | 337 | ```javascript 338 | import { asyncLLM } from "https://cdn.jsdelivr.net/npm/asyncllm@2"; 339 | import { fetchText } from "https://cdn.jsdelivr.net/npm/asyncsse@1/dist/fetchtext.js"; 340 | 341 | const text = ` 342 | data: {"candidates": [{"content": {"parts": [{"text": "2"}],"role": "model"}}]} 343 | 344 | data: {"candidates": [{"content": {"parts": [{"text": " + 2 = 4\\n"}],"role": "model"}}]} 345 | 346 | data: {"candidates": [{"content": {"parts": [{"text": ""}],"role": "model"}}]} 347 | `; 348 | 349 | // Stream events from text 350 | for await (const event of asyncLLM(text, {}, { fetch: fetchText })) { 351 | console.log(event); 352 | } 353 | ``` 354 | 355 | This outputs: 356 | 357 | ``` 358 | { data: "Hello" } 359 | { data: "World" } 360 | ``` 361 | 362 | This is particularly useful for testing SSE parsing without making actual HTTP requests. 363 | 364 | ### Error handling 365 | 366 | If an error occurs, it will be yielded in the `error` property. For example: 367 | 368 | ```javascript 369 | for await (const { content, error } of asyncLLM("https://api.openai.com/v1/chat/completions", { 370 | method: "POST", 371 | // ... 372 | })) { 373 | if (error) console.error(error); 374 | else console.log(content); 375 | } 376 | ``` 377 | 378 | The `error` property is set if: 379 | 380 | - The underlying API (e.g. OpenAI, Anthropic, Gemini) returns an error in the response (e.g. `error.message` or `message.error` or `error`) 381 | - The fetch request fails (e.g. network error) 382 | - The response body cannot be parsed as JSON 383 | 384 | ### `asyncLLM(request: string | Request, options?: RequestInit, config?: SSEConfig): AsyncGenerator` 385 | 386 | Fetches streaming responses from LLM providers and yields events. 387 | 388 | - `request`: The URL or Request object for the LLM API endpoint 389 | - `options`: Optional [fetch options](https://developer.mozilla.org/en-US/docs/Web/API/fetch#parameters) 390 | - `config`: Optional configuration object for SSE handling 391 | - `fetch`: Custom fetch implementation (defaults to global fetch) 392 | - `onResponse`: Async callback function that receives the Response object before streaming begins. If the callback returns a promise, it will be awaited before continuing the stream. 393 | 394 | Returns an async generator that yields [`LLMEvent` objects](#llmevent). 395 | 396 | #### LLMEvent 397 | 398 | - `content`: The text content of the response 399 | - `tools`: Array of tool call objects with: 400 | - `name`: The name of the tool being called 401 | - `args`: The arguments for the tool call as a JSON-encoded string, e.g. `{"order_id":"123456"}` 402 | - `id`: Optional unique identifier for the tool call (e.g. OpenAI's `call_F8YHCjnzrrTjfE4YSSpVW2Bc` or Anthropic's `toolu_01T1x1fJ34qAmk2tNTrN7Up6`. Gemini does not return an id.) 403 | - `message`: The raw message object from the LLM provider (may include id, model, usage stats, etc.) 404 | - `error`: Error message if the request fails 405 | 406 | ## Changelog 407 | 408 | - 2.1.2: Update repo links 409 | - 2.1.1: Document standalone adapter usage 410 | - 2.1.0: Added `id` to tools to support unique tool call identifiers from providers 411 | - 2.0.1: Multiple tools support. 412 | - Breaking change: `tool` and `args` are not part of the response. Instead, it has `tools`, an array of `{ name, args }` 413 | - Fixed Gemini adapter to return `toolConfig` instead of `toolsConfig` 414 | - 1.2.2: Added streaming from text documentation via `config.fetch`. Upgrade to asyncSSE 1.3.1 (bug fix). 415 | - 1.2.1: Added `config.fetch` for custom fetch implementation 416 | - 1.2.0: Added `config.onResponse(response)` that receives the Response object before streaming begins 417 | - 1.1.3: Ensure `max_tokens` for Anthropic. Improve error handling 418 | - 1.1.1: Added [Anthropic adapter](#anthropic) 419 | - 1.1.0: Added [Gemini adapter](#gemini) 420 | - 1.0.0: Initial release with [asyncLLM](#asyncllm) and [LLMEvent](#llmevent) 421 | 422 | ## Contributing 423 | 424 | Contributions are welcome! Please feel free to submit a Pull Request. 425 | 426 | ## License 427 | 428 | This project is licensed under the MIT License - see the [LICENSE](LICENSE) file for details. 429 | -------------------------------------------------------------------------------- /anthropic.js: -------------------------------------------------------------------------------- 1 | /** 2 | * Convert an OpenAI body to an Anthropic body 3 | * @param {Object} body 4 | * @returns {Object} 5 | */ 6 | export function anthropic(body) { 7 | // System messages are specified at the top level in Anthropic 8 | const system = body.messages.find((msg) => msg.role === "system"); 9 | 10 | // Convert messages 11 | const messages = body.messages 12 | .filter((msg) => msg.role !== "system") 13 | .map((msg) => ({ 14 | role: msg.role, 15 | // Handle both text and binary content (images) 16 | content: Array.isArray(msg.content) 17 | ? msg.content.map(({ type, text, image_url }) => { 18 | if (type === "text") return { type: "text", text }; 19 | else if (type === "image_url") 20 | return { 21 | type: "image", 22 | source: anthropicSourceFromURL(image_url.url), 23 | }; 24 | // Anthropic doesn't support audio 25 | }) 26 | : msg.content, 27 | })); 28 | 29 | const parallel_tool_calls = 30 | typeof body.parallel_tool_calls == "boolean" ? { disable_parallel_tool_use: !body.parallel_tool_calls } : {}; 31 | // Map OpenAI parameters to Anthropic equivalents, only including if defined 32 | const params = { 33 | model: body.model, 34 | max_tokens: body.max_tokens ?? 4096, 35 | ...(body.metadata?.user_id ? { metadata: { user_id: body.metadata?.user_id } } : {}), 36 | ...(typeof body.stream == "boolean" ? { stream: body.stream } : {}), 37 | ...(typeof body.temperature == "number" ? { temperature: body.temperature } : {}), 38 | ...(typeof body.top_p == "number" ? { top_p: body.top_p } : {}), 39 | // Convert single string or array of stop sequences 40 | ...(typeof body.stop == "string" 41 | ? { stop_sequences: [body.stop] } 42 | : Array.isArray(body.stop) 43 | ? { stop_sequences: body.stop } 44 | : {}), 45 | // Anthropic does not support JSON mode 46 | // Convert OpenAI tool_choice to Anthropic's tools_choice 47 | ...(body.tool_choice == "auto" 48 | ? { tool_choice: { type: "auto", ...parallel_tool_calls } } 49 | : body.tool_choice == "required" 50 | ? { tool_choice: { type: "any", ...parallel_tool_calls } } 51 | : body.tool_choice == "none" 52 | ? {} 53 | : typeof body.tool_choice == "object" 54 | ? { 55 | tool_choice: { 56 | type: "tool", 57 | name: body.tool_choice.function?.name, 58 | ...parallel_tool_calls, 59 | }, 60 | } 61 | : {}), 62 | }; 63 | 64 | // Convert function definitions to Anthropic's tool format 65 | const tools = body.tools?.map((tool) => ({ 66 | name: tool.function.name, 67 | description: tool.function.description, 68 | input_schema: tool.function.parameters, 69 | })); 70 | 71 | // Only include optional configs if they exist 72 | return { 73 | ...(system ? { system: system.content } : {}), 74 | messages, 75 | ...params, 76 | ...(body.tools ? { tools } : {}), 77 | }; 78 | } 79 | 80 | // Handle data URIs in Anthropic's format. External URLs are not supported. 81 | const anthropicSourceFromURL = (url) => { 82 | if (url.startsWith("data:")) { 83 | const [base, base64Data] = url.split(","); 84 | return { 85 | type: "base64", 86 | media_type: base.replace("data:", "").replace(";base64", ""), 87 | data: base64Data, 88 | }; 89 | } 90 | }; 91 | -------------------------------------------------------------------------------- /anthropic_test.js: -------------------------------------------------------------------------------- 1 | import { anthropic } from "./anthropic.js"; 2 | 3 | function assertEquals(actual, expected, message) { 4 | if (JSON.stringify(actual) === JSON.stringify(expected)) return; 5 | throw new Error( 6 | message || `Expected:\n${JSON.stringify(expected, null, 2)}. Actual:\n${JSON.stringify(actual, null, 2)}`, 7 | ); 8 | } 9 | 10 | // 1. System message handling 11 | Deno.test("anthropic - system message handling", () => { 12 | const input = { 13 | messages: [ 14 | { role: "system", content: "You are helpful" }, 15 | { role: "user", content: "Hi" }, 16 | ], 17 | }; 18 | 19 | const expected = { 20 | system: "You are helpful", 21 | messages: [{ role: "user", content: "Hi" }], 22 | max_tokens: 4096, 23 | }; 24 | 25 | assertEquals(anthropic(input), expected); 26 | }); 27 | 28 | // 2. Basic message conversion 29 | Deno.test("anthropic - basic message conversion", () => { 30 | const input = { 31 | messages: [{ role: "user", content: "Hello" }], 32 | }; 33 | 34 | const expected = { 35 | messages: [{ role: "user", content: "Hello" }], 36 | max_tokens: 4096, 37 | }; 38 | 39 | assertEquals(anthropic(input), expected); 40 | }); 41 | 42 | // 2b. Multimodal content handling 43 | Deno.test("anthropic - multimodal content", () => { 44 | const input = { 45 | messages: [ 46 | { 47 | role: "user", 48 | content: [ 49 | { type: "text", text: "What's in this image?" }, 50 | { 51 | type: "image_url", 52 | image_url: { url: "" }, 53 | }, 54 | ], 55 | }, 56 | ], 57 | }; 58 | 59 | const expected = { 60 | messages: [ 61 | { 62 | role: "user", 63 | content: [ 64 | { type: "text", text: "What's in this image?" }, 65 | { 66 | type: "image", 67 | source: { 68 | type: "base64", 69 | media_type: "image/jpeg", 70 | data: "abc123", 71 | }, 72 | }, 73 | ], 74 | }, 75 | ], 76 | max_tokens: 4096, 77 | }; 78 | 79 | assertEquals(anthropic(input), expected); 80 | }); 81 | 82 | // 3. Parameter conversion 83 | Deno.test("anthropic - parameter conversion", () => { 84 | const input = { 85 | messages: [{ role: "user", content: "Hi" }], 86 | model: "claude-3-5-sonnet-20241002", 87 | max_tokens: 100, 88 | metadata: { user_id: "123" }, 89 | stream: true, 90 | temperature: 0.7, 91 | top_p: 0.9, 92 | stop: ["END"], 93 | }; 94 | 95 | const expected = { 96 | messages: [{ role: "user", content: "Hi" }], 97 | model: "claude-3-5-sonnet-20241002", 98 | max_tokens: 100, 99 | metadata: { user_id: "123" }, 100 | stream: true, 101 | temperature: 0.7, 102 | top_p: 0.9, 103 | stop_sequences: ["END"], 104 | }; 105 | 106 | assertEquals(anthropic(input), expected); 107 | }); 108 | 109 | // 3b. Array stop sequences 110 | Deno.test("anthropic - array stop sequences", () => { 111 | const input = { 112 | messages: [{ role: "user", content: "Hi" }], 113 | stop: ["STOP", "END"], 114 | }; 115 | 116 | const expected = { 117 | messages: [{ role: "user", content: "Hi" }], 118 | max_tokens: 4096, 119 | stop_sequences: ["STOP", "END"], 120 | }; 121 | 122 | assertEquals(anthropic(input), expected); 123 | }); 124 | 125 | // 4. Tool handling 126 | Deno.test("anthropic - tool calling configurations", () => { 127 | const input = { 128 | messages: [{ role: "user", content: "Hi" }], 129 | tool_choice: "auto", 130 | parallel_tool_calls: true, 131 | tools: [ 132 | { 133 | function: { 134 | name: "get_weather", 135 | description: "Get weather info", 136 | parameters: { 137 | type: "object", 138 | properties: { location: { type: "string" } }, 139 | }, 140 | }, 141 | }, 142 | ], 143 | }; 144 | 145 | const expected = { 146 | messages: [{ role: "user", content: "Hi" }], 147 | max_tokens: 4096, 148 | tool_choice: { type: "auto", disable_parallel_tool_use: false }, 149 | tools: [ 150 | { 151 | name: "get_weather", 152 | description: "Get weather info", 153 | input_schema: { 154 | type: "object", 155 | properties: { location: { type: "string" } }, 156 | }, 157 | }, 158 | ], 159 | }; 160 | 161 | assertEquals(anthropic(input), expected); 162 | }); 163 | 164 | // 4b. Specific tool choice 165 | Deno.test("anthropic - specific tool choice", () => { 166 | const input = { 167 | messages: [{ role: "user", content: "Hi" }], 168 | tool_choice: { function: { name: "get_weather" } }, 169 | }; 170 | 171 | const expected = { 172 | messages: [{ role: "user", content: "Hi" }], 173 | max_tokens: 4096, 174 | tool_choice: { type: "tool", name: "get_weather" }, 175 | }; 176 | 177 | assertEquals(anthropic(input), expected); 178 | }); 179 | -------------------------------------------------------------------------------- /gemini.js: -------------------------------------------------------------------------------- 1 | /** 2 | * Convert an OpenAI body to a Gemini body 3 | * @param {Object} body 4 | * @returns {Object} 5 | */ 6 | export function gemini(body) { 7 | // System messages live in a separate object in Gemini 8 | const systemMessage = body.messages.find((msg) => msg.role === "system"); 9 | const systemInstruction = systemMessage ? { systemInstruction: { parts: [{ text: systemMessage.content }] } } : {}; 10 | 11 | // Convert messages: Gemini uses "model" instead of "assistant" and has different content structure 12 | const contents = body.messages 13 | .filter((msg) => msg.role !== "system") 14 | .map((msg) => ({ 15 | role: msg.role == "assistant" ? "model" : msg.role, 16 | // Handle both text and binary content (images/audio) 17 | parts: Array.isArray(msg.content) 18 | ? msg.content.map(({ type, text, image_url, input_audio }) => { 19 | if (type === "text") return { text }; 20 | else if (type === "image_url") return geminiPartFromURL(image_url.url); 21 | else if (type == "input_audio") return geminiPartFromURL(input_audio.data); 22 | }) 23 | : [{ text: msg.content }], 24 | })); 25 | 26 | // Map OpenAI parameters to Gemini equivalents, only including if defined 27 | const generationConfig = { 28 | ...(typeof body.temperature == "number" ? { temperature: body.temperature } : {}), 29 | ...(typeof body.max_tokens == "number" ? { maxOutputTokens: body.max_tokens } : {}), 30 | ...(typeof body.max_completion_tokens == "number" ? { maxOutputTokens: body.max_completion_tokens } : {}), 31 | ...(typeof body.top_p == "number" ? { topP: body.top_p } : {}), 32 | ...(typeof body.presence_penalty == "number" ? { presencePenalty: body.presence_penalty } : {}), 33 | ...(typeof body.frequency_penalty == "number" ? { frequencyPenalty: body.frequency_penalty } : {}), 34 | ...(typeof body.logprobs == "boolean" ? { responseLogprobs: body.logprobs } : {}), 35 | ...(typeof body.top_logprobs == "number" ? { logprobs: body.top_logprobs } : {}), 36 | ...(typeof body.n == "number" ? { candidateCount: body.n } : {}), 37 | // Convert single string or array of stop sequences 38 | ...(typeof body.stop == "string" 39 | ? { stopSequences: [body.stop] } 40 | : Array.isArray(body.stop) 41 | ? { stopSequences: body.stop } 42 | : {}), 43 | // Handle JSON response formatting and schemas 44 | ...(body.response_format?.type == "json_object" 45 | ? { responseMimeType: "application/json" } 46 | : body.response_format?.type == "json_schema" 47 | ? { 48 | responseMimeType: "application/json", 49 | responseSchema: geminiSchema(structuredClone(body.response_format?.json_schema?.schema)), 50 | } 51 | : {}), 52 | }; 53 | 54 | // Convert OpenAI tool_choice to Gemini's function calling modes 55 | const toolConfig = 56 | body.tool_choice == "auto" 57 | ? { function_calling_config: { mode: "AUTO" } } 58 | : body.tool_choice == "required" 59 | ? { function_calling_config: { mode: "ANY" } } 60 | : body.tool_choice == "none" 61 | ? { function_calling_config: { mode: "NONE" } } 62 | : typeof body.tool_choice == "object" 63 | ? { 64 | function_calling_config: { 65 | mode: "ANY", 66 | allowed_function_names: [body.tool_choice.function?.name], 67 | }, 68 | } 69 | : {}; 70 | 71 | // Convert function definitions to Gemini's tool format 72 | const tools = body.tools 73 | ? { 74 | functionDeclarations: body.tools.map((tool) => ({ 75 | name: tool.function.name, 76 | description: tool.function.description, 77 | parameters: geminiSchema(structuredClone(tool.function.parameters)), 78 | })), 79 | } 80 | : {}; 81 | 82 | // Only include optional configs if they exist 83 | return { 84 | ...systemInstruction, 85 | contents, 86 | ...(Object.keys(generationConfig).length > 0 ? { generationConfig } : {}), 87 | ...(body.tool_choice ? { toolConfig } : {}), 88 | ...(body.tools ? { tools } : {}), 89 | }; 90 | } 91 | 92 | // Handle both data URIs and external URLs in Gemini's required format 93 | const geminiPartFromURL = (url) => { 94 | if (url.startsWith("data:")) { 95 | const [base, base64Data] = url.split(","); 96 | return { 97 | inlineData: { 98 | mimeType: base.replace("data:", "").replace(";base64", ""), 99 | data: base64Data, 100 | }, 101 | }; 102 | } 103 | return { fileData: { fileUri: url } }; 104 | }; 105 | 106 | // Gemini doesn't support additionalProperties in schemas. Recursively remove it. 107 | function geminiSchema(obj) { 108 | if (Array.isArray(obj)) obj.forEach(geminiSchema); 109 | else if (obj && typeof obj === "object") { 110 | for (const key in obj) { 111 | if (key === "additionalProperties") delete obj[key]; 112 | else geminiSchema(obj[key]); 113 | } 114 | } 115 | return obj; 116 | } 117 | -------------------------------------------------------------------------------- /gemini_test.js: -------------------------------------------------------------------------------- 1 | import { gemini } from "./gemini.js"; 2 | 3 | function assertEquals(actual, expected, message) { 4 | if (JSON.stringify(actual) === JSON.stringify(expected)) return; 5 | throw new Error( 6 | message || `Expected:\n${JSON.stringify(expected, null, 2)}. Actual:\n${JSON.stringify(actual, null, 2)}`, 7 | ); 8 | } 9 | 10 | Deno.test("gemini - basic message conversion", () => { 11 | const input = { 12 | messages: [{ role: "user", content: "Hello" }], 13 | }; 14 | 15 | const expected = { 16 | contents: [{ role: "user", parts: [{ text: "Hello" }] }], 17 | }; 18 | 19 | assertEquals(gemini(input), expected); 20 | }); 21 | 22 | Deno.test("gemini - system message handling", () => { 23 | const input = { 24 | messages: [ 25 | { role: "system", content: "You are helpful" }, 26 | { role: "user", content: "Hi" }, 27 | ], 28 | }; 29 | 30 | const expected = { 31 | systemInstruction: { parts: [{ text: "You are helpful" }] }, 32 | contents: [{ role: "user", parts: [{ text: "Hi" }] }], 33 | }; 34 | 35 | assertEquals(gemini(input), expected); 36 | }); 37 | 38 | Deno.test("gemini - assistant message conversion", () => { 39 | const input = { 40 | messages: [ 41 | { role: "user", content: "Hi" }, 42 | { role: "assistant", content: "Hello" }, 43 | ], 44 | }; 45 | 46 | const expected = { 47 | contents: [ 48 | { role: "user", parts: [{ text: "Hi" }] }, 49 | { role: "model", parts: [{ text: "Hello" }] }, 50 | ], 51 | }; 52 | 53 | assertEquals(gemini(input), expected); 54 | }); 55 | 56 | Deno.test("gemini - multimodal content", () => { 57 | const input = { 58 | messages: [ 59 | { 60 | role: "user", 61 | content: [ 62 | { type: "text", text: "What's in this image?" }, 63 | { 64 | type: "image_url", 65 | image_url: { url: "" }, 66 | }, 67 | { 68 | type: "input_audio", 69 | input_audio: { data: "https://example.com/audio.mp3" }, 70 | }, 71 | ], 72 | }, 73 | ], 74 | }; 75 | 76 | const expected = { 77 | contents: [ 78 | { 79 | role: "user", 80 | parts: [ 81 | { text: "What's in this image?" }, 82 | { inlineData: { mimeType: "image/jpeg", data: "abc123" } }, 83 | { fileData: { fileUri: "https://example.com/audio.mp3" } }, 84 | ], 85 | }, 86 | ], 87 | }; 88 | 89 | assertEquals(gemini(input), expected); 90 | }); 91 | 92 | Deno.test("gemini - generation config parameters", () => { 93 | const input = { 94 | messages: [{ role: "user", content: "Hi" }], 95 | temperature: 0.7, 96 | max_tokens: 100, 97 | top_p: 0.9, 98 | presence_penalty: 0.5, 99 | frequency_penalty: 0.5, 100 | logprobs: true, 101 | top_logprobs: 3, 102 | n: 2, 103 | stop: ["END"], 104 | response_format: { type: "json_object" }, 105 | }; 106 | 107 | const expected = { 108 | contents: [{ role: "user", parts: [{ text: "Hi" }] }], 109 | generationConfig: { 110 | temperature: 0.7, 111 | maxOutputTokens: 100, 112 | topP: 0.9, 113 | presencePenalty: 0.5, 114 | frequencyPenalty: 0.5, 115 | responseLogprobs: true, 116 | logprobs: 3, 117 | candidateCount: 2, 118 | stopSequences: ["END"], 119 | responseMimeType: "application/json", 120 | }, 121 | }; 122 | 123 | assertEquals(gemini(input), expected); 124 | }); 125 | 126 | Deno.test("gemini - tool calling configurations", () => { 127 | const input = { 128 | messages: [{ role: "user", content: "Hi" }], 129 | tool_choice: "auto", 130 | tools: [ 131 | { 132 | function: { 133 | name: "get_weather", 134 | description: "Get weather info", 135 | parameters: { 136 | type: "object", 137 | properties: { location: { type: "string" } }, 138 | required: ["location"], 139 | additionalProperties: false, 140 | }, 141 | }, 142 | }, 143 | ], 144 | }; 145 | 146 | const expected = { 147 | contents: [{ role: "user", parts: [{ text: "Hi" }] }], 148 | toolConfig: { function_calling_config: { mode: "AUTO" } }, 149 | tools: { 150 | functionDeclarations: [ 151 | { 152 | name: "get_weather", 153 | description: "Get weather info", 154 | parameters: { 155 | type: "object", 156 | properties: { location: { type: "string" } }, 157 | required: ["location"], 158 | }, 159 | }, 160 | ], 161 | }, 162 | }; 163 | 164 | assertEquals(gemini(input), expected); 165 | }); 166 | 167 | Deno.test("gemini - specific tool choice", () => { 168 | const input = { 169 | messages: [{ role: "user", content: "Hi" }], 170 | tool_choice: { function: { name: "get_weather" } }, 171 | }; 172 | 173 | const expected = { 174 | contents: [{ role: "user", parts: [{ text: "Hi" }] }], 175 | toolConfig: { 176 | function_calling_config: { 177 | mode: "ANY", 178 | allowed_function_names: ["get_weather"], 179 | }, 180 | }, 181 | }; 182 | 183 | assertEquals(gemini(input), expected); 184 | }); 185 | 186 | Deno.test("gemini - json schema response format", () => { 187 | const input = { 188 | messages: [{ role: "user", content: "Hi" }], 189 | response_format: { 190 | type: "json_schema", 191 | json_schema: { 192 | schema: { 193 | type: "object", 194 | properties: { 195 | name: { type: "string" }, 196 | age: { type: "number" }, 197 | additionalProperties: false, 198 | }, 199 | }, 200 | }, 201 | }, 202 | }; 203 | 204 | const expected = { 205 | contents: [{ role: "user", parts: [{ text: "Hi" }] }], 206 | generationConfig: { 207 | responseMimeType: "application/json", 208 | responseSchema: { 209 | type: "object", 210 | properties: { name: { type: "string" }, age: { type: "number" } }, 211 | }, 212 | }, 213 | }; 214 | 215 | assertEquals(gemini(input), expected); 216 | }); 217 | 218 | Deno.test("gemini - required tool choice", () => { 219 | const input = { 220 | messages: [{ role: "user", content: "Hi" }], 221 | tool_choice: "required", 222 | }; 223 | 224 | const expected = { 225 | contents: [{ role: "user", parts: [{ text: "Hi" }] }], 226 | toolConfig: { function_calling_config: { mode: "ANY" } }, 227 | }; 228 | 229 | assertEquals(gemini(input), expected); 230 | }); 231 | 232 | Deno.test("gemini - none tool choice", () => { 233 | const input = { 234 | messages: [{ role: "user", content: "Hi" }], 235 | tool_choice: "none", 236 | }; 237 | 238 | const expected = { 239 | contents: [{ role: "user", parts: [{ text: "Hi" }] }], 240 | toolConfig: { function_calling_config: { mode: "NONE" } }, 241 | }; 242 | 243 | assertEquals(gemini(input), expected); 244 | }); 245 | 246 | Deno.test("gemini - string stop sequence", () => { 247 | const input = { messages: [{ role: "user", content: "Hi" }], stop: "STOP" }; 248 | 249 | const expected = { 250 | contents: [{ role: "user", parts: [{ text: "Hi" }] }], 251 | generationConfig: { stopSequences: ["STOP"] }, 252 | }; 253 | 254 | assertEquals(gemini(input), expected); 255 | }); 256 | 257 | Deno.test("gemini - max_completion_tokens parameter", () => { 258 | const input = { 259 | messages: [{ role: "user", content: "Hi" }], 260 | max_completion_tokens: 150, 261 | }; 262 | 263 | const expected = { 264 | contents: [{ role: "user", parts: [{ text: "Hi" }] }], 265 | generationConfig: { maxOutputTokens: 150 }, 266 | }; 267 | 268 | assertEquals(gemini(input), expected); 269 | }); 270 | -------------------------------------------------------------------------------- /index.d.ts: -------------------------------------------------------------------------------- 1 | import { SSEConfig } from "asyncsse"; 2 | 3 | export interface LLMTool { 4 | id?: string; 5 | name?: string; 6 | args?: string; 7 | } 8 | 9 | export interface LLMEvent { 10 | content?: string; 11 | tools?: LLMTool[]; 12 | error?: string; 13 | message?: Record; 14 | } 15 | 16 | export function asyncLLM( 17 | request: string | Request, 18 | options?: RequestInit, 19 | config?: SSEConfig 20 | ): AsyncGenerator; 21 | -------------------------------------------------------------------------------- /index.js: -------------------------------------------------------------------------------- 1 | import { asyncSSE } from "asyncsse"; 2 | 3 | /** 4 | * asyncLLM yields events when streaming from a streaming LLM endpoint. 5 | * 6 | * @param {Request} request 7 | * @param {RequestInit} options 8 | * @param {SSEConfig} config 9 | * @returns {AsyncGenerator, void, unknown>} 10 | * 11 | * @example 12 | * for await (const event of asyncLLM("https://api.openai.com/v1/chat/completions", { 13 | * method: "POST", 14 | * headers: { 15 | * "Content-Type": "application/json", 16 | * "Authorization": "Bearer YOUR_API_KEY", 17 | * }, 18 | * body: JSON.stringify({ 19 | * model: "gpt-3.5-turbo", 20 | * messages: [{ role: "user", content: "Hello, world!" }], 21 | * }), 22 | * }, { 23 | * onResponse: async (response) => { 24 | * console.log(response.status, response.headers); 25 | * }, 26 | * })) { 27 | * console.log(event); 28 | * } 29 | */ 30 | export async function* asyncLLM(request, options = {}, config = {}) { 31 | let content, 32 | tools = []; 33 | 34 | function latestTool() { 35 | if (!tools.length) tools.push({}); 36 | return tools.at(-1); 37 | } 38 | 39 | for await (const event of asyncSSE(request, options, config)) { 40 | // OpenAI and Cloudflare AI Workers use "[DONE]" to indicate the end of the stream 41 | if (event.data === "[DONE]") break; 42 | 43 | if (event.error) { 44 | yield event; 45 | continue; 46 | } 47 | 48 | let message; 49 | try { 50 | message = JSON.parse(event.data); 51 | } catch (error) { 52 | yield { error: error.message, data: event.data }; 53 | continue; 54 | } 55 | 56 | // Handle errors. asyncSSE yields { error: ... } if the fetch fails. 57 | // OpenAI, Anthropic, and Gemini return {"error": ...}. 58 | // OpenRouter returns {"message":{"error": ...}}. 59 | const error = message.message?.error ?? message.error?.message ?? message.error ?? event.error; 60 | if (error) { 61 | yield { error }; 62 | continue; 63 | } 64 | 65 | // Attempt to parse with each provider's format 66 | let hasNewData = false; 67 | for (const parser of Object.values(providers)) { 68 | const extract = parser(message); 69 | hasNewData = !isEmpty(extract.content) || extract.tools.length > 0; 70 | if (!isEmpty(extract.content)) content = (content ?? "") + extract.content; 71 | for (const { name, args, id } of extract.tools) { 72 | if (!isEmpty(name)) { 73 | const tool = { name }; 74 | if (!isEmpty(id)) tool.id = id; 75 | tools.push(tool); 76 | } 77 | if (!isEmpty(args)) { 78 | const tool = latestTool(); 79 | tool.args = (tool.args ?? "") + args; 80 | } 81 | } 82 | if (hasNewData) break; 83 | } 84 | 85 | if (hasNewData) { 86 | const data = { content, message }; 87 | if (!isEmpty(content)) data.content = content; 88 | if (tools.length) data.tools = tools; 89 | yield data; 90 | } 91 | } 92 | } 93 | 94 | // Return the delta from each message as { content, tools } 95 | // content delta is string | undefined 96 | // tools delta is [{ name?: string, args?: string }] | [] 97 | const providers = { 98 | // Azure, OpenRouter, Groq, and a few others follow OpenAI's format 99 | openai: (m) => ({ 100 | content: m.choices?.[0]?.delta?.content, 101 | tools: (m.choices?.[0]?.delta?.tool_calls ?? []).map((tool) => ({ 102 | id: tool.id, 103 | name: tool.function.name, 104 | args: tool.function.arguments, 105 | })), 106 | }), 107 | anthropic: (m) => ({ 108 | content: m.delta?.text, 109 | tools: !isEmpty(m.content_block?.name) 110 | ? [{ name: m.content_block.name, id: m.content_block.id }] 111 | : !isEmpty(m.delta?.partial_json) 112 | ? [{ args: m.delta?.partial_json }] 113 | : [], 114 | }), 115 | gemini: (m) => ({ 116 | content: m.candidates?.[0]?.content?.parts?.[0]?.text, 117 | tools: (m.candidates?.[0]?.content?.parts ?? []) 118 | .map((part) => part.functionCall) 119 | .filter((d) => d) 120 | .map((d) => ({ name: d.name, args: JSON.stringify(d.args) })), 121 | }), 122 | cloudflare: (m) => ({ 123 | content: m.response, 124 | tools: [], 125 | }), 126 | }; 127 | 128 | const isEmpty = (value) => value === undefined || value === null; 129 | -------------------------------------------------------------------------------- /package-lock.json: -------------------------------------------------------------------------------- 1 | { 2 | "name": "asyncllm", 3 | "version": "2.1.1", 4 | "lockfileVersion": 3, 5 | "requires": true, 6 | "packages": { 7 | "": { 8 | "name": "asyncllm", 9 | "version": "2.1.1", 10 | "license": "MIT", 11 | "dependencies": { 12 | "asyncsse": "^1.3.1" 13 | }, 14 | "engines": { 15 | "node": ">=14.0.0" 16 | } 17 | }, 18 | "node_modules/asyncsse": { 19 | "version": "1.3.1", 20 | "resolved": "https://registry.npmjs.org/asyncsse/-/asyncsse-1.3.1.tgz", 21 | "integrity": "sha512-sPd7NAmOKAl+optdLYe0zyaXqMf4PCYNtkHvSddRs4cZs40i/zdG+1h8qrkg2QKoUsRmwoUaTuv+5iKkT5iv7w==", 22 | "license": "MIT", 23 | "engines": { 24 | "node": ">=14.0.0" 25 | } 26 | } 27 | } 28 | } 29 | -------------------------------------------------------------------------------- /package.json: -------------------------------------------------------------------------------- 1 | { 2 | "name": "asyncllm", 3 | "version": "2.1.2", 4 | "description": "Fetch streaming LLM responses as an async iterable", 5 | "main": "dist/asyncllm.js", 6 | "type": "module", 7 | "module": "index.js", 8 | "exports": { 9 | ".": "./dist/asyncllm.js", 10 | "./anthropic": "./dist/anthropic.js", 11 | "./gemini": "./dist/gemini.js" 12 | }, 13 | "scripts": { 14 | "test": "deno test --allow-net --allow-read", 15 | "build-asyncllm": "npx -y esbuild index.js --bundle --minify --format=esm --outfile=dist/asyncllm.js", 16 | "build-gemini": "npx -y esbuild gemini.js --bundle --minify --format=esm --outfile=dist/gemini.js", 17 | "build-anthropic": "npx -y esbuild anthropic.js --bundle --minify --format=esm --outfile=dist/anthropic.js", 18 | "build": "npm run build-asyncllm && npm run build-gemini && npm run build-anthropic", 19 | "lint": "npx prettier@3.3 --write *.js *.md", 20 | "prepublishOnly": "npm run lint && npm run build" 21 | }, 22 | "keywords": [ 23 | "sse", 24 | "fetch", 25 | "async", 26 | "iterable", 27 | "server-sent-events", 28 | "streaming", 29 | "llm", 30 | "openai", 31 | "anthropic", 32 | "gemini", 33 | "cloudflare" 34 | ], 35 | "author": "S Anand ", 36 | "license": "MIT", 37 | "repository": { 38 | "type": "git", 39 | "url": "https://github.com/sanand0/asyncllm.git" 40 | }, 41 | "bugs": { 42 | "url": "https://github.com/sanand0/asyncllm/issues" 43 | }, 44 | "homepage": "https://github.com/sanand0/asyncllm#readme", 45 | "engines": { 46 | "node": ">=14.0.0" 47 | }, 48 | "prettier": { 49 | "printWidth": 120 50 | }, 51 | "files": [ 52 | "README.md", 53 | "dist", 54 | "index.js", 55 | "index.d.ts" 56 | ], 57 | "dependencies": { 58 | "asyncsse": "^1.3.1" 59 | } 60 | } 61 | -------------------------------------------------------------------------------- /samples/anthropic-tools.txt: -------------------------------------------------------------------------------- 1 | event: message_start 2 | data: {"type":"message_start","message":{"id":"msg_014p7gG3wDgGV9EUtLvnow3U","type":"message","role":"assistant","model":"claude-3-haiku-20240307","stop_sequence":null,"usage":{"input_tokens":472,"output_tokens":2},"content":[],"stop_reason":null}} 3 | 4 | event: content_block_start 5 | data: {"type":"content_block_start","index":0,"content_block":{"type":"text","text":""}} 6 | 7 | event: ping 8 | data: {"type": "ping"} 9 | 10 | event: content_block_delta 11 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":"Okay"}} 12 | 13 | event: content_block_delta 14 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":","}} 15 | 16 | event: content_block_delta 17 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":" let"}} 18 | 19 | event: content_block_delta 20 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":"'s"}} 21 | 22 | event: content_block_delta 23 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":" check"}} 24 | 25 | event: content_block_delta 26 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":" the"}} 27 | 28 | event: content_block_delta 29 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":" weather"}} 30 | 31 | event: content_block_delta 32 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":" for"}} 33 | 34 | event: content_block_delta 35 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":" San"}} 36 | 37 | event: content_block_delta 38 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":" Francisco"}} 39 | 40 | event: content_block_delta 41 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":","}} 42 | 43 | event: content_block_delta 44 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":" CA"}} 45 | 46 | event: content_block_delta 47 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":":"}} 48 | 49 | event: content_block_stop 50 | data: {"type":"content_block_stop","index":0} 51 | 52 | event: content_block_start 53 | data: {"type":"content_block_start","index":1,"content_block":{"type":"tool_use","id":"toolu_01T1x1fJ34qAmk2tNTrN7Up6","name":"get_weather","input":{}}} 54 | 55 | event: content_block_delta 56 | data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":""}} 57 | 58 | event: content_block_delta 59 | data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":"{\"location\":"}} 60 | 61 | event: content_block_delta 62 | data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":" \"San"}} 63 | 64 | event: content_block_delta 65 | data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":" Francisc"}} 66 | 67 | event: content_block_delta 68 | data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":"o,"}} 69 | 70 | event: content_block_delta 71 | data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":" CA\""}} 72 | 73 | event: content_block_delta 74 | data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":", "}} 75 | 76 | event: content_block_delta 77 | data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":"\"unit\": \"fah"}} 78 | 79 | event: content_block_delta 80 | data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":"renheit\"}"}} 81 | 82 | event: content_block_stop 83 | data: {"type":"content_block_stop","index":1} 84 | 85 | event: message_delta 86 | data: {"type":"message_delta","delta":{"stop_reason":"tool_use","stop_sequence":null},"usage":{"output_tokens":89}} 87 | 88 | event: message_stop 89 | data: {"type":"message_stop"} 90 | -------------------------------------------------------------------------------- /samples/anthropic-tools2.txt: -------------------------------------------------------------------------------- 1 | event: message_start 2 | data: {"type":"message_start","message":{"id":"msg_01NpRfBZDJHQvTKGtrwFJheH","type":"message","role":"assistant","model":"claude-3-haiku-20240307","content":[],"stop_reason":null,"stop_sequence":null,"usage":{"input_tokens":482,"output_tokens":8}} } 3 | 4 | event: content_block_start 5 | data: {"type":"content_block_start","index":0,"content_block":{"type":"tool_use","id":"toolu_015yB3TjTS1RBaM7VScM2MQY","name":"get_order","input":{}} } 6 | 7 | event: ping 8 | data: {"type": "ping"} 9 | 10 | event: content_block_delta 11 | data: {"type":"content_block_delta","index":0,"delta":{"type":"input_json_delta","partial_json":""} } 12 | 13 | event: content_block_delta 14 | data: {"type":"content_block_delta","index":0,"delta":{"type":"input_json_delta","partial_json":"{\"id\": \"1"} } 15 | 16 | event: content_block_delta 17 | data: {"type":"content_block_delta","index":0,"delta":{"type":"input_json_delta","partial_json":"23456\"}"} } 18 | 19 | event: content_block_stop 20 | data: {"type":"content_block_stop","index":0 } 21 | 22 | event: content_block_start 23 | data: {"type":"content_block_start","index":1,"content_block":{"type":"tool_use","id":"toolu_013VAZTYqMJm2JuRCqEA4kam","name":"get_customer","input":{}} } 24 | 25 | event: content_block_delta 26 | data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":""} } 27 | 28 | event: content_block_delta 29 | data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":"{\"id\": \""} } 30 | 31 | event: content_block_delta 32 | data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":"789"} } 33 | 34 | event: content_block_delta 35 | data: {"type":"content_block_delta","index":1,"delta":{"type":"input_json_delta","partial_json":"0\"}"} } 36 | 37 | event: content_block_stop 38 | data: {"type":"content_block_stop","index":1 } 39 | 40 | event: message_delta 41 | data: {"type":"message_delta","delta":{"stop_reason":"tool_use","stop_sequence":null},"usage":{"output_tokens":76} } 42 | 43 | event: message_stop 44 | data: {"type":"message_stop" } 45 | -------------------------------------------------------------------------------- /samples/anthropic.txt: -------------------------------------------------------------------------------- 1 | event: message_start 2 | data: {"type":"message_start","message":{"id":"msg_013uu3QExnpT3UYsC9mo2Em8","type":"message","role":"assistant","model":"claude-3-haiku-20240307","content":[],"stop_reason":null,"stop_sequence":null,"usage":{"input_tokens":19,"output_tokens":3}}} 3 | 4 | event: content_block_start 5 | data: {"type":"content_block_start","index":0,"content_block":{"type":"text","text":""}} 6 | 7 | event: ping 8 | data: {"type": "ping"} 9 | 10 | event: content_block_delta 11 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":"2 "}} 12 | 13 | event: content_block_delta 14 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":"+ 2 "}} 15 | 16 | event: content_block_delta 17 | data: {"type":"content_block_delta","index":0,"delta":{"type":"text_delta","text":"= 4."}} 18 | 19 | event: content_block_stop 20 | data: {"type":"content_block_stop","index":0} 21 | 22 | event: message_delta 23 | data: {"type":"message_delta","delta":{"stop_reason":"end_turn","stop_sequence":null},"usage":{"output_tokens":14}} 24 | 25 | event: message_stop 26 | data: {"type":"message_stop"} 27 | -------------------------------------------------------------------------------- /samples/errors.txt: -------------------------------------------------------------------------------- 1 | data: invalid json 2 | 3 | data: {"error": {"message": "OpenAI API error", "type": "api_error"}} 4 | 5 | data: {"error": {"type": "invalid_request_error", "message": "Anthropic API error"}} 6 | 7 | data: {"error": {"code": 400, "message": "Gemini API error"}} 8 | 9 | data: {"message": {"error": "OpenRouter API error"}} 10 | 11 | data: 12 | -------------------------------------------------------------------------------- /samples/gemini-tools.txt: -------------------------------------------------------------------------------- 1 | data: {"candidates": [{"content": {"parts": [{"functionCall": {"name": "take_notes","args": {"note": "Capitalism and socialism are two of the most prevalent economic systems in the world. Capitalism is characterized by private ownership of the means of production, free markets, and the pursuit of profit. Socialism, on the other hand, emphasizes social ownership of the means of production, with the goal of achieving social equality and economic justice. The two systems have been the subject of much debate, with proponents of each arguing for its superiority. Capitalism is often praised for its efficiency and innovation, while socialism is lauded for its potential to reduce inequality and provide for the needs of the most vulnerable. However, both systems have their drawbacks. Capitalism can lead to economic instability and social inequality, while socialism can stifle innovation and reduce individual freedom. Ultimately, the best economic system for a given society depends on its specific circumstances and values."}}}],"role": "model"},"finishReason": "STOP","index": 0,"safetyRatings": [{"category": "HARM_CATEGORY_SEXUALLY_EXPLICIT","probability": "NEGLIGIBLE"},{"category": "HARM_CATEGORY_HARASSMENT","probability": "NEGLIGIBLE"},{"category": "HARM_CATEGORY_DANGEROUS_CONTENT","probability": "NEGLIGIBLE"},{"category": "HARM_CATEGORY_HATE_SPEECH","probability": "NEGLIGIBLE"}]}],"usageMetadata": {"promptTokenCount": 50,"candidatesTokenCount": 174,"totalTokenCount": 224}} 2 | -------------------------------------------------------------------------------- /samples/gemini-tools2.txt: -------------------------------------------------------------------------------- 1 | data: {"candidates": [{"content": {"parts": [{"functionCall": {"name": "get_order","args": {"id": "123456"}}},{"functionCall": {"name": "get_customer","args": {"id": "7890"}}}],"role": "model"},"safetyRatings": [{"category": "HARM_CATEGORY_HATE_SPEECH","probability": "NEGLIGIBLE"},{"category": "HARM_CATEGORY_DANGEROUS_CONTENT","probability": "NEGLIGIBLE"},{"category": "HARM_CATEGORY_HARASSMENT","probability": "NEGLIGIBLE"},{"category": "HARM_CATEGORY_SEXUALLY_EXPLICIT","probability": "NEGLIGIBLE"}]}],"usageMetadata": {"promptTokenCount": 104,"totalTokenCount": 104},"modelVersion": "gemini-1.5-flash-8b-001"} 2 | 3 | data: {"candidates": [{"content": {"parts": [{"text": ""}],"role": "model"},"avgLogprobs": "NaN"}],"usageMetadata": {"promptTokenCount": 104,"totalTokenCount": 104},"modelVersion": "gemini-1.5-flash-8b-001"} 4 | 5 | data: {"candidates": [{"content": {"parts": [{"text": ""}],"role": "model"},"finishReason": "STOP"}],"usageMetadata": {"promptTokenCount": 104,"candidatesTokenCount": 18,"totalTokenCount": 122},"modelVersion": "gemini-1.5-flash-8b-001"} 6 | -------------------------------------------------------------------------------- /samples/gemini.txt: -------------------------------------------------------------------------------- 1 | data: {"candidates": [{"content": {"parts": [{"text": "2"}],"role": "model"}}],"usageMetadata": {"promptTokenCount": 13,"totalTokenCount": 13}} 2 | 3 | data: {"candidates": [{"content": {"parts": [{"text": " + 2 = 4\n"}],"role": "model"},"safetyRatings": [{"category": "HARM_CATEGORY_HATE_SPEECH","probability": "NEGLIGIBLE"},{"category": "HARM_CATEGORY_DANGEROUS_CONTENT","probability": "NEGLIGIBLE"},{"category": "HARM_CATEGORY_HARASSMENT","probability": "NEGLIGIBLE"},{"category": "HARM_CATEGORY_SEXUALLY_EXPLICIT","probability": "NEGLIGIBLE"}]}],"usageMetadata": {"promptTokenCount": 13,"totalTokenCount": 13}} 4 | 5 | data: {"candidates": [{"content": {"parts": [{"text": ""}],"role": "model"},"finishReason": "STOP"}],"usageMetadata": {"promptTokenCount": 13,"candidatesTokenCount": 8,"totalTokenCount": 21}} 6 | -------------------------------------------------------------------------------- /samples/openai-tools.txt: -------------------------------------------------------------------------------- 1 | data: {"id":"chatcmpl-AIYHs3Xp2vOtDdtgJUaTpUVMKk3a8","object":"chat.completion.chunk","created":1728985068,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_e2bde53e6e","choices":[{"index":0,"delta":{"role":"assistant","content":null,"tool_calls":[{"index":0,"id":"call_F8YHCjnzrrTjfE4YSSpVW2Bc","type":"function","function":{"name":"get_delivery_date","arguments":""}}],"refusal":null},"logprobs":null,"finish_reason":null}]} 2 | 3 | data: {"id":"chatcmpl-AIYHs3Xp2vOtDdtgJUaTpUVMKk3a8","object":"chat.completion.chunk","created":1728985068,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_e2bde53e6e","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":"{\""}}]},"logprobs":null,"finish_reason":null}]} 4 | 5 | data: {"id":"chatcmpl-AIYHs3Xp2vOtDdtgJUaTpUVMKk3a8","object":"chat.completion.chunk","created":1728985068,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_e2bde53e6e","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":"order"}}]},"logprobs":null,"finish_reason":null}]} 6 | 7 | data: {"id":"chatcmpl-AIYHs3Xp2vOtDdtgJUaTpUVMKk3a8","object":"chat.completion.chunk","created":1728985068,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_e2bde53e6e","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":"_id"}}]},"logprobs":null,"finish_reason":null}]} 8 | 9 | data: {"id":"chatcmpl-AIYHs3Xp2vOtDdtgJUaTpUVMKk3a8","object":"chat.completion.chunk","created":1728985068,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_e2bde53e6e","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":"\":\""}}]},"logprobs":null,"finish_reason":null}]} 10 | 11 | data: {"id":"chatcmpl-AIYHs3Xp2vOtDdtgJUaTpUVMKk3a8","object":"chat.completion.chunk","created":1728985068,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_e2bde53e6e","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":"123"}}]},"logprobs":null,"finish_reason":null}]} 12 | 13 | data: {"id":"chatcmpl-AIYHs3Xp2vOtDdtgJUaTpUVMKk3a8","object":"chat.completion.chunk","created":1728985068,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_e2bde53e6e","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":"456"}}]},"logprobs":null,"finish_reason":null}]} 14 | 15 | data: {"id":"chatcmpl-AIYHs3Xp2vOtDdtgJUaTpUVMKk3a8","object":"chat.completion.chunk","created":1728985068,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_e2bde53e6e","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":"\"}"}}]},"logprobs":null,"finish_reason":null}]} 16 | 17 | data: {"id":"chatcmpl-AIYHs3Xp2vOtDdtgJUaTpUVMKk3a8","object":"chat.completion.chunk","created":1728985068,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_e2bde53e6e","choices":[{"index":0,"delta":{},"logprobs":null,"finish_reason":"tool_calls"}]} 18 | 19 | data: [DONE] 20 | 21 | -------------------------------------------------------------------------------- /samples/openai-tools2.txt: -------------------------------------------------------------------------------- 1 | data: {"id":"chatcmpl-AQ3zpRW1u9JcFF4vG4yvlRk6Dl0Nk","object":"chat.completion.chunk","created":1730775253,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_9b78b61c52","choices":[{"index":0,"delta":{"role":"assistant","content":null},"logprobs":null,"finish_reason":null}]} 2 | 3 | data: {"id":"chatcmpl-AQ3zpRW1u9JcFF4vG4yvlRk6Dl0Nk","object":"chat.completion.chunk","created":1730775253,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_9b78b61c52","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"id":"call_wnH2cswb4JAnm69pUAP4MNEN","type":"function","function":{"name":"get_order","arguments":""}}]},"logprobs":null,"finish_reason":null}]} 4 | 5 | data: {"id":"chatcmpl-AQ3zpRW1u9JcFF4vG4yvlRk6Dl0Nk","object":"chat.completion.chunk","created":1730775253,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_9b78b61c52","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":"{\"id"}}]},"logprobs":null,"finish_reason":null}]} 6 | 7 | data: {"id":"chatcmpl-AQ3zpRW1u9JcFF4vG4yvlRk6Dl0Nk","object":"chat.completion.chunk","created":1730775253,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_9b78b61c52","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":"\": \"1"}}]},"logprobs":null,"finish_reason":null}]} 8 | 9 | data: {"id":"chatcmpl-AQ3zpRW1u9JcFF4vG4yvlRk6Dl0Nk","object":"chat.completion.chunk","created":1730775253,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_9b78b61c52","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":"23456\""}}]},"logprobs":null,"finish_reason":null}]} 10 | 11 | data: {"id":"chatcmpl-AQ3zpRW1u9JcFF4vG4yvlRk6Dl0Nk","object":"chat.completion.chunk","created":1730775253,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_9b78b61c52","choices":[{"index":0,"delta":{"tool_calls":[{"index":0,"function":{"arguments":"}"}}]},"logprobs":null,"finish_reason":null}]} 12 | 13 | data: {"id":"chatcmpl-AQ3zpRW1u9JcFF4vG4yvlRk6Dl0Nk","object":"chat.completion.chunk","created":1730775253,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_9b78b61c52","choices":[{"index":0,"delta":{"tool_calls":[{"index":1,"id":"call_f4GVABhbwSOLoaisOBOajnsm","type":"function","function":{"name":"get_customer","arguments":""}}]},"logprobs":null,"finish_reason":null}]} 14 | 15 | data: {"id":"chatcmpl-AQ3zpRW1u9JcFF4vG4yvlRk6Dl0Nk","object":"chat.completion.chunk","created":1730775253,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_9b78b61c52","choices":[{"index":0,"delta":{"tool_calls":[{"index":1,"function":{"arguments":"{\"id"}}]},"logprobs":null,"finish_reason":null}]} 16 | 17 | data: {"id":"chatcmpl-AQ3zpRW1u9JcFF4vG4yvlRk6Dl0Nk","object":"chat.completion.chunk","created":1730775253,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_9b78b61c52","choices":[{"index":0,"delta":{"tool_calls":[{"index":1,"function":{"arguments":"\": \"7"}}]},"logprobs":null,"finish_reason":null}]} 18 | 19 | data: {"id":"chatcmpl-AQ3zpRW1u9JcFF4vG4yvlRk6Dl0Nk","object":"chat.completion.chunk","created":1730775253,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_9b78b61c52","choices":[{"index":0,"delta":{"tool_calls":[{"index":1,"function":{"arguments":"890\"}"}}]},"logprobs":null,"finish_reason":null}]} 20 | 21 | data: {"id":"chatcmpl-AQ3zpRW1u9JcFF4vG4yvlRk6Dl0Nk","object":"chat.completion.chunk","created":1730775253,"model":"gpt-4o-mini-2024-07-18","system_fingerprint":"fp_9b78b61c52","choices":[{"index":0,"delta":{},"logprobs":null,"finish_reason":"tool_calls"}]} 22 | 23 | data: [DONE] 24 | -------------------------------------------------------------------------------- /samples/openai.txt: -------------------------------------------------------------------------------- 1 | data: {"id":"chatcmpl-AIXwzd0Ul2u3WWUqaXvmzE4o5Th8b","object":"chat.completion.chunk","created":1728983773,"model":"gpt-4o-2024-08-06","system_fingerprint":"fp_6b68a8204b","choices":[{"index":0,"delta":{"role":"assistant","content":"","refusal":null},"logprobs":null,"finish_reason":null}]} 2 | 3 | data: {"id":"chatcmpl-AIXwzd0Ul2u3WWUqaXvmzE4o5Th8b","object":"chat.completion.chunk","created":1728983773,"model":"gpt-4o-2024-08-06","system_fingerprint":"fp_6b68a8204b","choices":[{"index":0,"delta":{"content":"Hello"},"logprobs":null,"finish_reason":null}]} 4 | 5 | data: {"id":"chatcmpl-AIXwzd0Ul2u3WWUqaXvmzE4o5Th8b","object":"chat.completion.chunk","created":1728983773,"model":"gpt-4o-2024-08-06","system_fingerprint":"fp_6b68a8204b","choices":[{"index":0,"delta":{"content":"!"},"logprobs":null,"finish_reason":null}]} 6 | 7 | data: {"id":"chatcmpl-AIXwzd0Ul2u3WWUqaXvmzE4o5Th8b","object":"chat.completion.chunk","created":1728983773,"model":"gpt-4o-2024-08-06","system_fingerprint":"fp_6b68a8204b","choices":[{"index":0,"delta":{"content":" How"},"logprobs":null,"finish_reason":null}]} 8 | 9 | data: {"id":"chatcmpl-AIXwzd0Ul2u3WWUqaXvmzE4o5Th8b","object":"chat.completion.chunk","created":1728983773,"model":"gpt-4o-2024-08-06","system_fingerprint":"fp_6b68a8204b","choices":[{"index":0,"delta":{"content":" can"},"logprobs":null,"finish_reason":null}]} 10 | 11 | data: {"id":"chatcmpl-AIXwzd0Ul2u3WWUqaXvmzE4o5Th8b","object":"chat.completion.chunk","created":1728983773,"model":"gpt-4o-2024-08-06","system_fingerprint":"fp_6b68a8204b","choices":[{"index":0,"delta":{"content":" I"},"logprobs":null,"finish_reason":null}]} 12 | 13 | data: {"id":"chatcmpl-AIXwzd0Ul2u3WWUqaXvmzE4o5Th8b","object":"chat.completion.chunk","created":1728983773,"model":"gpt-4o-2024-08-06","system_fingerprint":"fp_6b68a8204b","choices":[{"index":0,"delta":{"content":" assist"},"logprobs":null,"finish_reason":null}]} 14 | 15 | data: {"id":"chatcmpl-AIXwzd0Ul2u3WWUqaXvmzE4o5Th8b","object":"chat.completion.chunk","created":1728983773,"model":"gpt-4o-2024-08-06","system_fingerprint":"fp_6b68a8204b","choices":[{"index":0,"delta":{"content":" you"},"logprobs":null,"finish_reason":null}]} 16 | 17 | data: {"id":"chatcmpl-AIXwzd0Ul2u3WWUqaXvmzE4o5Th8b","object":"chat.completion.chunk","created":1728983773,"model":"gpt-4o-2024-08-06","system_fingerprint":"fp_6b68a8204b","choices":[{"index":0,"delta":{"content":" today"},"logprobs":null,"finish_reason":null}]} 18 | 19 | data: {"id":"chatcmpl-AIXwzd0Ul2u3WWUqaXvmzE4o5Th8b","object":"chat.completion.chunk","created":1728983773,"model":"gpt-4o-2024-08-06","system_fingerprint":"fp_6b68a8204b","choices":[{"index":0,"delta":{"content":"?"},"logprobs":null,"finish_reason":null}]} 20 | 21 | data: {"id":"chatcmpl-AIXwzd0Ul2u3WWUqaXvmzE4o5Th8b","object":"chat.completion.chunk","created":1728983773,"model":"gpt-4o-2024-08-06","system_fingerprint":"fp_6b68a8204b","choices":[{"index":0,"delta":{},"logprobs":null,"finish_reason":"stop"}]} 22 | 23 | data: [DONE] 24 | -------------------------------------------------------------------------------- /samples/openrouter.txt: -------------------------------------------------------------------------------- 1 | : OPENROUTER PROCESSING 2 | 3 | : OPENROUTER PROCESSING 4 | 5 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":""},"finish_reason":null,"logprobs":null}]} 6 | 7 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" The"},"finish_reason":null,"logprobs":null}]} 8 | 9 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" sum"},"finish_reason":null,"logprobs":null}]} 10 | 11 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" of"},"finish_reason":null,"logprobs":null}]} 12 | 13 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" "},"finish_reason":null,"logprobs":null}]} 14 | 15 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"2"},"finish_reason":null,"logprobs":null}]} 16 | 17 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" and"},"finish_reason":null,"logprobs":null}]} 18 | 19 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" "},"finish_reason":null,"logprobs":null}]} 20 | 21 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"2"},"finish_reason":null,"logprobs":null}]} 22 | 23 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" is"},"finish_reason":null,"logprobs":null}]} 24 | 25 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" "},"finish_reason":null,"logprobs":null}]} 26 | 27 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"4"},"finish_reason":null,"logprobs":null}]} 28 | 29 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"."},"finish_reason":null,"logprobs":null}]} 30 | 31 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" This"},"finish_reason":null,"logprobs":null}]} 32 | 33 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" is"},"finish_reason":null,"logprobs":null}]} 34 | 35 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" a"},"finish_reason":null,"logprobs":null}]} 36 | 37 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" basic"},"finish_reason":null,"logprobs":null}]} 38 | 39 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" arithmetic"},"finish_reason":null,"logprobs":null}]} 40 | 41 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" operation"},"finish_reason":null,"logprobs":null}]} 42 | 43 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" where"},"finish_reason":null,"logprobs":null}]} 44 | 45 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" you"},"finish_reason":null,"logprobs":null}]} 46 | 47 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" add"},"finish_reason":null,"logprobs":null}]} 48 | 49 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" the"},"finish_reason":null,"logprobs":null}]} 50 | 51 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" two"},"finish_reason":null,"logprobs":null}]} 52 | 53 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" numbers"},"finish_reason":null,"logprobs":null}]} 54 | 55 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" together"},"finish_reason":null,"logprobs":null}]} 56 | 57 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" to"},"finish_reason":null,"logprobs":null}]} 58 | 59 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" get"},"finish_reason":null,"logprobs":null}]} 60 | 61 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" the"},"finish_reason":null,"logprobs":null}]} 62 | 63 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" total"},"finish_reason":null,"logprobs":null}]} 64 | 65 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"."},"finish_reason":null,"logprobs":null}]} 66 | 67 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" "},"finish_reason":null,"logprobs":null}]} 68 | 69 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"\n"},"finish_reason":null,"logprobs":null}]} 70 | 71 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"\n"},"finish_reason":null,"logprobs":null}]} 72 | 73 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"Here"},"finish_reason":null,"logprobs":null}]} 74 | 75 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"'"},"finish_reason":null,"logprobs":null}]} 76 | 77 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"s"},"finish_reason":null,"logprobs":null}]} 78 | 79 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" the"},"finish_reason":null,"logprobs":null}]} 80 | 81 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" calculation"},"finish_reason":null,"logprobs":null}]} 82 | 83 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":":"},"finish_reason":null,"logprobs":null}]} 84 | 85 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"\n"},"finish_reason":null,"logprobs":null}]} 86 | 87 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"\n"},"finish_reason":null,"logprobs":null}]} 88 | 89 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"2"},"finish_reason":null,"logprobs":null}]} 90 | 91 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" +"},"finish_reason":null,"logprobs":null}]} 92 | 93 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" "},"finish_reason":null,"logprobs":null}]} 94 | 95 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"2"},"finish_reason":null,"logprobs":null}]} 96 | 97 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" ="},"finish_reason":null,"logprobs":null}]} 98 | 99 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" "},"finish_reason":null,"logprobs":null}]} 100 | 101 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"4"},"finish_reason":null,"logprobs":null}]} 102 | 103 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"\n"},"finish_reason":null,"logprobs":null}]} 104 | 105 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"\n"},"finish_reason":null,"logprobs":null}]} 106 | 107 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"So"},"finish_reason":null,"logprobs":null}]} 108 | 109 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":","},"finish_reason":null,"logprobs":null}]} 110 | 111 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" the"},"finish_reason":null,"logprobs":null}]} 112 | 113 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" answer"},"finish_reason":null,"logprobs":null}]} 114 | 115 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" to"},"finish_reason":null,"logprobs":null}]} 116 | 117 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" your"},"finish_reason":null,"logprobs":null}]} 118 | 119 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" question"},"finish_reason":null,"logprobs":null}]} 120 | 121 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" is"},"finish_reason":null,"logprobs":null}]} 122 | 123 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":" "},"finish_reason":null,"logprobs":null}]} 124 | 125 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"4"},"finish_reason":null,"logprobs":null}]} 126 | 127 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":"."},"finish_reason":null,"logprobs":null}]} 128 | 129 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":""},"finish_reason":"stop","logprobs":null}]} 130 | 131 | : OPENROUTER PROCESSING 132 | 133 | data: {"id":"gen-1729004990-gTyfUdC2AMGEv0NpAg7u","provider":"Azure","model":"microsoft/phi-3.5-mini-128k-instruct","object":"chat.completion.chunk","created":1729004990,"choices":[{"index":0,"delta":{"role":"assistant","content":""},"finish_reason":null,"logprobs":null}],"usage":{"prompt_tokens":17,"completion_tokens":62,"total_tokens":79}} 134 | 135 | data: [DONE] 136 | -------------------------------------------------------------------------------- /samples/output.txt: -------------------------------------------------------------------------------- 1 | data: {"candidates": [{"content": {"parts": [{"functionCall": {"name": "take_notes","args": {"note": "Capitalism and socialism are two of the most prevalent economic systems in the world. Capitalism is characterized by private ownership of the means of production, free markets, and the pursuit of profit. Socialism, on the other hand, emphasizes social ownership of the means of production, with the goal of achieving social equality and economic justice. The two systems have been the subject of much debate, with proponents of each arguing for its superiority. Capitalism is often praised for its efficiency and innovation, while socialism is lauded for its potential to reduce inequality and provide for the needs of the most vulnerable. However, both systems have their drawbacks. Capitalism can lead to economic instability and social inequality, while socialism can stifle innovation and reduce individual freedom. Ultimately, the best economic system for a given society depends on its specific circumstances and values."}}}],"role": "model"},"finishReason": "STOP","index": 0,"safetyRatings": [{"category": "HARM_CATEGORY_SEXUALLY_EXPLICIT","probability": "NEGLIGIBLE"},{"category": "HARM_CATEGORY_HARASSMENT","probability": "NEGLIGIBLE"},{"category": "HARM_CATEGORY_DANGEROUS_CONTENT","probability": "NEGLIGIBLE"},{"category": "HARM_CATEGORY_HATE_SPEECH","probability": "NEGLIGIBLE"}]}],"usageMetadata": {"promptTokenCount": 50,"candidatesTokenCount": 174,"totalTokenCount": 224}} 2 | 3 | -------------------------------------------------------------------------------- /test.js: -------------------------------------------------------------------------------- 1 | import { asyncLLM } from "./index.js"; 2 | 3 | const PORT = 8080; 4 | const BASE_URL = `http://localhost:${PORT}`; 5 | 6 | function assertEquals(actual, expected, message) { 7 | if (JSON.stringify(actual) === JSON.stringify(expected)) return; 8 | throw new Error( 9 | message || `Expected:\n${JSON.stringify(expected, null, 2)}. Actual:\n${JSON.stringify(actual, null, 2)}`, 10 | ); 11 | } 12 | 13 | Deno.serve({ port: PORT }, async (req) => { 14 | const url = new URL(req.url); 15 | const file = await Deno.readFile(`samples${url.pathname}`); 16 | return new Response(file, { 17 | headers: { "Content-Type": "text/event-stream" }, 18 | }); 19 | }); 20 | 21 | /* 22 | curl -X POST https://llmfoundry.straive.com/openai/v1/chat/completions \ 23 | -H "Authorization: Bearer $LLMFOUNDRY_TOKEN:asyncllm" \ 24 | -H "Content-Type: application/json" \ 25 | -d '{"model": "gpt-4o-mini", "stream": true, "messages": [{"role": "user", "content": "Hello world"}]}' 26 | */ 27 | Deno.test("asyncLLM - OpenAI", async () => { 28 | const results = await Array.fromAsync(asyncLLM(`${BASE_URL}/openai.txt`)); 29 | 30 | assertEquals(results.length, 10); 31 | assertEquals(results[0].content, ""); 32 | assertEquals(results[1].content, "Hello"); 33 | assertEquals(results[9].content, "Hello! How can I assist you today?"); 34 | assertEquals(results.at(-1).tools, undefined); 35 | }); 36 | 37 | /* 38 | curl -X POST https://llmfoundry.straive.com/openai/v1/chat/completions \ 39 | -H "Authorization: Bearer $LLMFOUNDRY_TOKEN:asyncllm" \ 40 | -H "Content-Type: application/json" \ 41 | -d '{ 42 | "model": "gpt-4o-mini", 43 | "stream": true, 44 | "messages": [ 45 | {"role": "system", "content": "Call get_delivery_date with the order ID."}, 46 | {"role": "user", "content": "123456"} 47 | ], 48 | "tools": [ 49 | { 50 | "type": "function", 51 | "function": { 52 | "name": "get_delivery_date", 53 | "description": "Get the delivery date for a customer order.", 54 | "parameters": { 55 | "type": "object", 56 | "properties": { "order_id": { "type": "string", "description": "The customer order ID." } }, 57 | "required": ["order_id"], 58 | "additionalProperties": false 59 | } 60 | } 61 | } 62 | ] 63 | }' 64 | */ 65 | Deno.test("asyncLLM - OpenAI with tool calls", async () => { 66 | let index = 0; 67 | let data = {}; 68 | for await (data of asyncLLM(`${BASE_URL}/openai-tools.txt`)) { 69 | if (index == 0) { 70 | assertEquals(data.tools[0].name, "get_delivery_date"); 71 | assertEquals(data.tools[0].id, "call_F8YHCjnzrrTjfE4YSSpVW2Bc"); 72 | assertEquals(data.tools[0].args, ""); 73 | } 74 | if (index == 1) assertEquals(data.tools[0].args, '{"'); 75 | if (index == 7) assertEquals(data.tools[0].args, '{"order_id":"123456"}'); 76 | if (index == 7) assertEquals(data.content, undefined); 77 | index++; 78 | } 79 | assertEquals(JSON.parse(data.tools[0].args), { order_id: "123456" }); 80 | assertEquals(index, 8); 81 | }); 82 | 83 | /* 84 | curl -X POST https://llmfoundry.straive.com/openai/v1/chat/completions \ 85 | -H "Authorization: Bearer $LLMFOUNDRY_TOKEN:asyncllm" \ 86 | -H "Content-Type: application/json" \ 87 | -d '{ 88 | "model": "gpt-4o-mini", 89 | "stream": true, 90 | "messages": [ 91 | { "role": "system", "content": "Call get_order({order_id}) AND get_customer({customer_id}) in parallel" }, 92 | { "role": "user", "content": "Order ID: 123456, Customer ID: 7890" } 93 | ], 94 | "tool_choice": "required", 95 | "tools": [ 96 | { 97 | "type": "function", 98 | "function": { "name": "get_order", "parameters": { "type": "object", "properties": { "id": { "type": "string" } }, "required": ["id"] } } 99 | }, 100 | { 101 | "type": "function", 102 | "function": { "name": "get_customer", "parameters": { "type": "object", "properties": { "id": { "type": "string" } }, "required": ["id"] } } 103 | } 104 | ] 105 | } 106 | } 107 | */ 108 | Deno.test("asyncLLM - OpenAI with multiple tool calls", async () => { 109 | let index = 0; 110 | let data = {}; 111 | for await (data of asyncLLM(`${BASE_URL}/openai-tools2.txt`)) { 112 | if (index === 0) { 113 | assertEquals(data.tools[0], { 114 | name: "get_order", 115 | id: "call_wnH2cswb4JAnm69pUAP4MNEN", 116 | args: "", 117 | }); 118 | } 119 | if (index === 5) assertEquals(data.tools[0].args, '{"id": "123456"}'); 120 | if (index === 6) { 121 | assertEquals(data.tools[1], { 122 | name: "get_customer", 123 | id: "call_f4GVABhbwSOLoaisOBOajnsm", 124 | args: '{"id', 125 | }); 126 | } 127 | if (index === 9) assertEquals(data.tools[1].args, '{"id": "7890"}'); 128 | index++; 129 | } 130 | assertEquals(index, 9); 131 | assertEquals(data.tools[0], { name: "get_order", id: "call_wnH2cswb4JAnm69pUAP4MNEN", args: '{"id": "123456"}' }); 132 | assertEquals(data.tools[1], { name: "get_customer", id: "call_f4GVABhbwSOLoaisOBOajnsm", args: '{"id": "7890"}' }); 133 | }); 134 | 135 | /* 136 | curl -X POST https://llmfoundry.straive.com/anthropic/v1/messages \ 137 | -H "Authorization: Bearer $LLMFOUNDRY_TOKEN:asyncllm" \ 138 | -H "Content-Type: application/json" \ 139 | -d '{"model": "claude-3-haiku-20240307", "stream": true, "max_tokens": 10, "messages": [{"role": "user", "content": "What is 2 + 2"}]}' 140 | */ 141 | Deno.test("asyncLLM - Anthropic", async () => { 142 | const results = await Array.fromAsync(asyncLLM(`${BASE_URL}/anthropic.txt`)); 143 | 144 | assertEquals(results.length, 3); 145 | assertEquals(results[0].content, "2 "); 146 | assertEquals(results[1].content, "2 + 2 "); 147 | assertEquals(results[2].content, "2 + 2 = 4."); 148 | assertEquals(results.at(-1).tools, undefined); 149 | }); 150 | 151 | Deno.test("asyncLLM - Anthropic with tool calls", async () => { 152 | let index = 0; 153 | let data = {}; 154 | for await (data of asyncLLM(`${BASE_URL}/anthropic-tools.txt`)) { 155 | if (index === 0) assertEquals(data.content, "Okay"); 156 | if (index === 12) assertEquals(data.content, "Okay, let's check the weather for San Francisco, CA:"); 157 | if (index === 13) assertEquals(data.tools[0], { name: "get_weather", id: "toolu_01T1x1fJ34qAmk2tNTrN7Up6" }); 158 | if (index === 14) assertEquals(data.tools[0].args, ""); 159 | index++; 160 | } 161 | assertEquals(data.tools[0].name, "get_weather"); 162 | assertEquals(data.tools[0].id, "toolu_01T1x1fJ34qAmk2tNTrN7Up6"); 163 | assertEquals(JSON.parse(data.tools[0].args), { 164 | location: "San Francisco, CA", 165 | unit: "fahrenheit", 166 | }); 167 | assertEquals(index, 23); 168 | }); 169 | 170 | /* 171 | curl -X POST https://llmfoundry.straive.com/anthropic/v1/messages \ 172 | -H "Authorization: Bearer $LLMFOUNDRY_TOKEN:asyncllm" \ 173 | -H "Content-Type: application/json" \ 174 | -d '{ 175 | "system": "Call get_order({order_id}) AND get_customer({customer_id}) in parallel", 176 | "messages": [{ "role": "user", "content": "Order ID: 123456, Customer ID: 7890" }], 177 | "model": "claude-3-haiku-20240307", 178 | "max_tokens": 4096, 179 | "stream": true, 180 | "tool_choice": { "type": "any", "disable_parallel_tool_use": false }, 181 | "tools": [ 182 | { "name": "get_order", "input_schema": { "type": "object", "properties": { "id": { "type": "string" } }, "required": ["id"] } }, 183 | { "name": "get_customer", "input_schema": { "type": "object", "properties": { "id": { "type": "string" } }, "required": ["id"] } } 184 | ] 185 | } 186 | }` 187 | */ 188 | Deno.test("asyncLLM - Anthropic with multiple tool calls", async () => { 189 | let index = 0; 190 | let data = {}; 191 | for await (data of asyncLLM(`${BASE_URL}/anthropic-tools2.txt`)) { 192 | if (index === 0) assertEquals(data.tools[0], { name: "get_order", id: "toolu_015yB3TjTS1RBaM7VScM2MQY" }); 193 | if (index === 2) assertEquals(data.tools[0].args, '{"id": "1'); 194 | if (index === 7) 195 | assertEquals(data.tools[1], { name: "get_customer", id: "toolu_013VAZTYqMJm2JuRCqEA4kam", args: '{"id": "789' }); 196 | index++; 197 | } 198 | assertEquals(index, 9); 199 | assertEquals(data.tools[0], { name: "get_order", id: "toolu_015yB3TjTS1RBaM7VScM2MQY", args: '{"id": "123456"}' }); 200 | assertEquals(data.tools[1], { name: "get_customer", id: "toolu_013VAZTYqMJm2JuRCqEA4kam", args: '{"id": "7890"}' }); 201 | }); 202 | 203 | /* 204 | curl -X POST https://llmfoundry.straive.com/gemini/v1beta/models/gemini-1.5-flash-8b:streamGenerateContent?alt=sse \ 205 | -H "Authorization: Bearer $LLMFOUNDRY_TOKEN:asyncllm" \ 206 | -H "Content-Type: application/json" \ 207 | -d '{ 208 | "system_instruction": { "parts": [{ "text": "You are a helpful assistant" }] }, 209 | "contents": [{ "role": "user", "parts": [{ "text": "What is 2+2?" }] }] 210 | }' 211 | */ 212 | Deno.test("asyncLLM - Gemini", async () => { 213 | const results = await Array.fromAsync(asyncLLM(`${BASE_URL}/gemini.txt`)); 214 | 215 | assertEquals(results.length, 3); 216 | assertEquals(results[0].content, "2"); 217 | assertEquals(results[1].content, "2 + 2 = 4\n"); 218 | assertEquals(results[2].content, "2 + 2 = 4\n"); 219 | assertEquals(results.at(-1).tools, undefined); 220 | }); 221 | 222 | /* 223 | curl -X POST https://llmfoundry.straive.com/gemini/v1beta/models/gemini-1.5-flash-latest:streamGenerateContent?alt=sse \ 224 | -H "Authorization: Bearer $LLMFOUNDRY_TOKEN:asyncllm" \ 225 | -H "Content-Type: application/json" \ 226 | -d '{ 227 | "contents": { "role": "user", "parts": { "text": "Call take_notes passing it an essay about capitalism vs socialism" } }, 228 | "tools": [ 229 | { 230 | "function_declarations": [ 231 | { 232 | "name": "take_notes", 233 | "description": "Take notes about a topic", 234 | "parameters": { 235 | "type": "object", 236 | "properties": { "note": { "type": "string" } }, 237 | "required": ["note"] 238 | } 239 | } 240 | ] 241 | } 242 | ] 243 | }' 244 | */ 245 | Deno.test("asyncLLM - Gemini with tool calls", async () => { 246 | let index = 0; 247 | let data = {}; 248 | for await (data of asyncLLM(`${BASE_URL}/gemini-tools.txt`)) { 249 | if (index === 0) assertEquals(data.tools[0].name, "take_notes"); 250 | if (index === 0) assertEquals(data.tools[0].args.startsWith('{"note":"Capitalism'), true); 251 | index++; 252 | } 253 | assertEquals(data.content, undefined); 254 | assertEquals(JSON.parse(data.tools[0].args).note.startsWith("Capitalism and socialism"), true); 255 | assertEquals(JSON.parse(data.tools[0].args).note.endsWith("specific circumstances and values."), true); 256 | assertEquals(index, 1); 257 | }); 258 | 259 | /* 260 | curl -X POST https://llmfoundry.straive.com/gemini/v1beta/models/gemini-1.5-flash-latest:streamGenerateContent?alt=sse \ 261 | -H "Authorization: Bearer $LLMFOUNDRY_TOKEN:asyncllm" \ 262 | -H "Content-Type: application/json" \ 263 | -d '{ 264 | "systemInstruction": {"parts": [{"text": "Call get_order({order_id}) AND get_customer({customer_id}) in parallel"}]}, 265 | "contents": [{"role": "user", "parts": [{ "text": "Order ID: 123456, Customer ID: 7890" }] }], 266 | "toolConfig": { "function_calling_config": { "mode": "ANY" } }, 267 | "tools": { 268 | "functionDeclarations": [ 269 | { 270 | "name": "get_order", 271 | "parameters": { "type": "object", "properties": { "id": { "type": "string" } }, "required": ["id"] } 272 | }, 273 | { 274 | "name": "get_customer", 275 | "parameters": { "type": "object", "properties": { "id": { "type": "string" } }, "required": ["id"] } 276 | } 277 | ] 278 | } 279 | } 280 | }` 281 | */ 282 | Deno.test("asyncLLM - Gemini with multiple tool calls", async () => { 283 | let index = 0; 284 | let data = {}; 285 | for await (data of asyncLLM(`${BASE_URL}/gemini-tools2.txt`)) { 286 | if (index === 0) { 287 | assertEquals(data.tools[0], { name: "get_order", args: '{"id":"123456"}' }); 288 | assertEquals(data.tools[1], { name: "get_customer", args: '{"id":"7890"}' }); 289 | } 290 | index++; 291 | } 292 | assertEquals(index, 3); 293 | assertEquals(data.tools[0].name, "get_order"); 294 | assertEquals(JSON.parse(data.tools[0].args), { id: "123456" }); 295 | assertEquals(data.tools[1].name, "get_customer"); 296 | assertEquals(JSON.parse(data.tools[1].args), { id: "7890" }); 297 | }); 298 | 299 | /* 300 | curl -X POST https://llmfoundry.straive.com/openrouter/v1/chat/completions \ 301 | -H "Authorization: Bearer $LLMFOUNDRY_TOKEN:asyncllm" \ 302 | -H "Content-Type: application/json" \ 303 | -d '{"model": "meta-llama/llama-3.2-11b-vision-instruct", "stream": true, "messages": [{"role": "user", "content": "What is 2 + 2"}]}' 304 | */ 305 | Deno.test("asyncLLM - OpenRouter", async () => { 306 | const results = await Array.fromAsync(asyncLLM(`${BASE_URL}/openrouter.txt`)); 307 | 308 | assertEquals(results.length, 64); 309 | assertEquals(results[0].content, ""); 310 | assertEquals(results[1].content, " The"); 311 | assertEquals(results[2].content, " The sum"); 312 | assertEquals( 313 | results.at(-1).content, 314 | " The sum of 2 and 2 is 4. This is a basic arithmetic operation where you add the two numbers together to get the total. \n\nHere's the calculation:\n\n2 + 2 = 4\n\nSo, the answer to your question is 4.", 315 | ); 316 | assertEquals(results.at(-1).tools, undefined); 317 | }); 318 | 319 | Deno.test("asyncLLM - Error handling", async () => { 320 | const results = await Array.fromAsync(asyncLLM(`${BASE_URL}/errors.txt`)); 321 | 322 | assertEquals(results.length, 6); 323 | 324 | // Malformed JSON 325 | assertEquals(results[0].error, "Unexpected token 'i', \"invalid json\" is not valid JSON"); 326 | 327 | // OpenAI-style error 328 | assertEquals(results[1].error, "OpenAI API error"); 329 | 330 | // Anthropic-style error 331 | assertEquals(results[2].error, "Anthropic API error"); 332 | 333 | // Gemini-style error 334 | assertEquals(results[3].error, "Gemini API error"); 335 | 336 | // OpenRouter-style error 337 | assertEquals(results[4].error, "OpenRouter API error"); 338 | 339 | // No data 340 | assertEquals(results[5].error, "Unexpected end of JSON input"); 341 | }); 342 | 343 | Deno.test("asyncLLM - Config callback", async () => { 344 | let responseStatus = 0; 345 | let contentType = ""; 346 | 347 | const results = await Array.fromAsync( 348 | asyncLLM( 349 | `${BASE_URL}/openai.txt`, 350 | {}, 351 | { 352 | onResponse: async (response) => { 353 | responseStatus = response.status; 354 | contentType = response.headers.get("Content-Type"); 355 | }, 356 | }, 357 | ), 358 | ); 359 | 360 | assertEquals(responseStatus, 200); 361 | assertEquals(contentType, "text/event-stream"); 362 | assertEquals(results.length, 10); // Verify normal operation still works 363 | }); 364 | 365 | Deno.test("asyncLLM - Config callback error handling", async () => { 366 | let responseStatus = 0; 367 | 368 | const results = await Array.fromAsync( 369 | asyncLLM( 370 | `${BASE_URL}/errors.txt`, 371 | {}, 372 | { 373 | onResponse: async (response) => { 374 | responseStatus = response.status; 375 | }, 376 | }, 377 | ), 378 | ); 379 | 380 | assertEquals(responseStatus, 200); 381 | assertEquals(results[0].error, "Unexpected token 'i', \"invalid json\" is not valid JSON"); 382 | }); 383 | 384 | Deno.test("asyncLLM - Request object input", async () => { 385 | const request = new Request(`${BASE_URL}/openai.txt`); 386 | const results = await Array.fromAsync(asyncLLM(request)); 387 | 388 | assertEquals(results.length, 10); 389 | }); 390 |