├── .gitignore ├── public ├── social_share.png ├── favicon.svg └── logo.svg ├── .env.example ├── tsconfig.json ├── .markdownlint-cli2.cjs ├── src ├── styles │ └── global.css ├── content │ ├── config.ts │ ├── blog-zh │ │ ├── 2025-09-16-instant-model-mentions_zh.md │ │ ├── 2025-09-18-smart-quick-chat-dialog-positioning_zh.md │ │ ├── 2025-08-19-chatollama-deepagents-integration_zh.md │ │ ├── 2025-08-25-langchain-upgrade-chat-fix_zh.md │ │ ├── 2025-08-19-feature-flags-in-docker-and-nuxt_zh.md │ │ ├── 2025-08-18-ui-improvements-and-chat-fixes_zh.md │ │ ├── 2025-08-25-docker-langchain-module-resolution-fix_zh.md │ │ ├── 2025-09-11-building-contextual-quick-chat-inspired-by-ai-ides_zh.md │ │ ├── 2025-08-26-model-api-refactoring-parallel-execution_zh.md │ │ ├── 2025-08-28-openai-langchain-image-parsing-fix_zh.md │ │ └── 2025-09-09-improving-ai-chat-experience-with-smart-title-generation_zh.md │ └── blog │ │ ├── 2025-09-16-instant-model-mentions.md │ │ ├── 2025-09-18-smart-quick-chat-dialog-positioning.md │ │ ├── 2025-08-19-feature-flags-in-docker-and-nuxt.md │ │ ├── 2025-08-18-ui-improvements-and-chat-fixes.md │ │ ├── 2025-08-25-langchain-upgrade-chat-fix.md │ │ ├── 2025-08-19-chatollama-deepagents-integration.md │ │ ├── 2025-09-09-improving-ai-chat-experience-with-smart-title-generation.md │ │ ├── 2025-08-25-docker-langchain-module-resolution-fix.md │ │ └── 2025-08-26-model-api-refactoring-parallel-execution.md ├── pages │ ├── blog │ │ ├── [...slug].astro │ │ └── index.astro │ ├── zh │ │ ├── blog │ │ │ ├── [...slug].astro │ │ │ └── index.astro │ │ └── index.astro │ └── index.astro ├── utils │ ├── blog.ts │ └── i18n.ts ├── components │ └── BlogCard.astro └── layouts │ ├── BlogLayout.astro │ └── BaseLayout.astro ├── astro.config.mjs ├── package.json ├── content ├── zh │ ├── 20250916-instant-model-mentions_zh.md │ ├── 20250819-chatollama-deepagents-integration_zh.md │ ├── 20250825-langchain-upgrade-chat-fix_zh.md │ ├── 20250819-feature-flags-in-docker-and-nuxt_zh.md │ ├── 20250818-ui-improvements-and-chat-fixes_zh.md │ ├── 20250825-docker-langchain-module-resolution-fix_zh.md │ ├── 20250826-model-api-refactoring-parallel-execution_zh.md │ └── 20250828-openai-langchain-image-parsing-fix_zh.md ├── 20250916-instant-model-mentions.md ├── 20250819-feature-flags-in-docker-and-nuxt.md ├── 20250818-ui-improvements-and-chat-fixes.md ├── 20250825-langchain-upgrade-chat-fix.md ├── 20250825-docker-langchain-module-resolution-fix.md ├── 20250826-model-api-refactoring-parallel-execution.md ├── 20250909-improving-ai-chat-experience-with-smart-title-generation.md └── 20250828-openai-langchain-image-parsing-fix.md └── tailwind.config.mjs /.gitignore: -------------------------------------------------------------------------------- 1 | node_modules 2 | .astro 3 | .DS_Store 4 | dist 5 | .env 6 | -------------------------------------------------------------------------------- /public/social_share.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/sugarforever/chat-ollama-blog/main/public/social_share.png -------------------------------------------------------------------------------- /.env.example: -------------------------------------------------------------------------------- 1 | # Base site settings 2 | SITE_URL=https://blog.chatollama.cloud 3 | # Set to true to enable draft previews in dev 4 | ENABLE_DRAFTS=false 5 | -------------------------------------------------------------------------------- /public/favicon.svg: 
-------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | -------------------------------------------------------------------------------- /tsconfig.json: -------------------------------------------------------------------------------- 1 | { 2 | "extends": "astro/tsconfigs/strict", 3 | "compilerOptions": { 4 | "baseUrl": ".", 5 | "paths": { 6 | "@/*": ["src/*"], 7 | "@/components/*": ["src/components/*"], 8 | "@/layouts/*": ["src/layouts/*"], 9 | "@/utils/*": ["src/utils/*"] 10 | } 11 | } 12 | } -------------------------------------------------------------------------------- /.markdownlint-cli2.cjs: -------------------------------------------------------------------------------- 1 | module.exports = { 2 | config: { 3 | default: true, 4 | MD013: false, 5 | MD009: false, 6 | MD022: false, 7 | MD031: false, 8 | MD032: false, 9 | MD025: false, 10 | MD036: false, 11 | MD040: false, 12 | MD041: false, 13 | MD047: false, 14 | MD026: false, 15 | }, 16 | ignores: ['src/content/**/*.mdx'], 17 | }; 18 | -------------------------------------------------------------------------------- /src/styles/global.css: -------------------------------------------------------------------------------- 1 | @import url('https://fonts.googleapis.com/css2?family=Inter:wght@400;500;600;700&display=swap'); 2 | 3 | @tailwind base; 4 | @tailwind components; 5 | @tailwind utilities; 6 | 7 | html { 8 | font-family: 'Inter', system-ui, sans-serif; 9 | } 10 | 11 | /* Custom scrollbar */ 12 | ::-webkit-scrollbar { 13 | width: 8px; 14 | } 15 | 16 | ::-webkit-scrollbar-track { 17 | background: #f1f1f1; 18 | } 19 | 20 | ::-webkit-scrollbar-thumb { 21 | background: #c1c1c1; 22 | border-radius: 4px; 23 | } 24 | 25 | ::-webkit-scrollbar-thumb:hover { 26 | background: #a8a8a8; 27 | } -------------------------------------------------------------------------------- /src/content/config.ts: -------------------------------------------------------------------------------- 1 | import { defineCollection, z } from 'astro:content'; 2 | 3 | const blogSchema = z.object({ 4 | title: z.string(), 5 | date: z.string().or(z.date()).optional(), 6 | feature: z.string().optional(), 7 | timeToShip: z.string().optional(), 8 | description: z.string().optional(), 9 | tags: z.array(z.string()).optional(), 10 | }); 11 | 12 | export const collections = { 13 | 'blog': defineCollection({ 14 | type: 'content', 15 | schema: blogSchema, 16 | }), 17 | 'blog-zh': defineCollection({ 18 | type: 'content', 19 | schema: blogSchema, 20 | }), 21 | }; -------------------------------------------------------------------------------- /astro.config.mjs: -------------------------------------------------------------------------------- 1 | import { defineConfig } from 'astro/config'; 2 | import mdx from '@astrojs/mdx'; 3 | import tailwind from '@astrojs/tailwind'; 4 | 5 | export default defineConfig({ 6 | site: 'https://blog.chatollama.cloud', 7 | integrations: [ 8 | mdx(), 9 | tailwind({ 10 | applyBaseStyles: false, 11 | }), 12 | ], 13 | markdown: { 14 | shikiConfig: { 15 | theme: 'github-light', 16 | wrap: true 17 | } 18 | }, 19 | i18n: { 20 | defaultLocale: "en", 21 | locales: ["en", "zh"], 22 | routing: { 23 | prefixDefaultLocale: false 24 | } 25 | } 26 | }); -------------------------------------------------------------------------------- /src/pages/blog/[...slug].astro: -------------------------------------------------------------------------------- 1 | --- 2 | import { getCollection } from 'astro:content'; 3 | import BlogLayout from 
'@/layouts/BlogLayout.astro'; 4 | 5 | export async function getStaticPaths() { 6 | const posts = await getCollection('blog'); 7 | return posts.map((post) => ({ 8 | params: { slug: post.slug }, 9 | props: post, 10 | })); 11 | } 12 | 13 | const post = Astro.props; 14 | const { Content } = await post.render(); 15 | --- 16 | 17 | 24 | 25 | -------------------------------------------------------------------------------- /src/pages/zh/blog/[...slug].astro: -------------------------------------------------------------------------------- 1 | --- 2 | import { getCollection } from 'astro:content'; 3 | import BlogLayout from '@/layouts/BlogLayout.astro'; 4 | 5 | export async function getStaticPaths() { 6 | const posts = await getCollection('blog-zh'); 7 | return posts.map((post) => ({ 8 | params: { slug: post.slug }, 9 | props: post, 10 | })); 11 | } 12 | 13 | const post = Astro.props; 14 | const { Content } = await post.render(); 15 | --- 16 | 17 | 24 | 25 | -------------------------------------------------------------------------------- /src/pages/zh/blog/index.astro: -------------------------------------------------------------------------------- 1 | --- 2 | import BaseLayout from '@/layouts/BaseLayout.astro'; 3 | import BlogCard from '@/components/BlogCard.astro'; 4 | import { getBlogPosts } from '@/utils/blog'; 5 | import { useTranslations } from '@/utils/i18n'; 6 | 7 | const t = useTranslations('zh'); 8 | const posts = await getBlogPosts('zh'); 9 | --- 10 | 11 | 12 |
13 |     <div> {/* markup below is a minimal reconstruction; original tags and class attributes were lost in extraction */}
14 |       <h1>{t('blog.allPosts')}</h1>
15 |       <p>
16 |         {posts.length} 篇关于人工智能、软件开发和创新的文章。
17 |       </p>
18 |     </div>
19 |
20 |     <div>
21 |       {posts.map((post) => (
22 |         <BlogCard post={post} />
23 |       ))}
24 |     </div>
25 |   </div>
26 | </BaseLayout>
-------------------------------------------------------------------------------- /src/pages/blog/index.astro: -------------------------------------------------------------------------------- 1 | --- 2 | import BaseLayout from '@/layouts/BaseLayout.astro'; 3 | import BlogCard from '@/components/BlogCard.astro'; 4 | import { getBlogPosts } from '@/utils/blog'; 5 | import { useTranslations } from '@/utils/i18n'; 6 | 7 | const t = useTranslations('en'); 8 | const posts = await getBlogPosts('en'); 9 | --- 10 | 11 | 12 |
13 |     <div> {/* markup below is a minimal reconstruction; original tags and class attributes were lost in extraction */}
14 |       <h1>{t('blog.allPosts')}</h1>
15 |       <p>
16 |         {posts.length} posts about AI, software development, and innovation.
17 |       </p>
18 |     </div>
19 |
20 |     <div>
21 |       {posts.map((post) => (
22 |         <BlogCard post={post} />
23 |       ))}
24 |     </div>
25 |   </div>
26 | </BaseLayout>
-------------------------------------------------------------------------------- /package.json: -------------------------------------------------------------------------------- 1 | { 2 | "name": "chat-ollama-blog", 3 | "version": "1.0.0", 4 | "description": "", 5 | "main": "index.js", 6 | "scripts": { 7 | "dev": "astro dev", 8 | "start": "astro dev", 9 | "build": "astro build", 10 | "preview": "astro preview", 11 | "astro": "astro" 12 | }, 13 | "repository": { 14 | "type": "git", 15 | "url": "git+https://github.com/sugarforever/chat-ollama-blog.git" 16 | }, 17 | "keywords": [], 18 | "author": "", 19 | "license": "ISC", 20 | "type": "commonjs", 21 | "bugs": { 22 | "url": "https://github.com/sugarforever/chat-ollama-blog/issues" 23 | }, 24 | "homepage": "https://github.com/sugarforever/chat-ollama-blog#readme", 25 | "dependencies": { 26 | "@astrojs/mdx": "^4.3.5", 27 | "@astrojs/tailwind": "^6.0.2", 28 | "@tailwindcss/typography": "^0.5.16", 29 | "@vercel/analytics": "^1.5.0", 30 | "astro": "^5.13.7", 31 | "tailwindcss": "^3.4.17" 32 | } 33 | } 34 | -------------------------------------------------------------------------------- /public/logo.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 21 | 22 | 23 | 24 | 25 | 26 | 27 | 28 | 29 | 30 | -------------------------------------------------------------------------------- /src/utils/blog.ts: -------------------------------------------------------------------------------- 1 | import { getCollection } from 'astro:content'; 2 | 3 | export interface BlogPost { 4 | id: string; 5 | slug: string; 6 | body: string; 7 | collection: string; 8 | data: { 9 | title: string; 10 | date: Date; 11 | feature?: string; 12 | timeToShip?: string; 13 | [key: string]: any; 14 | }; 15 | } 16 | 17 | export async function getBlogPosts(locale: 'en' | 'zh' = 'en'): Promise { 18 | try { 19 | const collection = locale === 'zh' ? 'blog-zh' : 'blog'; 20 | const posts = await getCollection(collection); 21 | 22 | return posts 23 | .map(post => ({ 24 | ...post, 25 | data: { 26 | ...post.data, 27 | date: new Date(post.data.date || extractDateFromFilename(post.id)) 28 | } 29 | })) 30 | .sort((a, b) => b.data.date.getTime() - a.data.date.getTime()); 31 | } catch (error) { 32 | console.warn(`No posts found for locale: ${locale}`); 33 | return []; 34 | } 35 | } 36 | 37 | export function extractDateFromFilename(filename: string): string { 38 | const match = filename.match(/(\d{4}-\d{2}-\d{2})/); 39 | return match ? match[1] : new Date().toISOString().split('T')[0]; 40 | } 41 | 42 | -------------------------------------------------------------------------------- /content/zh/20250916-instant-model-mentions_zh.md: -------------------------------------------------------------------------------- 1 | # 使用 @ 提及即时切换模型对话 2 | 3 | **日期:** 2025年9月16日 4 | **功能:** 在消息里直接点名模型,让下一条回复换成对应模型 5 | **上线耗时:** 约 1 天 6 | 7 | ## 🎯 为什么要做这个功能 8 | 9 | 长对话默认绑定同一个模型可以保持语境一致,但如果临时想问问别的模型,就必须反复打开设置面板切换: 10 | 11 | 1. 打开会话设置 12 | 2. 改掉默认模型 13 | 3. 发送问题等待回答 14 | 4. 再切回原来的默认模型 15 | 16 | 当你需要对比不同供应商、或者只想用某个模型补一句答案时,这套流程既慢又容易忘记切回来。我们希望它像标记同事一样轻松。 17 | 18 | ## 💡 功能概述 19 | 20 | 现在在消息中输入 `@模型名` 就能临时“劫持”本次请求,回复会来自被点名的模型,而会话默认模型完全不动。 21 | 22 | - 提及单个模型(例如 `@gpt-4o-mini`)即可只改动本条信息。 23 | - 连续提及多个模型(例如 `@openrouter/claude-3.5-sonnet @llama3`)可以一次性并行提问。 24 | - 不写 `@` 时仍使用会话默认模型,体验与之前一致。 25 | 26 | 输入框在你键入 `@` 后会弹出模型家族与实时搜索,并支持键盘导航,不必死记硬背模型 ID。 27 | 28 | ## 🔍 核心实现细节 29 | 30 | ### 1. 
解析提及同时保持提示干净 31 | `ChatInputBox.vue` 在用户输入时同步解析提及,将结果记录在 `hijackedModels`,并把原始文本里的 `@模型` 去掉,生成 `sanitizedContent`。服务器收到的就是这份干净内容,模型提示里不会留下 `@claude` 一类的符号。 32 | 33 | ### 2. 单条消息生效的覆盖策略 34 | `Chat.vue` 在发送前先看 `hijackedModels` 是否存在。一旦检测到,就只对本次请求临时替换模型;会话侧栏的默认配置完全不会被修改。消息历史也会使用 `sanitizedContent`,确保回放时内容干净。 35 | 36 | ### 3. 提及在界面上是“一等公民” 37 | 我们更新了 `ModelMentionText.vue`,无论是简单模型名还是 `openrouter/claude-3.5-sonnet` 这样的命名空间,都能渲染成统一的徽标。自动生成标题的逻辑同样读取去除提及后的文本,不会把对话命名成“@gpt-4o mini 讨论”。 38 | 39 | ## ✅ 最终效果 40 | 41 | - 一键临时切换模型,默认配置安全无副作用。 42 | - 键盘即可操作,适合高频对比不同模型。 43 | - 消息记录与模型提示保持整洁,即使用户频繁提及模型。 44 | 45 | 现在就试试:在输入框里输入 `@`,选择一个模型,享受无阻力的模型对比体验。 46 | -------------------------------------------------------------------------------- /src/content/blog-zh/2025-09-16-instant-model-mentions_zh.md: -------------------------------------------------------------------------------- 1 | --- 2 | title: "使用 @ 提及即时切换模型对话" 3 | date: "2025-09-16" 4 | description: "Blog post about 使用 @ 提及即时切换模型对话" 5 | --- 6 | 7 | 8 | **日期:** 2025年9月16日 9 | **功能:** 在消息里直接点名模型,让下一条回复换成对应模型 10 | **上线耗时:** 约 1 天 11 | 12 | ## 🎯 为什么要做这个功能 13 | 14 | 长对话默认绑定同一个模型可以保持语境一致,但如果临时想问问别的模型,就必须反复打开设置面板切换: 15 | 16 | 1. 打开会话设置 17 | 2. 改掉默认模型 18 | 3. 发送问题等待回答 19 | 4. 再切回原来的默认模型 20 | 21 | 当你需要对比不同供应商、或者只想用某个模型补一句答案时,这套流程既慢又容易忘记切回来。我们希望它像标记同事一样轻松。 22 | 23 | ## 💡 功能概述 24 | 25 | 现在在消息中输入 `@模型名` 就能临时“劫持”本次请求,回复会来自被点名的模型,而会话默认模型完全不动。 26 | 27 | - 提及单个模型(例如 `@gpt-4o-mini`)即可只改动本条信息。 28 | - 连续提及多个模型(例如 `@openrouter/claude-3.5-sonnet @llama3`)可以一次性并行提问。 29 | - 不写 `@` 时仍使用会话默认模型,体验与之前一致。 30 | 31 | 输入框在你键入 `@` 后会弹出模型家族与实时搜索,并支持键盘导航,不必死记硬背模型 ID。 32 | 33 | ## 🔍 核心实现细节 34 | 35 | ### 1. 解析提及同时保持提示干净 36 | `ChatInputBox.vue` 在用户输入时同步解析提及,将结果记录在 `hijackedModels`,并把原始文本里的 `@模型` 去掉,生成 `sanitizedContent`。服务器收到的就是这份干净内容,模型提示里不会留下 `@claude` 一类的符号。 37 | 38 | ### 2. 单条消息生效的覆盖策略 39 | `Chat.vue` 在发送前先看 `hijackedModels` 是否存在。一旦检测到,就只对本次请求临时替换模型;会话侧栏的默认配置完全不会被修改。消息历史也会使用 `sanitizedContent`,确保回放时内容干净。 40 | 41 | ### 3. 提及在界面上是“一等公民” 42 | 我们更新了 `ModelMentionText.vue`,无论是简单模型名还是 `openrouter/claude-3.5-sonnet` 这样的命名空间,都能渲染成统一的徽标。自动生成标题的逻辑同样读取去除提及后的文本,不会把对话命名成“@gpt-4o mini 讨论”。 43 | 44 | ## ✅ 最终效果 45 | 46 | - 一键临时切换模型,默认配置安全无副作用。 47 | - 键盘即可操作,适合高频对比不同模型。 48 | - 消息记录与模型提示保持整洁,即使用户频繁提及模型。 49 | 50 | 现在就试试:在输入框里输入 `@`,选择一个模型,享受无阻力的模型对比体验。 51 | -------------------------------------------------------------------------------- /src/content/blog-zh/2025-09-18-smart-quick-chat-dialog-positioning_zh.md: -------------------------------------------------------------------------------- 1 | --- 2 | title: "智能快速聊天对话框定位:更好的用户体验" 3 | date: "2025-09-18" 4 | description: "ChatOllama 快速聊天功能的重大改进,具备智能对话框定位和增强的视口感知能力" 5 | --- 6 | 7 | 我们刚刚推出了 ChatOllama 快速聊天功能的重大改进,解决了用户在屏幕边缘选择文本时遇到的常见问题。快速聊天对话框现在可以智能定位,确保始终保持在视口内,同时为 AI 回复提供更多空间。 8 | 9 | ## 问题所在 10 | 11 | 之前,当用户在屏幕右下角或视口边缘附近选择文本时,快速聊天对话框会部分出现在可见区域之外或完全被截断。这使得阅读 AI 回复和与对话框交互变得困难。此外,对话框相当狭窄(320px),限制了可以舒适显示的文本量。 12 | 13 | ## 解决方案 14 | 15 | 我们的新智能定位算法通过几个关键改进解决了这些问题: 16 | 17 | ### 1. 智能定位逻辑 18 | 19 | 对话框现在遵循复杂的定位策略: 20 | 21 | - **水平定位**:首先尝试定位在选定文本的右侧,如果空间不足则定位在左侧,如果两侧都不行则水平居中 22 | - **垂直定位**:首先尝试定位在选择区域下方,如果需要则定位在上方,最后选择垂直居中 23 | - **视口感知**:始终确保对话框保持在屏幕边界内,具有适当的边距 24 | 25 | ### 2. 更大的对话框尺寸 26 | 27 | - **宽度增加**:从 320px 增加到 480px,提高可读性 28 | - **动态高度**:根据回复内容长度自动调整 29 | - **回复区域**:最大高度从 160px 增加到 320px 30 | - **更好的排版**:回复文本大小从超小号增加到小号,提高可读性 31 | 32 | ### 3. 
动态内容适应 33 | 34 | 对话框现在根据 AI 回复长度计算最佳尺寸,确保较长的回复有足够的空间,同时保持较短回复的紧凑性。 35 | 36 | ## 技术实现 37 | 38 | 定位算法使用几个关键常量: 39 | 40 | ```typescript 41 | const DIALOG_WIDTH = 480 // 从 320px 增加 42 | const DIALOG_MIN_HEIGHT = 280 43 | const DIALOG_MAX_HEIGHT = 600 // 回复较长时的最大高度 44 | const VIEWPORT_PADDING = 20 45 | const OFFSET_FROM_SELECTION = 10 46 | ``` 47 | 48 | 智能定位逻辑确保对话框: 49 | - 与视口边缘保持 20px 边距 50 | - 与选定文本保持 10px 距离 51 | - 根据回复内容动态调整高度 52 | - 永远不会被截断或出现在可见区域之外 53 | 54 | ## 对用户体验的影响 55 | 56 | 这些改进带来了几个实质性的好处: 57 | 58 | 1. **更好的可访问性**:用户现在可以在屏幕的任何地方选择文本,无需担心对话框定位问题 59 | 2. **改善的可读性**:更大的对话框和文本大小使 AI 回复更容易阅读 60 | 3. **更智能的行为**:对话框自动适应不同的屏幕尺寸和选择位置 -------------------------------------------------------------------------------- /tailwind.config.mjs: -------------------------------------------------------------------------------- 1 | /** @type {import('tailwindcss').Config} */ 2 | export default { 3 | content: ['./src/**/*.{astro,html,js,jsx,md,mdx,svelte,ts,tsx,vue}'], 4 | theme: { 5 | extend: { 6 | fontFamily: { 7 | mono: ['SF Mono', 'Monaco', 'Inconsolata', 'Fira Code', 'Consolas', 'monospace'], 8 | sans: ['Inter', '-apple-system', 'BlinkMacSystemFont', 'sans-serif'], 9 | }, 10 | typography: { 11 | DEFAULT: { 12 | css: { 13 | maxWidth: '65ch', 14 | color: '#000', 15 | a: { 16 | color: '#000', 17 | textDecorationLine: 'underline', 18 | textDecorationColor: '#666', 19 | '&:hover': { 20 | textDecorationColor: '#000', 21 | }, 22 | }, 23 | 'h1,h2,h3,h4': { 24 | color: '#000', 25 | }, 26 | code: { 27 | color: '#000', 28 | backgroundColor: '#f5f5f5', 29 | padding: '0.2em 0.4em', 30 | borderRadius: '0.25rem', 31 | fontWeight: '400', 32 | }, 33 | 'code::before': { 34 | content: '""' 35 | }, 36 | 'code::after': { 37 | content: '""' 38 | }, 39 | pre: { 40 | backgroundColor: '#f8f8f8', 41 | border: '1px solid #e5e5e5', 42 | }, 43 | blockquote: { 44 | borderLeftColor: '#000', 45 | color: '#666', 46 | }, 47 | }, 48 | }, 49 | }, 50 | }, 51 | }, 52 | plugins: [ 53 | require('@tailwindcss/typography'), 54 | ], 55 | } -------------------------------------------------------------------------------- /src/pages/zh/index.astro: -------------------------------------------------------------------------------- 1 | --- 2 | import BaseLayout from '@/layouts/BaseLayout.astro'; 3 | import BlogCard from '@/components/BlogCard.astro'; 4 | import { getBlogPosts } from '@/utils/blog'; 5 | import { useTranslations } from '@/utils/i18n'; 6 | 7 | const t = useTranslations('zh'); 8 | const posts = await getBlogPosts('zh'); 9 | const latestPosts = posts.slice(0, 6); 10 | --- 11 | 12 | 13 |
14 |   <div> {/* minimal reconstruction; original classes, link hrefs, and icon markup were lost in extraction */}
15 |     <h1>
16 |       {t('site.subtitle')}
17 |     </h1>
18 |     <p>
19 |       {t('meta.description')}
20 |     </p>
21 |     <div>
22 |       <a> {/* href lost */}
23 |         体验 ChatOllama
24 |       </a>
25 |       {/* original lines 25–28: icon links; markup lost */}
26 |     </div>
27 |   </div>
28 |
29 |   <div>
30 |     <div>
31 |       <h2>
32 |         {t('blog.latestPosts')}
33 |       </h2>
34 |       <a> {/* href lost */}
35 |         {t('blog.allPosts')} →
36 |       </a>
37 |     </div>
38 |
39 |
40 |     <div>
41 |       {latestPosts.map((post) => (
42 |         <BlogCard post={post} />
43 |       ))}
44 |     </div>
45 |   </div>
46 | </BaseLayout>
-------------------------------------------------------------------------------- /src/pages/index.astro: -------------------------------------------------------------------------------- 1 | --- 2 | import BaseLayout from '@/layouts/BaseLayout.astro'; 3 | import BlogCard from '@/components/BlogCard.astro'; 4 | import { getBlogPosts } from '@/utils/blog'; 5 | import { useTranslations } from '@/utils/i18n'; 6 | 7 | const t = useTranslations('en'); 8 | const posts = await getBlogPosts('en'); 9 | const latestPosts = posts.slice(0, 6); 10 | --- 11 | 12 | 13 |
14 |   <div> {/* minimal reconstruction; original classes, link hrefs, and icon markup were lost in extraction */}
15 |     <h1>
16 |       {t('site.subtitle')}
17 |     </h1>
18 |     <p>
19 |       {t('meta.description')}
20 |     </p>
21 |     <div>
22 |       <a> {/* href lost */}
23 |         Try ChatOllama
24 |       </a>
25 |       {/* original lines 25–28: icon links; markup lost */}
26 |     </div>
27 |   </div>
28 |
29 |   <div>
30 |     <div>
31 |       <h2>
32 |         {t('blog.latestPosts')}
33 |       </h2>
34 |       <a> {/* href lost */}
35 |         {t('blog.allPosts')} →
36 |       </a>
37 |     </div>
38 |
39 |
40 |     <div>
41 |       {latestPosts.map((post) => (
42 |         <BlogCard post={post} />
43 |       ))}
44 |     </div>
45 |   </div>
46 | </BaseLayout>
-------------------------------------------------------------------------------- /src/components/BlogCard.astro: -------------------------------------------------------------------------------- 1 | --- 2 | import { formatDate, getLangFromUrl, useTranslations, type Locale } from '@/utils/i18n'; 3 | import type { BlogPost } from '@/utils/blog'; 4 | 5 | export interface Props { 6 | post: BlogPost; 7 | } 8 | 9 | const { post } = Astro.props; 10 | const lang = getLangFromUrl(Astro.url) as Locale; 11 | const t = useTranslations(lang); 12 | 13 | const href = lang === 'en' ? `/blog/${post.slug}` : `/zh/blog/${post.slug}`; 14 | --- 15 | 16 |
17 | <article> {/* minimal reconstruction; original classes and some elements were lost in extraction */}
18 |   <div>
19 |     <a href={href}>
20 |       {post.data.title}
21 |     </a>
22 |   </div>
23 |
24 |   <div>
25 |     <time>
26 |       {formatDate(post.data.date, lang)} {/* assumed call; formatDate is imported but its original call site was lost */}
27 |     </time>
28 |     {post.data.feature && (
29 |       <span>
30 |         {post.data.feature}
31 |       </span>
32 |     )}
33 |     {post.data.timeToShip && (
34 |       <span>
35 |         {post.data.timeToShip}
36 |       </span>
37 |     )}
38 |   </div>
39 |
40 |
41 |   {post.data.description && (
42 |     <p>
43 |       {post.data.description}
44 |     </p>
45 |   )}
46 |
47 |   {/* original lines 47–57: card footer lost; the ui strings suggest a t('blog.readMore') link to {href} */}
58 | </article>
-------------------------------------------------------------------------------- /src/utils/i18n.ts: -------------------------------------------------------------------------------- 1 | export type Locale = 'en' | 'zh'; 2 | 3 | export const languages = { 4 | en: 'English', 5 | zh: '中文' 6 | }; 7 | 8 | export const defaultLang: Locale = 'en'; 9 | 10 | export const ui = { 11 | en: { 12 | 'nav.home': 'Home', 13 | 'nav.blog': 'Blog', 14 | 'nav.about': 'About', 15 | 'nav.project': 'ChatOllama', 16 | 'blog.readMore': 'Read more', 17 | 'blog.allPosts': 'All Posts', 18 | 'blog.latestPosts': 'Latest Posts', 19 | 'blog.publishedOn': 'Published on', 20 | 'meta.description': 'Official blog of ChatOllama - Open source chatbot platform with AI agents, knowledge bases, and multi-modal chat', 21 | 'lang.switch': 'Switch to Chinese', 22 | 'site.title': 'ChatOllama Blog', 23 | 'site.subtitle': 'Updates, features, and insights from the ChatOllama team', 24 | }, 25 | zh: { 26 | 'nav.home': '首页', 27 | 'nav.blog': '博客', 28 | 'nav.about': '关于', 29 | 'nav.project': 'ChatOllama', 30 | 'blog.readMore': '阅读更多', 31 | 'blog.allPosts': '所有文章', 32 | 'blog.latestPosts': '最新文章', 33 | 'blog.publishedOn': '发布于', 34 | 'meta.description': 'ChatOllama 官方博客 - 开源聊天机器人平台,支持AI代理、知识库和多模态聊天', 35 | 'lang.switch': 'Switch to English', 36 | 'site.title': 'ChatOllama 博客', 37 | 'site.subtitle': 'ChatOllama 团队的更新、功能和见解', 38 | } 39 | } as const; 40 | 41 | export function getLangFromUrl(url: URL): Locale { 42 | const [, lang] = url.pathname.split('/'); 43 | if (lang in ui) return lang as Locale; 44 | return defaultLang; 45 | } 46 | 47 | export function useTranslations(lang: Locale) { 48 | return function t(key: keyof typeof ui[typeof defaultLang]) { 49 | return ui[lang][key] || ui[defaultLang][key]; 50 | } 51 | } 52 | 53 | export function formatDate(date: Date, locale: Locale = 'en'): string { 54 | return new Intl.DateTimeFormat(locale === 'zh' ? 'zh-CN' : 'en-US', { 55 | year: 'numeric', 56 | month: 'long', 57 | day: 'numeric' 58 | }).format(date); 59 | } -------------------------------------------------------------------------------- /content/zh/20250819-chatollama-deepagents-integration_zh.md: -------------------------------------------------------------------------------- 1 | # ChatOllama 集成 DeepAgents:为开源 AI 聊天带来深度研究能力 2 | 3 | 大家好!今天想和大家分享一个令人兴奋的更新 —— 我为 ChatOllama 集成了 DeepAgents,这让我们的开源 AI 聊天应用具备了强大的深度研究能力。 4 | 5 | ## 什么是 DeepAgents? 6 | 7 | 在开始之前,让我先介绍一下 DeepAgents。传统的 AI 智能体通常采用简单的"LLM + 工具调用"模式,虽然能完成基本任务,但在面对复杂、多步骤的研究工作时往往力不从心。这些"浅层"智能体缺乏规划能力,无法有效地分解和执行复杂任务。 8 | 9 | DeepAgents 的出现改变了这一现状。它借鉴了 Claude Code、Deep Research 等成功应用的设计理念,通过四个核心组件构建真正"深度"的智能体: 10 | 11 | - **🎯 规划工具**:帮助智能体制定和跟踪结构化计划 12 | - **🤖 子智能体**:专门处理特定任务,实现上下文隔离 13 | - **📁 文件系统**:提供持久化状态管理 14 | - **📝 精细提示**:基于成功案例优化的系统提示 15 | 16 | 这种架构让智能体能够像人类研究员一样工作:分解复杂问题、制定研究计划、调用专门工具、整理和分析信息,最终产出高质量的研究报告。 17 | 18 | ## 为什么选择集成到 ChatOllama? 19 | 20 | 作为一个专注于本地化 AI 体验的开源项目,ChatOllama 一直致力于为用户提供强大而易用的 AI 工具。DeepAgents 的加入让我们能够: 21 | 22 | ### 1. **提供专业级研究能力** 23 | 现在用户可以直接在 ChatOllama 中进行深度研究,智能体会自动: 24 | - 制定研究计划 25 | - 搜索相关信息 26 | - 分析和整合数据 27 | - 生成结构化报告 28 | 29 | ### 2. **无缝的 MCP 集成** 30 | DeepAgents 原生支持 MCP(模型上下文协议),这意味着集成过程异常顺畅。我们只需要: 31 | ```javascript 32 | // 简单的集成代码 33 | const agent = createDeepAgent({ 34 | tools: mcpTools, 35 | instructions: researchInstructions 36 | }) 37 | ``` 38 | 39 | ### 3. 
**保持开源精神** 40 | DeepAgents 本身就是开源的,这与 ChatOllama 的理念完美契合。用户可以完全控制自己的数据和研究过程。 41 | 42 | ## 技术实现亮点 43 | 44 | ### 智能的流式处理 45 | 我们实现了服务器端的智能内容处理,确保: 46 | - AI 响应内容在服务器端累积,避免客户端的复杂逻辑 47 | - 每个对话轮次使用唯一 UUID 分组,保持上下文清晰 48 | - 工具调用结果以可折叠的 UI 组件展示,用户体验更佳 49 | 50 | ### 工具调用可视化 51 | 当智能体使用工具时,用户可以清楚地看到: 52 | - 调用了哪个工具(搜索、浏览器、文件操作等) 53 | - 工具的执行结果 54 | - 可以展开查看详细信息 55 | 56 | ### 多语言支持 57 | 我们为新功能添加了完整的中英文支持,确保不同语言用户都能获得良好体验。 58 | 59 | ## 实际使用场景 60 | 61 | 想象一下这些使用场景: 62 | 63 | **学术研究**:询问"帮我研究一下量子计算在密码学中的应用",智能体会自动搜索最新论文、分析技术趋势、整理关键观点。 64 | 65 | **市场分析**:请求"分析一下 2024 年 AI 芯片市场的竞争格局",智能体会收集市场数据、分析竞争对手、生成详细报告。 66 | 67 | **技术调研**:提问"比较不同的容器编排方案",智能体会研究各种方案的优缺点、使用场景、最佳实践。 68 | 69 | ## 开发体验 70 | 71 | 得益于 DeepAgents 优秀的架构设计和 MCP 的标准化,整个集成过程非常顺畅: 72 | 73 | 1. **快速集成**:几行代码就能启用深度研究功能 74 | 2. **灵活配置**:可以根据需要调整智能体的指令和工具 75 | 3. **易于扩展**:通过 MCP 可以轻松添加新的工具和能力 76 | 77 | ## 未来展望 78 | 79 | 这只是开始。接下来我们计划: 80 | - 添加更多专业领域的研究模板 81 | - 支持自定义研究工作流 82 | - 集成更多专业工具和数据源 83 | - 优化长时间研究任务的性能 84 | 85 | ## 总结 86 | 87 | DeepAgents 的集成为 ChatOllama 带来了质的飞跃。我们不再只是一个简单的聊天工具,而是成为了一个强大的研究助手。这种能力的提升,加上开源的特性和本地化的优势,让 ChatOllama 在 AI 应用领域更具竞争力。 88 | 89 | 如果你对这个功能感兴趣,欢迎试用最新版本的 ChatOllama,体验 AI 深度研究的魅力。也欢迎在 GitHub 上给我们反馈,让我们一起把这个功能做得更好! 90 | 91 | --- 92 | 93 | *ChatOllama 是一个开源的本地 AI 聊天应用,致力于为用户提供私密、强大、易用的 AI 体验。* 94 | -------------------------------------------------------------------------------- /src/content/blog-zh/2025-08-19-chatollama-deepagents-integration_zh.md: -------------------------------------------------------------------------------- 1 | --- 2 | title: "ChatOllama 集成 DeepAgents:为开源 AI 聊天带来深度研究能力" 3 | date: "2025-08-19" 4 | description: "Blog post about ChatOllama 集成 DeepAgents:为开源 AI 聊天带来深度研究能力" 5 | --- 6 | 7 | 8 | 大家好!今天想和大家分享一个令人兴奋的更新 —— 我为 ChatOllama 集成了 DeepAgents,这让我们的开源 AI 聊天应用具备了强大的深度研究能力。 9 | 10 | ## 什么是 DeepAgents? 11 | 12 | 在开始之前,让我先介绍一下 DeepAgents。传统的 AI 智能体通常采用简单的"LLM + 工具调用"模式,虽然能完成基本任务,但在面对复杂、多步骤的研究工作时往往力不从心。这些"浅层"智能体缺乏规划能力,无法有效地分解和执行复杂任务。 13 | 14 | DeepAgents 的出现改变了这一现状。它借鉴了 Claude Code、Deep Research 等成功应用的设计理念,通过四个核心组件构建真正"深度"的智能体: 15 | 16 | - **🎯 规划工具**:帮助智能体制定和跟踪结构化计划 17 | - **🤖 子智能体**:专门处理特定任务,实现上下文隔离 18 | - **📁 文件系统**:提供持久化状态管理 19 | - **📝 精细提示**:基于成功案例优化的系统提示 20 | 21 | 这种架构让智能体能够像人类研究员一样工作:分解复杂问题、制定研究计划、调用专门工具、整理和分析信息,最终产出高质量的研究报告。 22 | 23 | ## 为什么选择集成到 ChatOllama? 24 | 25 | 作为一个专注于本地化 AI 体验的开源项目,ChatOllama 一直致力于为用户提供强大而易用的 AI 工具。DeepAgents 的加入让我们能够: 26 | 27 | ### 1. **提供专业级研究能力** 28 | 现在用户可以直接在 ChatOllama 中进行深度研究,智能体会自动: 29 | - 制定研究计划 30 | - 搜索相关信息 31 | - 分析和整合数据 32 | - 生成结构化报告 33 | 34 | ### 2. **无缝的 MCP 集成** 35 | DeepAgents 原生支持 MCP(模型上下文协议),这意味着集成过程异常顺畅。我们只需要: 36 | ```javascript 37 | // 简单的集成代码 38 | const agent = createDeepAgent({ 39 | tools: mcpTools, 40 | instructions: researchInstructions 41 | }) 42 | ``` 43 | 44 | ### 3. **保持开源精神** 45 | DeepAgents 本身就是开源的,这与 ChatOllama 的理念完美契合。用户可以完全控制自己的数据和研究过程。 46 | 47 | ## 技术实现亮点 48 | 49 | ### 智能的流式处理 50 | 我们实现了服务器端的智能内容处理,确保: 51 | - AI 响应内容在服务器端累积,避免客户端的复杂逻辑 52 | - 每个对话轮次使用唯一 UUID 分组,保持上下文清晰 53 | - 工具调用结果以可折叠的 UI 组件展示,用户体验更佳 54 | 55 | ### 工具调用可视化 56 | 当智能体使用工具时,用户可以清楚地看到: 57 | - 调用了哪个工具(搜索、浏览器、文件操作等) 58 | - 工具的执行结果 59 | - 可以展开查看详细信息 60 | 61 | ### 多语言支持 62 | 我们为新功能添加了完整的中英文支持,确保不同语言用户都能获得良好体验。 63 | 64 | ## 实际使用场景 65 | 66 | 想象一下这些使用场景: 67 | 68 | **学术研究**:询问"帮我研究一下量子计算在密码学中的应用",智能体会自动搜索最新论文、分析技术趋势、整理关键观点。 69 | 70 | **市场分析**:请求"分析一下 2024 年 AI 芯片市场的竞争格局",智能体会收集市场数据、分析竞争对手、生成详细报告。 71 | 72 | **技术调研**:提问"比较不同的容器编排方案",智能体会研究各种方案的优缺点、使用场景、最佳实践。 73 | 74 | ## 开发体验 75 | 76 | 得益于 DeepAgents 优秀的架构设计和 MCP 的标准化,整个集成过程非常顺畅: 77 | 78 | 1. **快速集成**:几行代码就能启用深度研究功能 79 | 2. 
**灵活配置**:可以根据需要调整智能体的指令和工具 80 | 3. **易于扩展**:通过 MCP 可以轻松添加新的工具和能力 81 | 82 | ## 未来展望 83 | 84 | 这只是开始。接下来我们计划: 85 | - 添加更多专业领域的研究模板 86 | - 支持自定义研究工作流 87 | - 集成更多专业工具和数据源 88 | - 优化长时间研究任务的性能 89 | 90 | ## 总结 91 | 92 | DeepAgents 的集成为 ChatOllama 带来了质的飞跃。我们不再只是一个简单的聊天工具,而是成为了一个强大的研究助手。这种能力的提升,加上开源的特性和本地化的优势,让 ChatOllama 在 AI 应用领域更具竞争力。 93 | 94 | 如果你对这个功能感兴趣,欢迎试用最新版本的 ChatOllama,体验 AI 深度研究的魅力。也欢迎在 GitHub 上给我们反馈,让我们一起把这个功能做得更好! 95 | 96 | --- 97 | 98 | *ChatOllama 是一个开源的本地 AI 聊天应用,致力于为用户提供私密、强大、易用的 AI 体验。* 99 | -------------------------------------------------------------------------------- /content/zh/20250825-langchain-upgrade-chat-fix_zh.md: -------------------------------------------------------------------------------- 1 | # LangChain 核心包版本升级导致聊天功能中断:快速修复记录 2 | 3 | **日期:** 2025年8月25日 4 | **问题:** LangChain 依赖升级后聊天功能中断 5 | **解决时间:** 约4小时 6 | 7 | ## 🐛 问题描述 8 | 9 | 原本是一次常规的 `LangChain` 依赖升级(`0.3.49` -> `0.3.72`),目的是解决 Docker 模块解析问题,但很快就演变成了一个严重的事故。在升级 LangChain 包之后,整个平台的聊天功能完全停止工作。用户无法发送消息或从任何 AI 模型获得响应,这实际上使得 ChatOllama 的核心功能完全不可用。 10 | 11 | 这个问题特别令人沮丧,因为在升级过程中没有明显的错误消息或警告。应用程序正常启动,但每次聊天尝试都会静默失败。 12 | 13 | ## 🔍 根本原因调查 14 | 15 | 通过深入研究日志和跟踪代码,我们发现 LangChain 升级在聊天模型构造函数中引入了破坏性的 API 更改。使这个问题特别棘手的是,这些不是编译时错误——旧的参数名称被简单地忽略了,导致模型使用未定义的配置进行初始化。 16 | 17 | 在 LangChain 升级过程中,ChatOpenAI 模型构造函数中的参数名称发生了一些变化。虽然仅仅被标记为 `deprecated`,但参数在下游的使用中已经发生了变化。deprecated 参数包括: 18 | 19 | - `modelName` 20 | - `openAIApiKey` 21 | 22 | 这些破坏性更改影响了多个模型提供商,每个都需要特定的参数名称更新: 23 | 24 | ### 修复前(有效的): 25 | ```typescript 26 | new ChatOpenAI({ 27 | configuration: { baseURL }, 28 | openAIApiKey: params.key, // ❌ 已弃用 29 | modelName: modelName, // ❌ 已弃用 30 | }) 31 | 32 | new ChatAnthropic({ 33 | anthropicApiUrl: endpoint, 34 | anthropicApiKey: params.key, // ❌ 已弃用 35 | modelName: modelName, // ❌ 已弃用 36 | }) 37 | ``` 38 | 39 | ### 修复后(已修复): 40 | ```typescript 41 | new ChatOpenAI({ 42 | configuration: { baseURL }, 43 | apiKey: params.key, // ✅ 新 API 44 | model: modelName, // ✅ 新 API 45 | }) 46 | 47 | new ChatAnthropic({ 48 | anthropicApiUrl: endpoint, 49 | apiKey: params.key, // ✅ 新 API 50 | model: modelName, // ✅ 新 API 51 | }) 52 | ``` 53 | 54 | ## 🔧 修复实施 55 | 56 | 一旦我们确定了根本原因,修复就相对简单,但需要仔细注意细节。我们需要在所有受影响的模型提供商中更新参数名称,同时确保向后兼容性并添加更好的错误处理。 57 | 58 | 以下模型需要更新: 59 | - **OpenAI (ChatOpenAI)** - 最常用的提供商 60 | - **Anthropic (ChatAnthropic)** - AI 代理功能的关键组件 61 | - **Gemini (ChatGoogleGenerativeAI)** - 用于多模态功能 62 | - **Groq (ChatGroq)** - 高性能推理选项 63 | 64 | 实施的关键更改包括: 65 | 1. 将 `openAIApiKey` 和 `anthropicApiKey` 标准化为统一的 `apiKey` 参数 66 | 2. 在所有提供商中将 `modelName` 更新为更简洁的 `model` 参数 67 | 3. 
增强错误处理,在配置缺失时提供清晰的反馈 68 | 69 | 除了修复参数名称,我们还借此机会添加了强大的回退逻辑。现在,当外部 API 提供商由于缺少密钥或配置问题而失败时,系统会优雅地回退到 Ollama,确保用户即使在首选提供商配置错误的情况下也能继续聊天。 70 | 71 | ## 📚 经验教训 72 | 73 | 这次事件强化了在生产应用程序中管理依赖项的几个重要原则: 74 | 75 | **主要升级后彻底测试:** 即使看似微小的版本更新也可能引入不明显的破坏性更改。对所有功能进行全面测试是必要的,不仅仅是您期望受到影响的区域。 76 | 77 | **拥抱 API 标准化:** 虽然最初会造成干扰,但 LangChain 在提供商之间标准化参数名称的举措是一个积极的长期变化,将减少混乱并使代码库更易于维护。 78 | 79 | **始终实施优雅降级:** 拥有强大的回退机制不仅仅是良好的实践——当外部依赖项失败或意外更改时,这对于维护用户信任至关重要。 80 | 81 | ## 🚀 影响和解决方案 82 | 83 | 修复在识别后立即部署,为用户实现了零停机时间。更新的实现在利用新的标准化 API 的同时保持完全的向后兼容性。作为额外的好处,增强的错误处理和回退机制实际上提高了聊天系统的整体可靠性。 84 | 85 | 这次事件提醒我们,在 AI 和机器学习库快速发展的世界中,保持依赖项的最新状态需要持续的警惕和彻底的测试实践。 86 | 87 | --- 88 | 89 | *这是主要升级中"静默"破坏性更改的典型案例——这种情况使经验丰富的开发人员总是会仔细阅读变更日志两遍。一旦确定,修复就很简单,但这次经历突出了为什么我们永远不会把看似常规的更新视为理所当然。* 90 | -------------------------------------------------------------------------------- /src/layouts/BlogLayout.astro: -------------------------------------------------------------------------------- 1 | --- 2 | import BaseLayout from './BaseLayout.astro'; 3 | import { formatDate, getLangFromUrl, useTranslations, type Locale } from '@/utils/i18n'; 4 | 5 | export interface Props { 6 | title: string; 7 | date: Date; 8 | feature?: string; 9 | timeToShip?: string; 10 | description?: string; 11 | } 12 | 13 | const { title, date, feature, timeToShip, description } = Astro.props; 14 | const lang = getLangFromUrl(Astro.url) as Locale; 15 | const t = useTranslations(lang); 16 | 17 | // Enhanced title for blog posts 18 | const fullTitle = `${title} | ChatOllama Blog`; 19 | const blogDescription = description || `${title} - Updates and insights from the ChatOllama team`; 20 | --- 21 | 22 | 23 |
24 |   <article> {/* minimal reconstruction; original classes were lost in extraction */}
25 |     <h1>
26 |       {title}
27 |     </h1>
28 |
29 |     <div>
30 |       <time>
31 |         {formatDate(date, lang)} {/* assumed call; the original date markup was lost */}
32 |       </time>
33 |       {feature && (
34 |         <span>
35 |           {feature}
36 |         </span>
37 |       )}
38 |       {timeToShip && (
39 |         <span>
40 |           {timeToShip}
41 |         </span>
42 |       )}
43 |     </div>
44 |
45 |     <div>
46 |       <slot /> {/* the rendered markdown body goes here; the original wrapper was lost */}
47 |     </div>
48 |   </article>
49 | 50 | -------------------------------------------------------------------------------- /src/content/blog-zh/2025-08-25-langchain-upgrade-chat-fix_zh.md: -------------------------------------------------------------------------------- 1 | --- 2 | title: "LangChain 核心包版本升级导致聊天功能中断:快速修复记录" 3 | date: "2025-08-25" 4 | description: "Blog post about LangChain 核心包版本升级导致聊天功能中断:快速修复记录" 5 | --- 6 | 7 | 8 | **日期:** 2025年8月25日 9 | **问题:** LangChain 依赖升级后聊天功能中断 10 | **解决时间:** 约4小时 11 | 12 | ## 🐛 问题描述 13 | 14 | 原本是一次常规的 `LangChain` 依赖升级(`0.3.49` -> `0.3.72`),目的是解决 Docker 模块解析问题,但很快就演变成了一个严重的事故。在升级 LangChain 包之后,整个平台的聊天功能完全停止工作。用户无法发送消息或从任何 AI 模型获得响应,这实际上使得 ChatOllama 的核心功能完全不可用。 15 | 16 | 这个问题特别令人沮丧,因为在升级过程中没有明显的错误消息或警告。应用程序正常启动,但每次聊天尝试都会静默失败。 17 | 18 | ## 🔍 根本原因调查 19 | 20 | 通过深入研究日志和跟踪代码,我们发现 LangChain 升级在聊天模型构造函数中引入了破坏性的 API 更改。使这个问题特别棘手的是,这些不是编译时错误——旧的参数名称被简单地忽略了,导致模型使用未定义的配置进行初始化。 21 | 22 | 在 LangChain 升级过程中,ChatOpenAI 模型构造函数中的参数名称发生了一些变化。虽然仅仅被标记为 `deprecated`,但参数在下游的使用中已经发生了变化。deprecated 参数包括: 23 | 24 | - `modelName` 25 | - `openAIApiKey` 26 | 27 | 这些破坏性更改影响了多个模型提供商,每个都需要特定的参数名称更新: 28 | 29 | ### 修复前(有效的): 30 | ```typescript 31 | new ChatOpenAI({ 32 | configuration: { baseURL }, 33 | openAIApiKey: params.key, // ❌ 已弃用 34 | modelName: modelName, // ❌ 已弃用 35 | }) 36 | 37 | new ChatAnthropic({ 38 | anthropicApiUrl: endpoint, 39 | anthropicApiKey: params.key, // ❌ 已弃用 40 | modelName: modelName, // ❌ 已弃用 41 | }) 42 | ``` 43 | 44 | ### 修复后(已修复): 45 | ```typescript 46 | new ChatOpenAI({ 47 | configuration: { baseURL }, 48 | apiKey: params.key, // ✅ 新 API 49 | model: modelName, // ✅ 新 API 50 | }) 51 | 52 | new ChatAnthropic({ 53 | anthropicApiUrl: endpoint, 54 | apiKey: params.key, // ✅ 新 API 55 | model: modelName, // ✅ 新 API 56 | }) 57 | ``` 58 | 59 | ## 🔧 修复实施 60 | 61 | 一旦我们确定了根本原因,修复就相对简单,但需要仔细注意细节。我们需要在所有受影响的模型提供商中更新参数名称,同时确保向后兼容性并添加更好的错误处理。 62 | 63 | 以下模型需要更新: 64 | - **OpenAI (ChatOpenAI)** - 最常用的提供商 65 | - **Anthropic (ChatAnthropic)** - AI 代理功能的关键组件 66 | - **Gemini (ChatGoogleGenerativeAI)** - 用于多模态功能 67 | - **Groq (ChatGroq)** - 高性能推理选项 68 | 69 | 实施的关键更改包括: 70 | 1. 将 `openAIApiKey` 和 `anthropicApiKey` 标准化为统一的 `apiKey` 参数 71 | 2. 在所有提供商中将 `modelName` 更新为更简洁的 `model` 参数 72 | 3. 增强错误处理,在配置缺失时提供清晰的反馈 73 | 74 | 除了修复参数名称,我们还借此机会添加了强大的回退逻辑。现在,当外部 API 提供商由于缺少密钥或配置问题而失败时,系统会优雅地回退到 Ollama,确保用户即使在首选提供商配置错误的情况下也能继续聊天。 75 | 76 | ## 📚 经验教训 77 | 78 | 这次事件强化了在生产应用程序中管理依赖项的几个重要原则: 79 | 80 | **主要升级后彻底测试:** 即使看似微小的版本更新也可能引入不明显的破坏性更改。对所有功能进行全面测试是必要的,不仅仅是您期望受到影响的区域。 81 | 82 | **拥抱 API 标准化:** 虽然最初会造成干扰,但 LangChain 在提供商之间标准化参数名称的举措是一个积极的长期变化,将减少混乱并使代码库更易于维护。 83 | 84 | **始终实施优雅降级:** 拥有强大的回退机制不仅仅是良好的实践——当外部依赖项失败或意外更改时,这对于维护用户信任至关重要。 85 | 86 | ## 🚀 影响和解决方案 87 | 88 | 修复在识别后立即部署,为用户实现了零停机时间。更新的实现在利用新的标准化 API 的同时保持完全的向后兼容性。作为额外的好处,增强的错误处理和回退机制实际上提高了聊天系统的整体可靠性。 89 | 90 | 这次事件提醒我们,在 AI 和机器学习库快速发展的世界中,保持依赖项的最新状态需要持续的警惕和彻底的测试实践。 91 | 92 | --- 93 | 94 | *这是主要升级中"静默"破坏性更改的典型案例——这种情况使经验丰富的开发人员总是会仔细阅读变更日志两遍。一旦确定,修复就很简单,但这次经历突出了为什么我们永远不会把看似常规的更新视为理所当然。* 95 | -------------------------------------------------------------------------------- /content/zh/20250819-feature-flags-in-docker-and-nuxt_zh.md: -------------------------------------------------------------------------------- 1 | # 在 Docker 中启用功能开关:为什么 MCP_ENABLED 没生效?如何修复? 
2 | 3 | *2025年8月19日* 4 | 5 | 大家好!👋 6 | 7 | 延续昨天的界面与聊天可靠性优化,今天聊一个在部署中踩到的坑:在本地开发环境里设置 `MCP_ENABLED=true` 一切正常,但在 Docker 容器中却不生效。下面是原因与解决方案。 8 | 9 | ## 🐛 现象 10 | 11 | - **本地开发**:`.env` 中设置 `MCP_ENABLED=true`,设置页能看到「MCP」模块。 12 | - **Docker**:`docker-compose.yaml` 中设置 `MCP_ENABLED=true`,设置页没有出现「MCP」模块。 13 | 14 | ## 🔎 根因:Nuxt runtimeConfig 的构建时 vs 运行时 15 | 16 | Nuxt 3 的 `runtimeConfig` 会在「构建阶段」读取 `process.env`。想在「运行时」覆盖配置,需要使用带有 `NUXT_` 前缀、且能映射到配置键名的环境变量。 17 | 18 | 我们在 `nuxt.config.ts` 中是这样写的: 19 | 20 | ```ts 21 | runtimeConfig: { 22 | knowledgeBaseEnabled: process.env.KNOWLEDGE_BASE_ENABLED === 'true', 23 | realtimeChatEnabled: process.env.REALTIME_CHAT_ENABLED === 'true', 24 | modelsManagementEnabled: process.env.MODELS_MANAGEMENT_ENABLED === 'true', 25 | mcpEnabled: process.env.MCP_ENABLED === 'true', 26 | public: { /* ... */ } 27 | } 28 | ``` 29 | 30 | - 在本地开发中,`.env` 会在构建前加载,因此 `process.env.MCP_ENABLED` 在构建时就为 true → `mcpEnabled` 被“烘焙”为 true。 31 | - 在 Docker 中,我们运行的是预构建镜像。仅在运行时设置 `MCP_ENABLED=true` 无法改变 `runtimeConfig.mcpEnabled`。必须使用 `NUXT_MCP_ENABLED=true` 才能在运行时覆盖。 32 | 33 | 这也解释了为什么 `/api/features` 的日志里 `process.env.MCP_ENABLED` 显示为 true,但 `useRuntimeConfig().mcpEnabled` 仍然是 false。 34 | 35 | ## ✅ 解决方案 36 | 37 | ### 方案 A(推荐):在 Docker 中使用 `NUXT_` 前缀变量 38 | 39 | 修改 `docker-compose.yaml`: 40 | 41 | ```yaml 42 | services: 43 | chatollama: 44 | environment: 45 | - NUXT_MCP_ENABLED=true 46 | - NUXT_KNOWLEDGE_BASE_ENABLED=true 47 | - NUXT_REALTIME_CHAT_ENABLED=true 48 | - NUXT_MODELS_MANAGEMENT_ENABLED=true 49 | ``` 50 | 51 | 这样即可直接在运行时映射到 `runtimeConfig`,无需改代码。 52 | 53 | ### 方案 B:同时兼容旧变量与 `NUXT_` 54 | 55 | 如果希望继续兼容 `MCP_ENABLED`,可以在 `nuxt.config.ts` 中优先读取运行时的 `NUXT_` 变量,并回退到旧变量: 56 | 57 | ```ts 58 | runtimeConfig: { 59 | knowledgeBaseEnabled: process.env.NUXT_KNOWLEDGE_BASE_ENABLED === 'true' || process.env.KNOWLEDGE_BASE_ENABLED === 'true', 60 | realtimeChatEnabled: process.env.NUXT_REALTIME_CHAT_ENABLED === 'true' || process.env.REALTIME_CHAT_ENABLED === 'true', 61 | modelsManagementEnabled: process.env.NUXT_MODELS_MANAGEMENT_ENABLED === 'true' || process.env.MODELS_MANAGEMENT_ENABLED === 'true', 62 | mcpEnabled: process.env.NUXT_MCP_ENABLED === 'true' || process.env.MCP_ENABLED === 'true', 63 | public: { /* ... */ } 64 | } 65 | ``` 66 | 67 | ## 🔧 验证步骤 68 | 69 | 1. 使用更新后的 Compose 环境变量重新部署。 70 | 2. 请求 `/api/features` 并查看容器日志(会打印环境变量与 `runtimeConfig` 值)。 71 | 3. 打开设置页:当 `mcpEnabled` 为 true 时,应显示「MCP」模块。 72 | 73 | ## 🤔 为什么本地可用、Docker 不行? 
74 | 75 | - **本地**:`.env` 在构建前加载 → `runtimeConfig` 在构建时就被设置为 true。 76 | - **Docker**:使用预构建镜像 → 运行时覆盖必须使用 `NUXT_` 前缀变量。 77 | 78 | ## 📝 小的开发体验改进(可选) 79 | 80 | - 在 `composables/useFeatures.ts` 的 `FeatureFlags` 接口中补充 `modelsManagementEnabled`,以保持类型完整。 81 | 82 | ## 🎯 总结 83 | 84 | 使用 Nuxt 3 做容器化部署时,牢记:构建时环境变量决定默认值;运行时覆盖需要使用 `NUXT_` 前缀。配置正确后,设置页的功能模块就会在所有环境中一致显示。 85 | -------------------------------------------------------------------------------- /content/zh/20250818-ui-improvements-and-chat-fixes_zh.md: -------------------------------------------------------------------------------- 1 | # 界面优化与聊天可靠性修复 2 | 3 | *2025年8月18日* 4 | 5 | 大家好!👋 6 | 7 | 过去几天我一直在改进聊天界面的一些重要功能。下面是新功能和修复的问题。 8 | 9 | ## 🐛 重要Bug修复 10 | 11 | ### 创建新聊天按钮问题 12 | 最令人沮丧的bug之一是"创建新聊天"按钮无响应。用户点击后没有反应,然后多次点击,突然会创建多个新聊天。 13 | 14 | **问题原因:** 15 | - `scrollToBottom` 函数在DOM元素准备好之前就尝试访问 `messageListEl.value.scrollHeight` 16 | - 没有加载状态保护,快速点击会触发多个API调用 17 | - 聊天创建流程中的竞态条件 18 | 19 | **修复方案:** 20 | ```javascript 21 | // 在 scrollToBottom 中添加空值检查 22 | const scrollToBottom = (_behavior: ScrollBehavior) => { 23 | behavior.value = _behavior 24 | if (messageListEl.value) { 25 | y.value = messageListEl.value.scrollHeight 26 | } 27 | } 28 | 29 | // 在 ChatSessionList 中添加加载状态 30 | const isCreatingChat = ref(false) 31 | 32 | async function onNewChat() { 33 | if (isCreatingChat.value) return 34 | 35 | isCreatingChat.value = true 36 | try { 37 | const data = await createChatSession() 38 | sessionList.value.unshift(data) 39 | await router.push(`/chat/${data.id}`) 40 | } finally { 41 | isCreatingChat.value = false 42 | } 43 | } 44 | ``` 45 | 46 | 这是一个典型的例子,说明小的时序问题如何创造出非常恼人的用户体验问题! 47 | 48 | ## ✨ 新功能:增强预览面板 49 | 50 | 代码工件预览系统得到了重大升级!以前用户只能在基本的侧边面板中查看代码工件。现在我们有了: 51 | 52 | ### 分屏视图模式 53 | - 聊天占用剩余空间 54 | - 预览面板固定500px宽度 55 | - 两者同时可见,便于对照查看 56 | 57 | ### 全屏模式 58 | - 预览覆盖整个视窗 59 | - 完全隐藏标题栏以获得最大查看区域 60 | - 带半透明背景的浮动关闭按钮 61 | - 非常适合查看复杂的HTML演示或详细图表 62 | 63 | ### 智能状态管理 64 | 这比听起来要复杂。关键洞察是将"显示/隐藏预览"状态与"正常/全屏"状态分离: 65 | 66 | ```javascript 67 | // 两个独立状态而不是一个混乱的状态 68 | const showArtifacts = ref(false) 69 | const isFullscreen = ref(false) 70 | 71 | // 智能关闭行为 72 | const closeArtifacts = () => { 73 | showArtifacts.value = false 74 | isFullscreen.value = false // 关闭时重置全屏状态 75 | } 76 | 77 | // 全屏关闭只退出全屏,不关闭预览 78 | const toggleFullscreen = () => { 79 | isFullscreen.value = !isFullscreen.value 80 | } 81 | ``` 82 | 83 | 现在的用户体验流程是: 84 | 1. 点击预览 → 在分屏视图中打开 85 | 2. 点击全屏 → 扩展到全屏 86 | 3. 在全屏中点击X → 返回分屏视图 87 | 4. 在分屏视图中点击X → 完全关闭预览 88 | 89 | ## 🎨 动画优化 90 | 91 | 将预览图标动画从滑入效果改为淡入效果。有时最小的改变会对界面的精致感产生最大的影响。 92 | 93 | ```scss 94 | // 之前:从右侧滑入 95 | .artifact-btn { 96 | opacity: 0; 97 | transform: translateX(8px); 98 | } 99 | 100 | // 之后:简单淡入 101 | .artifact-btn { 102 | opacity: 0; 103 | transition: all 0.3s cubic-bezier(0.4, 0, 0.2, 1); 104 | } 105 | ``` 106 | 107 | ## 📚 学到的经验 108 | 109 | ### 1. DOM时序问题无处不在 110 | `scrollToBottom` bug提醒我们Vue的响应式很快,但DOM仍然需要时间更新。在访问元素属性之前,始终检查元素是否存在。 111 | 112 | ### 2. 状态管理的复杂性 113 | 最初,我试图让预览系统变得"智能",有可调整大小的分割和复杂状态。但简单往往更好——两种清晰的模式(分屏/全屏)和明显的过渡对用户来说效果更好。 114 | 115 | ### 3. 用户测试揭示边缘情况 116 | 聊天创建bug只在特定时序条件下发生。真实用户行为(当某些东西看起来坏了时快速点击)经常揭示在正常开发测试中不会出现的问题。 117 | 118 | ## 💭 给开发者同行的思考 119 | 120 | 这些UI可靠性修复可能不够华丽,但对用户体验有巨大影响。一个95%时间有效的按钮对用户来说就是坏的。花时间处理边缘情况和竞态条件是区分好界面和优秀界面的关键。 121 | 122 | 另外,在构建预览/模态系统时,始终像考虑进入流程一样考虑退出流程。用户需要理解如何回到他们来自的地方! 
123 | 124 | --- 125 | 126 | *你希望下次看到哪些功能得到改进?在issues中留下你的想法!* 127 | 128 | *- 你的开发团队* -------------------------------------------------------------------------------- /content/20250916-instant-model-mentions.md: -------------------------------------------------------------------------------- 1 | # Instantly Talk to Any Model with @ Mentions 2 | 3 | **Date:** September 16, 2025 4 | **Feature:** Tag a model inline to override the next reply without touching session settings 5 | **Time to Ship:** ~1 day 6 | 7 | ## 🎯 Why We Built It 8 | 9 | Our long-form chat sessions have always been anchored to a single "default" model. That kept conversations coherent, but it also meant lots of friction when you wanted to toss a quick question to a different model: 10 | 11 | 1. Open session settings 12 | 2. Swap the default model 13 | 3. Ask the question 14 | 4. Switch the model back so the rest of the thread stays consistent 15 | 16 | That dance got even worse when comparing outputs from multiple providers or when you only needed one specialty answer (e.g. “let me sanity-check this with Claude real quick”). We needed something as fast as tagging a teammate in Slack. 17 | 18 | ## 💡 The Solution in a Nutshell 19 | 20 | You can now add `@model-name` to any outgoing message. Each mentioned model temporarily "hijacks" the request, so the response comes from that model while the session’s default choice remains unchanged. 21 | 22 | - Mention a single model (`@gpt-4o-mini`) to reroute just this message. 23 | - Mention multiple models (`@openrouter/claude-3.5-sonnet @llama3`) to fan out the question. 24 | - Don’t mention anything and the chat continues using the default model like before. 25 | 26 | The UI keeps the override discoverable: as soon as you type `@`, the input shows model families, live search, and keyboard navigation so you never have to remember exact IDs. 27 | 28 | ## 🔍 What Changed Under the Hood 29 | 30 | ### 1. Parsing Mentions Without Polluting Prompts 31 | `ChatInputBox.vue` now parses model mentions every time the user types. We persist the selected models in `hijackedModels` and simultaneously strip the `@model` tokens into a `sanitizedContent` payload. That sanitized payload is what the backend actually sees, so no model receives literal `@claude` strings in its prompt. 32 | 33 | ### 2. Respecting Overrides in Delivery 34 | `Chat.vue` checks for `hijackedModels` before sending. If we find any, we bypass the session defaults for that single send, while the session metadata (and sidebar defaults) stay untouched. The outgoing transcript reuses `sanitizedContent` so historical messages read cleanly without the mentions. 35 | 36 | ### 3. Making Mentions First-Class Citizens in the UI 37 | We refreshed `ModelMentionText.vue` to show consistent badges for mentions, even when the provider uses namespaced values like `openrouter/claude-3.5-sonnet`. The existing auto-title generator also consumes the sanitized message to avoid naming chats "@gpt-4o mini thoughts". 38 | 39 | ## ✅ Results 40 | 41 | - Instant context switches without breaking the session model. 42 | - Keyboard-only flow for power users comparing providers. 43 | - Clean transcripts and prompts even when users pepper messages with mentions. 44 | 45 | Give it a try: type `@` in any chat input, pick a model, and enjoy frictionless comparisons. 
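For readers who want to poke at the idea, here is a minimal sketch of the parsing step from section 1. `hijackedModels` and `sanitizedContent` are the names used above; the function shape and the regex are assumptions, not the actual `ChatInputBox.vue` internals:

```ts
// Minimal sketch (assumed API): collect mentioned models and strip the tokens
// in one pass so the backend never sees literal "@claude" strings.
export interface MentionParseResult {
  hijackedModels: string[]   // models that should handle this one message
  sanitizedContent: string   // prompt text with the @tokens removed
}

export function parseModelMentions(input: string, knownModels: string[]): MentionParseResult {
  const hijackedModels: string[] = []
  const sanitizedContent = input
    .replace(/@([\w.\-]+(?:\/[\w.\-]+)?)/g, (match: string, id: string) => {
      if (!knownModels.includes(id)) return match // leave unknown @text alone
      if (!hijackedModels.includes(id)) hijackedModels.push(id)
      return '' // strip the token from the outgoing prompt
    })
    .replace(/\s{2,}/g, ' ')
    .trim()
  return { hijackedModels, sanitizedContent }
}
```

Doing the strip and the collection in a single pass keeps the two outputs consistent, which is the invariant the post relies on: the transcript and the prompt both come from `sanitizedContent`.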
46 | -------------------------------------------------------------------------------- /src/content/blog-zh/2025-08-19-feature-flags-in-docker-and-nuxt_zh.md: -------------------------------------------------------------------------------- 1 | --- 2 | title: "在 Docker 中启用功能开关:为什么 MCP_ENABLED 没生效?如何修复?" 3 | date: "2025-08-19" 4 | description: "Blog post about 在 Docker 中启用功能开关:为什么 MCP_ENABLED 没生效?如何修复?" 5 | --- 6 | 7 | 8 | *2025年8月19日* 9 | 10 | 大家好!👋 11 | 12 | 延续昨天的界面与聊天可靠性优化,今天聊一个在部署中踩到的坑:在本地开发环境里设置 `MCP_ENABLED=true` 一切正常,但在 Docker 容器中却不生效。下面是原因与解决方案。 13 | 14 | ## 🐛 现象 15 | 16 | - **本地开发**:`.env` 中设置 `MCP_ENABLED=true`,设置页能看到「MCP」模块。 17 | - **Docker**:`docker-compose.yaml` 中设置 `MCP_ENABLED=true`,设置页没有出现「MCP」模块。 18 | 19 | ## 🔎 根因:Nuxt runtimeConfig 的构建时 vs 运行时 20 | 21 | Nuxt 3 的 `runtimeConfig` 会在「构建阶段」读取 `process.env`。想在「运行时」覆盖配置,需要使用带有 `NUXT_` 前缀、且能映射到配置键名的环境变量。 22 | 23 | 我们在 `nuxt.config.ts` 中是这样写的: 24 | 25 | ```ts 26 | runtimeConfig: { 27 | knowledgeBaseEnabled: process.env.KNOWLEDGE_BASE_ENABLED === 'true', 28 | realtimeChatEnabled: process.env.REALTIME_CHAT_ENABLED === 'true', 29 | modelsManagementEnabled: process.env.MODELS_MANAGEMENT_ENABLED === 'true', 30 | mcpEnabled: process.env.MCP_ENABLED === 'true', 31 | public: { /* ... */ } 32 | } 33 | ``` 34 | 35 | - 在本地开发中,`.env` 会在构建前加载,因此 `process.env.MCP_ENABLED` 在构建时就为 true → `mcpEnabled` 被“烘焙”为 true。 36 | - 在 Docker 中,我们运行的是预构建镜像。仅在运行时设置 `MCP_ENABLED=true` 无法改变 `runtimeConfig.mcpEnabled`。必须使用 `NUXT_MCP_ENABLED=true` 才能在运行时覆盖。 37 | 38 | 这也解释了为什么 `/api/features` 的日志里 `process.env.MCP_ENABLED` 显示为 true,但 `useRuntimeConfig().mcpEnabled` 仍然是 false。 39 | 40 | ## ✅ 解决方案 41 | 42 | ### 方案 A(推荐):在 Docker 中使用 `NUXT_` 前缀变量 43 | 44 | 修改 `docker-compose.yaml`: 45 | 46 | ```yaml 47 | services: 48 | chatollama: 49 | environment: 50 | - NUXT_MCP_ENABLED=true 51 | - NUXT_KNOWLEDGE_BASE_ENABLED=true 52 | - NUXT_REALTIME_CHAT_ENABLED=true 53 | - NUXT_MODELS_MANAGEMENT_ENABLED=true 54 | ``` 55 | 56 | 这样即可直接在运行时映射到 `runtimeConfig`,无需改代码。 57 | 58 | ### 方案 B:同时兼容旧变量与 `NUXT_` 59 | 60 | 如果希望继续兼容 `MCP_ENABLED`,可以在 `nuxt.config.ts` 中优先读取运行时的 `NUXT_` 变量,并回退到旧变量: 61 | 62 | ```ts 63 | runtimeConfig: { 64 | knowledgeBaseEnabled: process.env.NUXT_KNOWLEDGE_BASE_ENABLED === 'true' || process.env.KNOWLEDGE_BASE_ENABLED === 'true', 65 | realtimeChatEnabled: process.env.NUXT_REALTIME_CHAT_ENABLED === 'true' || process.env.REALTIME_CHAT_ENABLED === 'true', 66 | modelsManagementEnabled: process.env.NUXT_MODELS_MANAGEMENT_ENABLED === 'true' || process.env.MODELS_MANAGEMENT_ENABLED === 'true', 67 | mcpEnabled: process.env.NUXT_MCP_ENABLED === 'true' || process.env.MCP_ENABLED === 'true', 68 | public: { /* ... */ } 69 | } 70 | ``` 71 | 72 | ## 🔧 验证步骤 73 | 74 | 1. 使用更新后的 Compose 环境变量重新部署。 75 | 2. 请求 `/api/features` 并查看容器日志(会打印环境变量与 `runtimeConfig` 值)。 76 | 3. 打开设置页:当 `mcpEnabled` 为 true 时,应显示「MCP」模块。 77 | 78 | ## 🤔 为什么本地可用、Docker 不行? 
79 | 80 | - **本地**:`.env` 在构建前加载 → `runtimeConfig` 在构建时就被设置为 true。 81 | - **Docker**:使用预构建镜像 → 运行时覆盖必须使用 `NUXT_` 前缀变量。 82 | 83 | ## 📝 小的开发体验改进(可选) 84 | 85 | - 在 `composables/useFeatures.ts` 的 `FeatureFlags` 接口中补充 `modelsManagementEnabled`,以保持类型完整。 86 | 87 | ## 🎯 总结 88 | 89 | 使用 Nuxt 3 做容器化部署时,牢记:构建时环境变量决定默认值;运行时覆盖需要使用 `NUXT_` 前缀。配置正确后,设置页的功能模块就会在所有环境中一致显示。 90 | -------------------------------------------------------------------------------- /src/content/blog-zh/2025-08-18-ui-improvements-and-chat-fixes_zh.md: -------------------------------------------------------------------------------- 1 | --- 2 | title: "界面优化与聊天可靠性修复" 3 | date: "2025-08-18" 4 | description: "ChatOllama界面优化和聊天功能可靠性修复" 5 | --- 6 | 7 | 8 | *2025年8月18日* 9 | 10 | 大家好!👋 11 | 12 | 过去几天我一直在改进聊天界面的一些重要功能。下面是新功能和修复的问题。 13 | 14 | ## 🐛 重要Bug修复 15 | 16 | ### 创建新聊天按钮问题 17 | 最令人沮丧的bug之一是"创建新聊天"按钮无响应。用户点击后没有反应,然后多次点击,突然会创建多个新聊天。 18 | 19 | **问题原因:** 20 | - `scrollToBottom` 函数在DOM元素准备好之前就尝试访问 `messageListEl.value.scrollHeight` 21 | - 没有加载状态保护,快速点击会触发多个API调用 22 | - 聊天创建流程中的竞态条件 23 | 24 | **修复方案:** 25 | ```javascript 26 | // 在 scrollToBottom 中添加空值检查 27 | const scrollToBottom = (_behavior: ScrollBehavior) => { 28 | behavior.value = _behavior 29 | if (messageListEl.value) { 30 | y.value = messageListEl.value.scrollHeight 31 | } 32 | } 33 | 34 | // 在 ChatSessionList 中添加加载状态 35 | const isCreatingChat = ref(false) 36 | 37 | async function onNewChat() { 38 | if (isCreatingChat.value) return 39 | 40 | isCreatingChat.value = true 41 | try { 42 | const data = await createChatSession() 43 | sessionList.value.unshift(data) 44 | await router.push(`/chat/${data.id}`) 45 | } finally { 46 | isCreatingChat.value = false 47 | } 48 | } 49 | ``` 50 | 51 | 这是一个典型的例子,说明小的时序问题如何创造出非常恼人的用户体验问题! 52 | 53 | ## ✨ 新功能:增强预览面板 54 | 55 | 代码工件预览系统得到了重大升级!以前用户只能在基本的侧边面板中查看代码工件。现在我们有了: 56 | 57 | ### 分屏视图模式 58 | - 聊天占用剩余空间 59 | - 预览面板固定500px宽度 60 | - 两者同时可见,便于对照查看 61 | 62 | ### 全屏模式 63 | - 预览覆盖整个视窗 64 | - 完全隐藏标题栏以获得最大查看区域 65 | - 带半透明背景的浮动关闭按钮 66 | - 非常适合查看复杂的HTML演示或详细图表 67 | 68 | ### 智能状态管理 69 | 这比听起来要复杂。关键洞察是将"显示/隐藏预览"状态与"正常/全屏"状态分离: 70 | 71 | ```javascript 72 | // 两个独立状态而不是一个混乱的状态 73 | const showArtifacts = ref(false) 74 | const isFullscreen = ref(false) 75 | 76 | // 智能关闭行为 77 | const closeArtifacts = () => { 78 | showArtifacts.value = false 79 | isFullscreen.value = false // 关闭时重置全屏状态 80 | } 81 | 82 | // 全屏关闭只退出全屏,不关闭预览 83 | const toggleFullscreen = () => { 84 | isFullscreen.value = !isFullscreen.value 85 | } 86 | ``` 87 | 88 | 现在的用户体验流程是: 89 | 1. 点击预览 → 在分屏视图中打开 90 | 2. 点击全屏 → 扩展到全屏 91 | 3. 在全屏中点击X → 返回分屏视图 92 | 4. 在分屏视图中点击X → 完全关闭预览 93 | 94 | ## 🎨 动画优化 95 | 96 | 将预览图标动画从滑入效果改为淡入效果。有时最小的改变会对界面的精致感产生最大的影响。 97 | 98 | ```scss 99 | // 之前:从右侧滑入 100 | .artifact-btn { 101 | opacity: 0; 102 | transform: translateX(8px); 103 | } 104 | 105 | // 之后:简单淡入 106 | .artifact-btn { 107 | opacity: 0; 108 | transition: all 0.3s cubic-bezier(0.4, 0, 0.2, 1); 109 | } 110 | ``` 111 | 112 | ## 📚 学到的经验 113 | 114 | ### 1. DOM时序问题无处不在 115 | `scrollToBottom` bug提醒我们Vue的响应式很快,但DOM仍然需要时间更新。在访问元素属性之前,始终检查元素是否存在。 116 | 117 | ### 2. 状态管理的复杂性 118 | 最初,我试图让预览系统变得"智能",有可调整大小的分割和复杂状态。但简单往往更好——两种清晰的模式(分屏/全屏)和明显的过渡对用户来说效果更好。 119 | 120 | ### 3. 用户测试揭示边缘情况 121 | 聊天创建bug只在特定时序条件下发生。真实用户行为(当某些东西看起来坏了时快速点击)经常揭示在正常开发测试中不会出现的问题。 122 | 123 | ## 💭 给开发者同行的思考 124 | 125 | 这些UI可靠性修复可能不够华丽,但对用户体验有巨大影响。一个95%时间有效的按钮对用户来说就是坏的。花时间处理边缘情况和竞态条件是区分好界面和优秀界面的关键。 126 | 127 | 另外,在构建预览/模态系统时,始终像考虑进入流程一样考虑退出流程。用户需要理解如何回到他们来自的地方! 
128 | 129 | --- 130 | 131 | *你希望下次看到哪些功能得到改进?在issues中留下你的想法!* 132 | 133 | *- 你的开发团队* -------------------------------------------------------------------------------- /src/content/blog/2025-09-16-instant-model-mentions.md: -------------------------------------------------------------------------------- 1 | --- 2 | title: "Instantly Talk to Any Model with @ Mentions" 3 | date: "2025-09-16" 4 | feature: "Tag a model inline to override the next reply without touching session settings" 5 | timeToShip: "~1 day" 6 | description: "Instantly switch between AI models in conversations using @ mentions without changing session settings" 7 | --- 8 | 9 | ## 🎯 Why We Built It 10 | 11 | Our long-form chat sessions have always been anchored to a single "default" model. That kept conversations coherent, but it also meant lots of friction when you wanted to toss a quick question to a different model: 12 | 13 | 1. Open session settings 14 | 2. Swap the default model 15 | 3. Ask the question 16 | 4. Switch the model back so the rest of the thread stays consistent 17 | 18 | That dance got even worse when comparing outputs from multiple providers or when you only needed one specialty answer (e.g. “let me sanity-check this with Claude real quick”). We needed something as fast as tagging a teammate in Slack. 19 | 20 | ## 💡 The Solution in a Nutshell 21 | 22 | You can now add `@model-name` to any outgoing message. Each mentioned model temporarily "hijacks" the request, so the response comes from that model while the session’s default choice remains unchanged. 23 | 24 | - Mention a single model (`@gpt-4o-mini`) to reroute just this message. 25 | - Mention multiple models (`@openrouter/claude-3.5-sonnet @llama3`) to fan out the question. 26 | - Don’t mention anything and the chat continues using the default model like before. 27 | 28 | The UI keeps the override discoverable: as soon as you type `@`, the input shows model families, live search, and keyboard navigation so you never have to remember exact IDs. 29 | 30 | ## 🔍 What Changed Under the Hood 31 | 32 | ### 1. Parsing Mentions Without Polluting Prompts 33 | `ChatInputBox.vue` now parses model mentions every time the user types. We persist the selected models in `hijackedModels` and simultaneously strip the `@model` tokens into a `sanitizedContent` payload. That sanitized payload is what the backend actually sees, so no model receives literal `@claude` strings in its prompt. 34 | 35 | ### 2. Respecting Overrides in Delivery 36 | `Chat.vue` checks for `hijackedModels` before sending. If we find any, we bypass the session defaults for that single send, while the session metadata (and sidebar defaults) stay untouched. The outgoing transcript reuses `sanitizedContent` so historical messages read cleanly without the mentions. 37 | 38 | ### 3. Making Mentions First-Class Citizens in the UI 39 | We refreshed `ModelMentionText.vue` to show consistent badges for mentions, even when the provider uses namespaced values like `openrouter/claude-3.5-sonnet`. The existing auto-title generator also consumes the sanitized message to avoid naming chats "@gpt-4o mini thoughts". 40 | 41 | ## ✅ Results 42 | 43 | - Instant context switches without breaking the session model. 44 | - Keyboard-only flow for power users comparing providers. 45 | - Clean transcripts and prompts even when users pepper messages with mentions. 46 | 47 | Give it a try: type `@` in any chat input, pick a model, and enjoy frictionless comparisons. 
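To complement the delivery section above, here is a rough sketch of the per-message override. `hijackedModels` and `sanitizedContent` come from the post; `sendMessage` and the injected `postChatCompletion` callback are assumed stand-ins for the real `Chat.vue` logic:

```ts
// Sketch only: mentioned models hijack this send; session defaults stay untouched.
interface OutgoingDraft {
  hijackedModels: string[]
  sanitizedContent: string
}

async function sendMessage(
  sessionDefaultModel: string,
  draft: OutgoingDraft,
  postChatCompletion: (req: { model: string; content: string }) => Promise<void>
): Promise<void> {
  // No mention -> session default; one or more mentions -> fan out in parallel.
  const targets = draft.hijackedModels.length > 0
    ? draft.hijackedModels
    : [sessionDefaultModel]

  await Promise.all(
    targets.map(model => postChatCompletion({ model, content: draft.sanitizedContent }))
  )
}
```

Note that nothing here writes back to the session: the override lives and dies with the single send, which is what keeps the sidebar defaults safe.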
48 | -------------------------------------------------------------------------------- /src/content/blog/2025-09-18-smart-quick-chat-dialog-positioning.md: -------------------------------------------------------------------------------- 1 | --- 2 | title: "Smart Quick Chat Dialog Positioning: A Better User Experience" 3 | date: "2025-09-18" 4 | description: "Significant improvement to ChatOllama's Quick Chat feature with intelligent dialog positioning and enhanced viewport awareness" 5 | --- 6 | 7 | We've just rolled out a significant improvement to ChatOllama's Quick Chat feature that addresses a common frustration users experience when selecting text near screen edges. The Quick Chat dialog now intelligently positions itself to stay within the viewport while providing more space for AI responses. 8 | 9 | ## The Problem 10 | 11 | Previously, when users selected text at the bottom right corner of their screen or near viewport edges, the Quick Chat dialog would appear partially outside the visible area or get cut off entirely. This made it difficult to read AI responses and interact with the dialog effectively. Additionally, the dialog was quite narrow (320px), limiting the amount of text that could be displayed comfortably. 12 | 13 | ## The Solution 14 | 15 | Our new smart positioning algorithm addresses these issues with several key improvements: 16 | 17 | ### 1. Intelligent Positioning Logic 18 | 19 | The dialog now follows a sophisticated positioning strategy: 20 | 21 | - **Horizontal positioning**: First tries to position to the right of the selected text, then to the left if there's insufficient space, and finally centers horizontally if neither side works 22 | - **Vertical positioning**: Attempts to position below the selection first, then above if needed, and centers vertically as a last resort 23 | - **Viewport awareness**: Always ensures the dialog stays within screen bounds with proper padding 24 | 25 | ### 2. Larger Dialog Size 26 | 27 | - **Width increased**: From 320px to 480px for better readability 28 | - **Dynamic height**: Automatically adjusts based on response content length 29 | - **Response area**: Doubled from 160px to 320px maximum height 30 | - **Better typography**: Response text size increased from extra-small to small for improved readability 31 | 32 | ### 3. Dynamic Content Adaptation 33 | 34 | The dialog now calculates its optimal size based on the AI response length, ensuring longer responses have adequate space while keeping shorter ones compact. 35 | 36 | ## Technical Implementation 37 | 38 | The positioning algorithm uses several key constants: 39 | 40 | ```typescript 41 | const DIALOG_WIDTH = 480 // Increased from 320px 42 | const DIALOG_MIN_HEIGHT = 280 43 | const DIALOG_MAX_HEIGHT = 600 // Maximum height when response is long 44 | const VIEWPORT_PADDING = 20 45 | const OFFSET_FROM_SELECTION = 10 46 | ``` 47 | 48 | The smart positioning logic ensures the dialog: 49 | - Maintains a 20px padding from viewport edges 50 | - Positions 10px away from the selected text 51 | - Dynamically adjusts height based on response content 52 | - Never gets cut off or appears outside the visible area 53 | 54 | ## Impact on User Experience 55 | 56 | These improvements deliver several tangible benefits: 57 | 58 | 1. **Better accessibility**: Users can now select text anywhere on the screen without worrying about dialog positioning 59 | 2. **Improved readability**: Larger dialog and text size make AI responses easier to read 60 | 3. 
**Smarter behavior**: The dialog adapts to different screen sizes and selection positions automatically -------------------------------------------------------------------------------- /content/20250819-feature-flags-in-docker-and-nuxt.md: -------------------------------------------------------------------------------- 1 | # Feature Flags in Docker: Why MCP_ENABLED Didn’t Work and How We Fixed It 2 | 3 | *August 19, 2025* 4 | 5 | Hey everyone! 👋 6 | 7 | Following yesterday’s UI improvements post, I dug into a deployment gotcha that bit us when running in Docker: feature flags like MCP worked locally but not inside containers. Here’s what happened and how to fix it. 8 | 9 | ## 🐛 The Symptom 10 | 11 | - **Local dev**: Setting `MCP_ENABLED=true` in `.env` made the Settings → MCP module appear. 12 | - **Docker**: Setting `MCP_ENABLED=true` in `docker-compose.yaml` did nothing — the MCP section didn’t show up. 13 | 14 | ## 🔎 Root Cause: Nuxt runtimeConfig (build-time vs runtime) 15 | 16 | Nuxt 3 reads `runtimeConfig` values at build time via `process.env`. At runtime, overriding them requires environment variables that map to config keys with the `NUXT_` prefix. 17 | 18 | Our `nuxt.config.ts` had: 19 | 20 | ```ts 21 | runtimeConfig: { 22 | knowledgeBaseEnabled: process.env.KNOWLEDGE_BASE_ENABLED === 'true', 23 | realtimeChatEnabled: process.env.REALTIME_CHAT_ENABLED === 'true', 24 | modelsManagementEnabled: process.env.MODELS_MANAGEMENT_ENABLED === 'true', 25 | mcpEnabled: process.env.MCP_ENABLED === 'true', 26 | public: { /* ... */ } 27 | } 28 | ``` 29 | 30 | - In dev, `.env` is loaded before build, so `process.env.MCP_ENABLED` was true when we built → `mcpEnabled` baked as true. 31 | - In Docker, we used a prebuilt image. Setting `MCP_ENABLED=true` at runtime does not change `runtimeConfig.mcpEnabled`. You must use `NUXT_MCP_ENABLED=true` to override at runtime. 32 | 33 | This explains why `/api/features` logs showed `process.env.MCP_ENABLED` as true, but `useRuntimeConfig().mcpEnabled` stayed false. 34 | 35 | ## ✅ The Fix 36 | 37 | ### Option A (Recommended): Use `NUXT_`-prefixed env vars in Docker 38 | 39 | Update `docker-compose.yaml`: 40 | 41 | ```yaml 42 | services: 43 | chatollama: 44 | environment: 45 | - NUXT_MCP_ENABLED=true 46 | - NUXT_KNOWLEDGE_BASE_ENABLED=true 47 | - NUXT_REALTIME_CHAT_ENABLED=true 48 | - NUXT_MODELS_MANAGEMENT_ENABLED=true 49 | ``` 50 | 51 | This maps directly to `runtimeConfig` at runtime — no code changes needed. 52 | 53 | ### Option B: Support both legacy and `NUXT_` in code 54 | 55 | If you want `MCP_ENABLED` to keep working, make `nuxt.config.ts` prefer the runtime `NUXT_` variables and fall back to the legacy ones: 56 | 57 | ```ts 58 | runtimeConfig: { 59 | knowledgeBaseEnabled: process.env.NUXT_KNOWLEDGE_BASE_ENABLED === 'true' || process.env.KNOWLEDGE_BASE_ENABLED === 'true', 60 | realtimeChatEnabled: process.env.NUXT_REALTIME_CHAT_ENABLED === 'true' || process.env.REALTIME_CHAT_ENABLED === 'true', 61 | modelsManagementEnabled: process.env.NUXT_MODELS_MANAGEMENT_ENABLED === 'true' || process.env.MODELS_MANAGEMENT_ENABLED === 'true', 62 | mcpEnabled: process.env.NUXT_MCP_ENABLED === 'true' || process.env.MCP_ENABLED === 'true', 63 | public: { /* ... */ } 64 | } 65 | ``` 66 | 67 | ## 🔧 How to Verify 68 | 69 | 1. Redeploy with the updated Compose env vars. 70 | 2. Hit `/api/features` and check logs — they print both environment vars and `runtimeConfig` values. 71 | 3. Open Settings: the MCP section should appear when `mcpEnabled` is true. 
72 | 73 | ## 🤔 Why it worked locally but not in Docker 74 | 75 | - **Local**: `.env` loaded before build → `runtimeConfig` baked with your values. 76 | - **Docker**: prebuilt image → runtime overrides require `NUXT_`-prefixed variables. 77 | 78 | ## 📝 Small DX touch-up (optional) 79 | 80 | - Add `modelsManagementEnabled` to the `FeatureFlags` interface in `composables/useFeatures.ts` for type completeness. 81 | 82 | ## 🎯 Takeaway 83 | 84 | Remember this rule of thumb with Nuxt 3: build-time envs bake defaults; runtime overrides need `NUXT_`. With that in place, the Settings page correctly reflects features across environments. 85 | -------------------------------------------------------------------------------- /src/content/blog/2025-08-19-feature-flags-in-docker-and-nuxt.md: -------------------------------------------------------------------------------- 1 | --- 2 | title: "Feature Flags in Docker: Why MCP_ENABLED Didn't Work and How We Fixed It" 3 | date: "2025-08-19" 4 | description: "Troubleshooting and fixing MCP feature flags that work in development but fail in Docker containers" 5 | --- 6 | 7 | 8 | *August 19, 2025* 9 | 10 | Hey everyone! 👋 11 | 12 | Following yesterday’s UI improvements post, I dug into a deployment gotcha that bit us when running in Docker: feature flags like MCP worked locally but not inside containers. Here’s what happened and how to fix it. 13 | 14 | ## 🐛 The Symptom 15 | 16 | - **Local dev**: Setting `MCP_ENABLED=true` in `.env` made the Settings → MCP module appear. 17 | - **Docker**: Setting `MCP_ENABLED=true` in `docker-compose.yaml` did nothing — the MCP section didn’t show up. 18 | 19 | ## 🔎 Root Cause: Nuxt runtimeConfig (build-time vs runtime) 20 | 21 | Nuxt 3 reads `runtimeConfig` values at build time via `process.env`. At runtime, overriding them requires environment variables that map to config keys with the `NUXT_` prefix. 22 | 23 | Our `nuxt.config.ts` had: 24 | 25 | ```ts 26 | runtimeConfig: { 27 | knowledgeBaseEnabled: process.env.KNOWLEDGE_BASE_ENABLED === 'true', 28 | realtimeChatEnabled: process.env.REALTIME_CHAT_ENABLED === 'true', 29 | modelsManagementEnabled: process.env.MODELS_MANAGEMENT_ENABLED === 'true', 30 | mcpEnabled: process.env.MCP_ENABLED === 'true', 31 | public: { /* ... */ } 32 | } 33 | ``` 34 | 35 | - In dev, `.env` is loaded before build, so `process.env.MCP_ENABLED` was true when we built → `mcpEnabled` baked as true. 36 | - In Docker, we used a prebuilt image. Setting `MCP_ENABLED=true` at runtime does not change `runtimeConfig.mcpEnabled`. You must use `NUXT_MCP_ENABLED=true` to override at runtime. 37 | 38 | This explains why `/api/features` logs showed `process.env.MCP_ENABLED` as true, but `useRuntimeConfig().mcpEnabled` stayed false. 39 | 40 | ## ✅ The Fix 41 | 42 | ### Option A (Recommended): Use `NUXT_`-prefixed env vars in Docker 43 | 44 | Update `docker-compose.yaml`: 45 | 46 | ```yaml 47 | services: 48 | chatollama: 49 | environment: 50 | - NUXT_MCP_ENABLED=true 51 | - NUXT_KNOWLEDGE_BASE_ENABLED=true 52 | - NUXT_REALTIME_CHAT_ENABLED=true 53 | - NUXT_MODELS_MANAGEMENT_ENABLED=true 54 | ``` 55 | 56 | This maps directly to `runtimeConfig` at runtime — no code changes needed. 
57 | 58 | ### Option B: Support both legacy and `NUXT_` in code 59 | 60 | If you want `MCP_ENABLED` to keep working, make `nuxt.config.ts` prefer the runtime `NUXT_` variables and fall back to the legacy ones: 61 | 62 | ```ts 63 | runtimeConfig: { 64 | knowledgeBaseEnabled: process.env.NUXT_KNOWLEDGE_BASE_ENABLED === 'true' || process.env.KNOWLEDGE_BASE_ENABLED === 'true', 65 | realtimeChatEnabled: process.env.NUXT_REALTIME_CHAT_ENABLED === 'true' || process.env.REALTIME_CHAT_ENABLED === 'true', 66 | modelsManagementEnabled: process.env.NUXT_MODELS_MANAGEMENT_ENABLED === 'true' || process.env.MODELS_MANAGEMENT_ENABLED === 'true', 67 | mcpEnabled: process.env.NUXT_MCP_ENABLED === 'true' || process.env.MCP_ENABLED === 'true', 68 | public: { /* ... */ } 69 | } 70 | ``` 71 | 72 | ## 🔧 How to Verify 73 | 74 | 1. Redeploy with the updated Compose env vars. 75 | 2. Hit `/api/features` and check logs — they print both environment vars and `runtimeConfig` values. 76 | 3. Open Settings: the MCP section should appear when `mcpEnabled` is true. 77 | 78 | ## 🤔 Why it worked locally but not in Docker 79 | 80 | - **Local**: `.env` loaded before build → `runtimeConfig` baked with your values. 81 | - **Docker**: prebuilt image → runtime overrides require `NUXT_`-prefixed variables. 82 | 83 | ## 📝 Small DX touch-up (optional) 84 | 85 | - Add `modelsManagementEnabled` to the `FeatureFlags` interface in `composables/useFeatures.ts` for type completeness. 86 | 87 | ## 🎯 Takeaway 88 | 89 | Remember this rule of thumb with Nuxt 3: build-time envs bake defaults; runtime overrides need `NUXT_`. With that in place, the Settings page correctly reflects features across environments. 90 | -------------------------------------------------------------------------------- /src/content/blog-zh/2025-08-25-docker-langchain-module-resolution-fix_zh.md: -------------------------------------------------------------------------------- 1 | --- 2 | title: "修复 Docker 模块解析错误:LangChain 依赖项调查" 3 | date: "2025-08-25" 4 | description: "Blog post about 修复 Docker 模块解析错误:LangChain 依赖项调查" 5 | --- 6 | 7 | 8 | **日期**:2025年8月25日 9 | **问题**:Docker 容器因 `Cannot find module '@langchain/core/prompts.js'` 错误而失败 10 | **解决方案**:LangChain 包间的依赖版本对齐 11 | 12 | ## 问题描述 13 | 14 | Docker 化的 ChatOllama 应用程序在聊天操作期间遇到关键的模块解析错误: 15 | 16 | ``` 17 | [nuxt] [request error] [unhandled] [500] Cannot find module '/app/.output/server/node_modules/@langchain/core/prompts.js' 18 | imported from /app/.output/server/chunks/routes/api/models/index.post.mjs 19 | ``` 20 | 21 | 此错误在多个 API 端点(`/api/models/chat`、`/api/instruction`、`/api/agents`)中持续出现,并阻止应用程序在 Docker 容器中正常运行。 22 | 23 | ## 调查过程 24 | 25 | ### 1. 初步分析 26 | - **错误模式**:`@langchain/core/prompts.js` 的 ESM 模块解析失败 27 | - **环境**:Docker 容器构建过程,而非本地开发 28 | - **受影响文件**:从 `@langchain/core/prompts` 导入的服务器 API 路由 29 | 30 | ### 2. 容器检查 31 | 调查发现 Docker 容器中缺少导出文件: 32 | 33 | ```bash 34 | /app/.output/server/node_modules/@langchain/core/prompts.js 35 | 36 | /app/.output/server/node_modules/@langchain/core/dist/prompts/index.js 37 | ``` 38 | 39 | ### 3. 版本冲突发现 40 | 在依赖树中发现了 **三个不同版本** 的 `@langchain/core`: 41 | 42 | - **项目规范**:`@langchain/core@^0.3.49` 43 | - **实际 Docker 解析**:`@langchain/core@0.3.72`(由 `deepagents@0.0.1` 引入) 44 | - **遗留版本**:`@langchain/core@0.1.54`(由较旧的包使用) 45 | 46 | 关键问题:`deepagents@0.0.1` 依赖项强制使用 `@langchain/core@0.3.72`,而项目指定了 `^0.3.49`,在 Nuxt 的构建打包过程中创建了版本冲突。 47 | 48 | ## 根因分析 49 | 50 | ### 核心问题 51 | **版本不匹配**:较新的 `@langchain/core@0.3.72` 具有不同的导出结构,与 Nuxt 为 Docker 部署打包模块的方式不兼容。 52 | 53 | ### 为什么 Docker 与本地不同? 
54 | - **本地开发**:pnpm 的工作区解析优雅地处理了冲突 55 | - **Docker 构建**:Nuxt 的生产打包暴露了版本不一致性 56 | - **模块解析**:不同版本之间的 ESM 导出映射不同 57 | 58 | ### 技术细节 59 | ```json 60 | // package.json 指定的版本 61 | "@langchain/core": "^0.3.49" 62 | 63 | // 但依赖解析拉取了 64 | "deepagents@0.0.1" → "@langchain/core@0.3.72" 65 | 66 | // 导致打包期间缺少导出 67 | ``` 68 | 69 | ## 解决方案:依赖对齐 70 | 71 | ### 方法 72 | 我们没有选择手动文件补丁,而是通过将所有 LangChain 包更新为兼容版本来选择 **正确的依赖管理**。 73 | 74 | ### 应用的包更新 75 | 76 | ```json 77 | { 78 | // 版本对齐的核心更新 79 | "@langchain/core": "^0.3.49" → "^0.3.72", 80 | 81 | // 兼容包更新 82 | "@langchain/anthropic": "^0.3.19" → "^0.3.26", 83 | "@langchain/community": "^0.3.41" → "^0.3.53", 84 | "@langchain/google-genai": "^0.1.5" → "^0.2.16", 85 | "@langchain/groq": "^0.0.5" → "^0.2.3", 86 | "@langchain/ollama": "^0.2.0" → "^0.2.3", 87 | "@langchain/openai": "^0.5.7" → "^0.6.9", 88 | 89 | // 提供商特定更新 90 | "@langchain/azure-openai": "^0.0.4" → "^0.0.11", 91 | "@langchain/cohere": "^0.0.6" → "^0.3.4", 92 | 93 | // 对等依赖修复 94 | "ws": "^8.16.0" → "^8.18.0", 95 | "zod": "^3.23.8" → "^3.24.1" 96 | } 97 | ``` 98 | 99 | ### 实施步骤 100 | 101 | ```bash 102 | # 2. 重新安装依赖项 103 | pnpm install 104 | 105 | pnpm run build 106 | 107 | # (server/api/agents/[id].post.ts 中缺少括号) 108 | 109 | ✓ Built in 17.34s 110 | ``` 111 | 112 | ## 验证结果 113 | 114 | ### 修复前 115 | - **Docker 错误**:模块解析失败 116 | - **版本冲突**:3个不同的 @langchain/core 版本 117 | - **对等依赖**:多个警告 118 | - **构建状态**:在 Docker 中失败 119 | 120 | ### 修复后 121 | - **依赖解析**:所有 LangChain 包使用 `@langchain/core@0.3.72` 122 | - **本地构建**:✅ 成功(`pnpm run build`) 123 | - **模块导出**:所有包之间一致 124 | - **对等警告**:减少到最小的非关键问题 125 | 126 | ## 学到的最佳实践 127 | 128 | ### 1. 依赖管理 129 | - **始终对齐相关包家族的主要依赖版本** 130 | - **对 LangChain 核心等关键依赖使用精确或兼容范围** 131 | - **定期依赖审计** 以捕获版本偏移 132 | 133 | ### 2. Docker 特定考虑事项 134 | - **在开发期间在 Docker 中测试构建**,而不仅仅是本地 135 | - **版本冲突在容器化构建中的表现不同** 与本地开发 136 | - **ESM 模块解析** 对版本不匹配很敏感 137 | 138 | ### 3. 调查方法 139 | - **首先检查容器** 以了解实际文件结构 140 | - **依赖树分析** 以识别版本冲突 141 | - **标准工具而非手动修复** 用于可持续解决方案 142 | 143 | ## 开发者技术细节 144 | 145 | ### 修改的文件 146 | - `package.json`:更新了 LangChain 包版本 147 | - `pnpm-lock.yaml`:使用一致的解析重新生成 148 | - `server/api/agents/[id].post.ts`:修复了语法错误(缺少括号) 149 | 150 | ### 重现命令 151 | ```bash 152 | docker exec ls -la /app/.output/server/node_modules/@langchain/core/ 153 | 154 | docker exec find /app/.output/server/node_modules/@langchain/core -name "*prompt*" 155 | 156 | npm list @langchain/core 157 | ``` 158 | 159 | ### 预防策略 160 | ```json 161 | // package.json - 对关键依赖项使用更严格的版本范围 162 | { 163 | "@langchain/core": "~0.3.72", // 仅限补丁级别的波浪号 164 | "deepagents": "^0.0.1" // 确保兼容性 165 | } 166 | ``` 167 | 168 | ## 结论 169 | 170 | 这个问题突出了现代 JavaScript 应用程序中 **一致依赖管理** 的重要性,特别是在通过 Docker 部署时。正确的解决方案涉及将整个 LangChain 生态系统更新为兼容版本,而不是应用手动补丁。 171 | 172 | ### 关键要点 173 | 1. **版本冲突** 在本地和 Docker 环境之间可能表现不同 174 | 2. **依赖对齐** 对 ESM 模块解析至关重要 175 | 3. **标准包管理** 始终优于手动文件修复 176 | 4. 
**容器特定测试** 应该是开发工作流程的一部分 177 | 178 | 此修复确保 ChatOllama 的 Docker 部署可靠工作,同时保持标准构建过程并使依赖项与最新的 LangChain 生态系统改进保持同步。 -------------------------------------------------------------------------------- /content/zh/20250825-docker-langchain-module-resolution-fix_zh.md: -------------------------------------------------------------------------------- 1 | # 修复 Docker 模块解析错误:LangChain 依赖项调查 2 | 3 | **日期**:2025年8月25日 4 | **问题**:Docker 容器因 `Cannot find module '@langchain/core/prompts.js'` 错误而失败 5 | **解决方案**:LangChain 包间的依赖版本对齐 6 | 7 | ## 问题描述 8 | 9 | Docker 化的 ChatOllama 应用程序在聊天操作期间遇到关键的模块解析错误: 10 | 11 | ``` 12 | [nuxt] [request error] [unhandled] [500] Cannot find module '/app/.output/server/node_modules/@langchain/core/prompts.js' 13 | imported from /app/.output/server/chunks/routes/api/models/index.post.mjs 14 | ``` 15 | 16 | 此错误在多个 API 端点(`/api/models/chat`、`/api/instruction`、`/api/agents`)中持续出现,并阻止应用程序在 Docker 容器中正常运行。 17 | 18 | ## 调查过程 19 | 20 | ### 1. 初步分析 21 | - **错误模式**:`@langchain/core/prompts.js` 的 ESM 模块解析失败 22 | - **环境**:Docker 容器构建过程,而非本地开发 23 | - **受影响文件**:从 `@langchain/core/prompts` 导入的服务器 API 路由 24 | 25 | ### 2. 容器检查 26 | 调查发现 Docker 容器中缺少导出文件: 27 | 28 | ```bash 29 | # 预期但缺失的文件 30 | /app/.output/server/node_modules/@langchain/core/prompts.js 31 | 32 | # 可用的目录结构 33 | /app/.output/server/node_modules/@langchain/core/dist/prompts/index.js 34 | ``` 35 | 36 | ### 3. 版本冲突发现 37 | 在依赖树中发现了 **三个不同版本** 的 `@langchain/core`: 38 | 39 | - **项目规范**:`@langchain/core@^0.3.49` 40 | - **实际 Docker 解析**:`@langchain/core@0.3.72`(由 `deepagents@0.0.1` 引入) 41 | - **遗留版本**:`@langchain/core@0.1.54`(由较旧的包使用) 42 | 43 | 关键问题:`deepagents@0.0.1` 依赖项强制使用 `@langchain/core@0.3.72`,而项目指定了 `^0.3.49`,在 Nuxt 的构建打包过程中创建了版本冲突。 44 | 45 | ## 根因分析 46 | 47 | ### 核心问题 48 | **版本不匹配**:较新的 `@langchain/core@0.3.72` 具有不同的导出结构,与 Nuxt 为 Docker 部署打包模块的方式不兼容。 49 | 50 | ### 为什么 Docker 与本地不同? 51 | - **本地开发**:pnpm 的工作区解析优雅地处理了冲突 52 | - **Docker 构建**:Nuxt 的生产打包暴露了版本不一致性 53 | - **模块解析**:不同版本之间的 ESM 导出映射不同 54 | 55 | ### 技术细节 56 | ```json 57 | // package.json 指定的版本 58 | "@langchain/core": "^0.3.49" 59 | 60 | // 但依赖解析拉取了 61 | "deepagents@0.0.1" → "@langchain/core@0.3.72" 62 | 63 | // 导致打包期间缺少导出 64 | ``` 65 | 66 | ## 解决方案:依赖对齐 67 | 68 | ### 方法 69 | 我们没有选择手动文件补丁,而是通过将所有 LangChain 包更新为兼容版本来选择 **正确的依赖管理**。 70 | 71 | ### 应用的包更新 72 | 73 | ```json 74 | { 75 | // 版本对齐的核心更新 76 | "@langchain/core": "^0.3.49" → "^0.3.72", 77 | 78 | // 兼容包更新 79 | "@langchain/anthropic": "^0.3.19" → "^0.3.26", 80 | "@langchain/community": "^0.3.41" → "^0.3.53", 81 | "@langchain/google-genai": "^0.1.5" → "^0.2.16", 82 | "@langchain/groq": "^0.0.5" → "^0.2.3", 83 | "@langchain/ollama": "^0.2.0" → "^0.2.3", 84 | "@langchain/openai": "^0.5.7" → "^0.6.9", 85 | 86 | // 提供商特定更新 87 | "@langchain/azure-openai": "^0.0.4" → "^0.0.11", 88 | "@langchain/cohere": "^0.0.6" → "^0.3.4", 89 | 90 | // 对等依赖修复 91 | "ws": "^8.16.0" → "^8.18.0", 92 | "zod": "^3.23.8" → "^3.24.1" 93 | } 94 | ``` 95 | 96 | ### 实施步骤 97 | 98 | ```bash 99 | # 1. 使用兼容版本更新 package.json 100 | # 2. 重新安装依赖项 101 | pnpm install 102 | 103 | # 3. 验证构建成功 104 | pnpm run build 105 | 106 | # 4. 修复发现的语法错误 107 | # (server/api/agents/[id].post.ts 中缺少括号) 108 | 109 | # 5. 
成功完成构建 110 | ✓ Built in 17.34s 111 | ``` 112 | 113 | ## 验证结果 114 | 115 | ### 修复前 116 | - **Docker 错误**:模块解析失败 117 | - **版本冲突**:3个不同的 @langchain/core 版本 118 | - **对等依赖**:多个警告 119 | - **构建状态**:在 Docker 中失败 120 | 121 | ### 修复后 122 | - **依赖解析**:所有 LangChain 包使用 `@langchain/core@0.3.72` 123 | - **本地构建**:✅ 成功(`pnpm run build`) 124 | - **模块导出**:所有包之间一致 125 | - **对等警告**:减少到最小的非关键问题 126 | 127 | ## 学到的最佳实践 128 | 129 | ### 1. 依赖管理 130 | - **始终对齐相关包家族的主要依赖版本** 131 | - **对 LangChain 核心等关键依赖使用精确或兼容范围** 132 | - **定期依赖审计** 以捕获版本偏移 133 | 134 | ### 2. Docker 特定考虑事项 135 | - **在开发期间在 Docker 中测试构建**,而不仅仅是本地 136 | - **版本冲突在容器化构建中的表现不同** 与本地开发 137 | - **ESM 模块解析** 对版本不匹配很敏感 138 | 139 | ### 3. 调查方法 140 | - **首先检查容器** 以了解实际文件结构 141 | - **依赖树分析** 以识别版本冲突 142 | - **标准工具而非手动修复** 用于可持续解决方案 143 | 144 | ## 开发者技术细节 145 | 146 | ### 修改的文件 147 | - `package.json`:更新了 LangChain 包版本 148 | - `pnpm-lock.yaml`:使用一致的解析重新生成 149 | - `server/api/agents/[id].post.ts`:修复了语法错误(缺少括号) 150 | 151 | ### 重现命令 152 | ```bash 153 | # 检查容器依赖项 154 | docker exec ls -la /app/.output/server/node_modules/@langchain/core/ 155 | 156 | # 检查缺少的导出 157 | docker exec find /app/.output/server/node_modules/@langchain/core -name "*prompt*" 158 | 159 | # 验证本地与容器的差异 160 | npm list @langchain/core 161 | ``` 162 | 163 | ### 预防策略 164 | ```json 165 | // package.json - 对关键依赖项使用更严格的版本范围 166 | { 167 | "@langchain/core": "~0.3.72", // 仅限补丁级别的波浪号 168 | "deepagents": "^0.0.1" // 确保兼容性 169 | } 170 | ``` 171 | 172 | ## 结论 173 | 174 | 这个问题突出了现代 JavaScript 应用程序中 **一致依赖管理** 的重要性,特别是在通过 Docker 部署时。正确的解决方案涉及将整个 LangChain 生态系统更新为兼容版本,而不是应用手动补丁。 175 | 176 | ### 关键要点 177 | 1. **版本冲突** 在本地和 Docker 环境之间可能表现不同 178 | 2. **依赖对齐** 对 ESM 模块解析至关重要 179 | 3. **标准包管理** 始终优于手动文件修复 180 | 4. **容器特定测试** 应该是开发工作流程的一部分 181 | 182 | 此修复确保 ChatOllama 的 Docker 部署可靠工作,同时保持标准构建过程并使依赖项与最新的 LangChain 生态系统改进保持同步。 -------------------------------------------------------------------------------- /src/layouts/BaseLayout.astro: -------------------------------------------------------------------------------- 1 | --- 2 | import { getLangFromUrl, useTranslations } from '@/utils/i18n'; 3 | import '@/styles/global.css'; 4 | 5 | export interface Props { 6 | title: string; 7 | description?: string; 8 | } 9 | 10 | const { title, description } = Astro.props; 11 | const lang = getLangFromUrl(Astro.url); 12 | const t = useTranslations(lang); 13 | const metaDescription = description || t('meta.description'); 14 | 15 | // Use the configured site URL for production, fallback to Astro.url for development 16 | const siteUrl = import.meta.env.SITE || Astro.site || Astro.url.origin; 17 | const currentUrl = new URL(Astro.url.pathname, siteUrl); 18 | const imageUrl = new URL('/social_share.png', siteUrl); 19 | --- 20 | 21 | 22 | 23 | 24 | 25 | 26 | 27 | 28 | 29 | {title} 30 | 31 | 32 | 33 | 34 | 35 | 36 | 37 | 38 | 39 | 40 | 41 | 42 | 43 | 44 | 45 | 46 | 47 | 48 | 49 | 50 | 51 | 52 | 53 | 54 | 55 | 56 | 57 | 58 | 59 | 60 |
61 |
62 | 91 |
92 | 93 |
94 | 95 |
96 | 97 |
98 |
99 |
100 | © {new Date().getFullYear()} ChatOllama. Open source chatbot platform. 101 |
102 |
103 |
104 |
105 | 106 | 110 | 111 | 112 | -------------------------------------------------------------------------------- /content/20250818-ui-improvements-and-chat-fixes.md: -------------------------------------------------------------------------------- 1 | # UI Improvements and Chat Reliability Fixes 2 | 3 | *August 18, 2025* 4 | 5 | Hey everyone! 👋 6 | 7 | I've been working on some important improvements to the chat interface over the past few days. Here's what's new and what got fixed. 8 | 9 | ## 🐛 Major Bug Fixes 10 | 11 | ### Chat Creation Button Issues 12 | One of the most frustrating bugs was the unresponsive "create new chat" button. Users would click it, nothing would happen, then they'd click multiple times and suddenly get several new chats created at once. 13 | 14 | **What was happening:** 15 | - The `scrollToBottom` function was trying to access `messageListEl.value.scrollHeight` before the DOM element was ready 16 | - No loading state protection meant rapid clicks could trigger multiple API calls 17 | - Race conditions in the chat creation flow 18 | 19 | **The fix:** 20 | ```javascript 21 | // Added null check in scrollToBottom 22 | const scrollToBottom = (_behavior: ScrollBehavior) => { 23 | behavior.value = _behavior 24 | if (messageListEl.value) { 25 | y.value = messageListEl.value.scrollHeight 26 | } 27 | } 28 | 29 | // Added loading state in ChatSessionList 30 | const isCreatingChat = ref(false) 31 | 32 | async function onNewChat() { 33 | if (isCreatingChat.value) return 34 | 35 | isCreatingChat.value = true 36 | try { 37 | const data = await createChatSession() 38 | sessionList.value.unshift(data) 39 | await router.push(`/chat/${data.id}`) 40 | } finally { 41 | isCreatingChat.value = false 42 | } 43 | } 44 | ``` 45 | 46 | This was a classic example of how small timing issues can create really annoying UX problems! 47 | 48 | ## ✨ New Feature: Enhanced Preview Panel 49 | 50 | The artifact preview system got a major upgrade! Previously, users could only view code artifacts in a basic side panel. Now we have: 51 | 52 | ### Split View Mode 53 | - Chat takes up the remaining space 54 | - Preview panel has a fixed 500px width 55 | - Both are visible simultaneously for context 56 | 57 | ### Fullscreen Mode 58 | - Preview covers the entire viewport 59 | - Header is completely hidden for maximum viewing area 60 | - Floating close button with semi-transparent background 61 | - Perfect for viewing complex HTML demos or detailed diagrams 62 | 63 | ### Smart State Management 64 | This was trickier than it sounds. The key insight was separating the "show/hide preview" state from the "normal/fullscreen" state: 65 | 66 | ```javascript 67 | // Two separate states instead of one confusing state 68 | const showArtifacts = ref(false) 69 | const isFullscreen = ref(false) 70 | 71 | // Smart close behavior 72 | const closeArtifacts = () => { 73 | showArtifacts.value = false 74 | isFullscreen.value = false // Reset fullscreen when closing 75 | } 76 | 77 | // Fullscreen close just exits fullscreen, doesn't close preview 78 | const toggleFullscreen = () => { 79 | isFullscreen.value = !isFullscreen.value 80 | } 81 | ``` 82 | 83 | The UX flow is now: 84 | 1. Click preview → Opens in split view 85 | 2. Click fullscreen → Expands to fullscreen 86 | 3. Click X in fullscreen → Returns to split view 87 | 4. Click X in split view → Closes preview completely 88 | 89 | ## 🎨 Animation Polish 90 | 91 | Changed the preview icon animation from a slide-in effect to a fade-in effect. 
Sometimes the smallest changes make the biggest difference in how polished an interface feels. 92 | 93 | ```scss 94 | // Before: Slide in from right 95 | .artifact-btn { 96 | opacity: 0; 97 | transform: translateX(8px); 98 | } 99 | 100 | // After: Simple fade 101 | .artifact-btn { 102 | opacity: 0; 103 | transition: all 0.3s cubic-bezier(0.4, 0, 0.2, 1); 104 | } 105 | ``` 106 | 107 | ## 📚 What I Learned 108 | 109 | ### 1. DOM Timing Issues Are Everywhere 110 | The `scrollToBottom` bug was a reminder that Vue's reactivity is fast, but the DOM still needs time to update. Always check if elements exist before accessing their properties. 111 | 112 | ### 2. State Management Complexity 113 | Initially, I tried to make the preview system "smart" with resizable splits and complex state. But simpler is often better - two clear modes (split/fullscreen) with obvious transitions work much better for users. 114 | 115 | ### 3. User Testing Reveals Edge Cases 116 | The chat creation bug only happened under specific timing conditions. Real user behavior (rapid clicking when something seems broken) often reveals issues that don't show up in normal development testing. 117 | 118 | ## 💭 Thoughts for Fellow Developers 119 | 120 | These kinds of UI reliability fixes might not be glamorous, but they have huge impact on user experience. A button that works 95% of the time feels broken to users. Taking the time to handle edge cases and race conditions is what separates good interfaces from great ones. 121 | 122 | Also, when building preview/modal systems, always think about the exit flow as much as the entry flow. Users need to understand how to get back to where they came from! 123 | 124 | --- 125 | 126 | *What features would you like to see improved next? Drop your thoughts in the issues!* 127 | 128 | *- Your dev team* -------------------------------------------------------------------------------- /src/content/blog/2025-08-18-ui-improvements-and-chat-fixes.md: -------------------------------------------------------------------------------- 1 | --- 2 | title: "UI Improvements and Chat Reliability Fixes" 3 | date: "2025-08-18" 4 | description: "Important improvements to the chat interface and bug fixes for better reliability" 5 | --- 6 | 7 | 8 | *August 18, 2025* 9 | 10 | Hey everyone! 👋 11 | 12 | I've been working on some important improvements to the chat interface over the past few days. Here's what's new and what got fixed. 13 | 14 | ## 🐛 Major Bug Fixes 15 | 16 | ### Chat Creation Button Issues 17 | One of the most frustrating bugs was the unresponsive "create new chat" button. Users would click it, nothing would happen, then they'd click multiple times and suddenly get several new chats created at once. 
18 | 19 | **What was happening:** 20 | - The `scrollToBottom` function was trying to access `messageListEl.value.scrollHeight` before the DOM element was ready 21 | - No loading state protection meant rapid clicks could trigger multiple API calls 22 | - Race conditions in the chat creation flow 23 | 24 | **The fix:** 25 | ```javascript 26 | // Added null check in scrollToBottom 27 | const scrollToBottom = (_behavior: ScrollBehavior) => { 28 | behavior.value = _behavior 29 | if (messageListEl.value) { 30 | y.value = messageListEl.value.scrollHeight 31 | } 32 | } 33 | 34 | // Added loading state in ChatSessionList 35 | const isCreatingChat = ref(false) 36 | 37 | async function onNewChat() { 38 | if (isCreatingChat.value) return 39 | 40 | isCreatingChat.value = true 41 | try { 42 | const data = await createChatSession() 43 | sessionList.value.unshift(data) 44 | await router.push(`/chat/${data.id}`) 45 | } finally { 46 | isCreatingChat.value = false 47 | } 48 | } 49 | ``` 50 | 51 | This was a classic example of how small timing issues can create really annoying UX problems! 52 | 53 | ## ✨ New Feature: Enhanced Preview Panel 54 | 55 | The artifact preview system got a major upgrade! Previously, users could only view code artifacts in a basic side panel. Now we have: 56 | 57 | ### Split View Mode 58 | - Chat takes up the remaining space 59 | - Preview panel has a fixed 500px width 60 | - Both are visible simultaneously for context 61 | 62 | ### Fullscreen Mode 63 | - Preview covers the entire viewport 64 | - Header is completely hidden for maximum viewing area 65 | - Floating close button with semi-transparent background 66 | - Perfect for viewing complex HTML demos or detailed diagrams 67 | 68 | ### Smart State Management 69 | This was trickier than it sounds. The key insight was separating the "show/hide preview" state from the "normal/fullscreen" state: 70 | 71 | ```javascript 72 | // Two separate states instead of one confusing state 73 | const showArtifacts = ref(false) 74 | const isFullscreen = ref(false) 75 | 76 | // Smart close behavior 77 | const closeArtifacts = () => { 78 | showArtifacts.value = false 79 | isFullscreen.value = false // Reset fullscreen when closing 80 | } 81 | 82 | // Fullscreen close just exits fullscreen, doesn't close preview 83 | const toggleFullscreen = () => { 84 | isFullscreen.value = !isFullscreen.value 85 | } 86 | ``` 87 | 88 | The UX flow is now: 89 | 1. Click preview → Opens in split view 90 | 2. Click fullscreen → Expands to fullscreen 91 | 3. Click X in fullscreen → Returns to split view 92 | 4. Click X in split view → Closes preview completely 93 | 94 | ## 🎨 Animation Polish 95 | 96 | Changed the preview icon animation from a slide-in effect to a fade-in effect. Sometimes the smallest changes make the biggest difference in how polished an interface feels. 97 | 98 | ```scss 99 | // Before: Slide in from right 100 | .artifact-btn { 101 | opacity: 0; 102 | transform: translateX(8px); 103 | } 104 | 105 | // After: Simple fade 106 | .artifact-btn { 107 | opacity: 0; 108 | transition: all 0.3s cubic-bezier(0.4, 0, 0.2, 1); 109 | } 110 | ``` 111 | 112 | ## 📚 What I Learned 113 | 114 | ### 1. DOM Timing Issues Are Everywhere 115 | The `scrollToBottom` bug was a reminder that Vue's reactivity is fast, but the DOM still needs time to update. Always check if elements exist before accessing their properties. 116 | 117 | ### 2. State Management Complexity 118 | Initially, I tried to make the preview system "smart" with resizable splits and complex state. 
But simpler is often better - two clear modes (split/fullscreen) with obvious transitions work much better for users. 119 | 120 | ### 3. User Testing Reveals Edge Cases 121 | The chat creation bug only happened under specific timing conditions. Real user behavior (rapid clicking when something seems broken) often reveals issues that don't show up in normal development testing. 122 | 123 | ## 💭 Thoughts for Fellow Developers 124 | 125 | These kinds of UI reliability fixes might not be glamorous, but they have huge impact on user experience. A button that works 95% of the time feels broken to users. Taking the time to handle edge cases and race conditions is what separates good interfaces from great ones. 126 | 127 | Also, when building preview/modal systems, always think about the exit flow as much as the entry flow. Users need to understand how to get back to where they came from! 128 | 129 | --- 130 | 131 | *What features would you like to see improved next? Drop your thoughts in the issues!* 132 | 133 | *- Your dev team* -------------------------------------------------------------------------------- /content/20250825-langchain-upgrade-chat-fix.md: -------------------------------------------------------------------------------- 1 | # LangChain Core Package Upgrade Breaks Chat: A Quick Fix Story 2 | 3 | **Date:** August 25, 2025 4 | **Issue:** Chat functionality broken after LangChain dependency upgrade 5 | **Resolution Time:** ~4 hours 6 | 7 | ## 🐛 The Problem 8 | 9 | What started as a routine `LangChain` dependency upgrade (`0.3.49` -> `0.3.72`) to fix Docker module resolution issues quickly turned into a critical incident. After upgrading the LangChain packages, the chat functionality completely stopped working across the entire platform. Users could no longer send messages or receive responses from any AI models, effectively rendering the core feature of ChatOllama unusable. 10 | 11 | The issue was particularly frustrating because there were no obvious error messages or warnings during the upgrade process. The application started normally, but every chat attempt simply failed silently. 12 | 13 | ## 🔍 Root Cause Investigation 14 | 15 | After diving into the logs and tracing through the code, we discovered that the LangChain upgrade had introduced breaking API changes in the chat model constructors. What made this especially tricky was that these weren't compile-time errors - the old parameter names were simply ignored, causing the models to initialize with undefined configurations. 16 | 17 | During the LangChain upgrade process, several parameter names in the ChatOpenAI model constructor underwent changes. While these parameters were merely marked as `deprecated`, their usage in downstream implementations had already changed. 
The deprecated parameters include: 18 | 19 | - `modelName` 20 | - `openAIApiKey` 21 | 22 | The breaking changes affected multiple model providers, with each requiring specific parameter name updates: 23 | 24 | ### Before (Working): 25 | ```typescript 26 | new ChatOpenAI({ 27 | configuration: { baseURL }, 28 | openAIApiKey: params.key, // ❌ Deprecated 29 | modelName: modelName, // ❌ Deprecated 30 | }) 31 | 32 | new ChatAnthropic({ 33 | anthropicApiUrl: endpoint, 34 | anthropicApiKey: params.key, // ❌ Deprecated 35 | modelName: modelName, // ❌ Deprecated 36 | }) 37 | ``` 38 | 39 | ### After (Fixed): 40 | ```typescript 41 | new ChatOpenAI({ 42 | configuration: { baseURL }, 43 | apiKey: params.key, // ✅ New API 44 | model: modelName, // ✅ New API 45 | }) 46 | 47 | new ChatAnthropic({ 48 | anthropicApiUrl: endpoint, 49 | apiKey: params.key, // ✅ New API 50 | model: modelName, // ✅ New API 51 | }) 52 | ``` 53 | 54 | ## 🔧 The Fix Implementation 55 | 56 | Once we identified the root cause, the fix was relatively straightforward but required careful attention to detail. We needed to update parameter names across all affected model providers while ensuring backward compatibility and adding better error handling. 57 | 58 | The following models required updates: 59 | - **OpenAI (ChatOpenAI)** - Most commonly used provider 60 | - **Anthropic (ChatAnthropic)** - Critical for AI agents functionality 61 | - **Gemini (ChatGoogleGenerativeAI)** - Used for multimodal features 62 | - **Groq (ChatGroq)** - High-performance inference option 63 | 64 | The key changes implemented were: 65 | 1. Standardized `openAIApiKey` and `anthropicApiKey` to the unified `apiKey` parameter 66 | 2. Updated `modelName` to the more concise `model` parameter across all providers 67 | 3. Enhanced error handling to provide clear feedback when configurations are missing 68 | 69 | Beyond just fixing the parameter names, we took the opportunity to add robust fallback logic. Now, when external API providers fail due to missing keys or configuration issues, the system gracefully falls back to Ollama, ensuring users can continue chatting even if their preferred provider is misconfigured. 70 | 71 | ## 📚 Lessons Learned 72 | 73 | This incident reinforced several important principles for managing dependencies in production applications: 74 | 75 | **Test Thoroughly After Major Upgrades:** Even seemingly minor version bumps can introduce breaking changes that aren't immediately obvious. Comprehensive testing across all features is essential, not just the areas you expect to be affected. 76 | 77 | **Embrace API Standardization:** While initially disruptive, LangChain's move to standardize parameter names across providers is a positive long-term change that will reduce confusion and make the codebase more maintainable. 78 | 79 | **Always Implement Graceful Degradation:** Having robust fallback mechanisms isn't just good practice - it's essential for maintaining user trust when external dependencies fail or change unexpectedly. 80 | 81 | ## 🚀 Impact and Resolution 82 | 83 | The fix was deployed immediately after identification, resulting in zero downtime for users. The updated implementation maintains full backward compatibility while leveraging the new standardized APIs. As an added benefit, the enhanced error handling and fallback mechanisms have actually improved the overall reliability of the chat system. 
84 | 85 | This incident serves as a reminder that in the fast-moving world of AI and machine learning libraries, staying current with dependencies requires constant vigilance and thorough testing practices. 86 | 87 | --- 88 | 89 | *This was a classic case of "silent" breaking changes in a major upgrade - the kind that make experienced developers always read changelogs twice. The fix was simple once identified, but the experience highlights why we never take seemingly routine updates for granted.* 90 | -------------------------------------------------------------------------------- /src/content/blog-zh/2025-09-11-building-contextual-quick-chat-inspired-by-ai-ides_zh.md: -------------------------------------------------------------------------------- 1 | --- 2 | title: "构建上下文快速聊天:当AI IDE启发Web应用" 3 | date: "2025-09-11" 4 | description: "如何将AI IDE中熟悉的快速编辑体验带到Web聊天应用中,解决文本选择持久化问题,创建真正的上下文AI助手" 5 | --- 6 | 7 | > 如何将AI IDE中熟悉的"快速编辑"体验带到基于Web的聊天应用程序中,解决文本选择持久化问题并创建真正的上下文AI助手。 8 | 9 | ## 灵感来源:AI IDE的正确做法 10 | 11 | 如果你使用过现代AI驱动的IDE,如Cursor、GitHub Copilot或Claude Code,你一定体验过一种令人愉悦的交互模式:选择一些代码,右键单击或使用键盘快捷键,立即在一个紧凑的对话框中获得上下文AI帮助。无需上下文切换,无需复制粘贴,不会在代码中迷失位置。 12 | 13 | 这种交互如此直观,以至于当用户遇到它时,他们立即明白该怎么做。选中的文本提供了完美的上下文,对话框准确地出现在需要的地方,AI帮助感觉真正集成到工作流程中。 14 | 15 | ## 挑战:Web环境的现实 16 | 17 | 将这种体验带到Web应用程序中面临独特的挑战: 18 | 19 | ### 1. **文本选择持久化** 20 | 在原生应用中,文本选择在模态窗口中保持稳定。在Web中,DOM操作、焦点变化和页面重新渲染都会清除选择。 21 | 22 | ### 2. **跨组件状态管理** 23 | 用户可能在一个组件中选择文本,但需要在另一个组件(聊天界面)中引用它。这需要可靠的状态管理。 24 | 25 | ### 3. **用户体验期望** 26 | 现代用户期望即时性。任何延迟或"重复劳动"的感觉都会破坏体验的魔力。 27 | 28 | ## 我们的解决方案:上下文快速聊天 29 | 30 | ### 核心架构 31 | 32 | 我们构建了一个系统,可以: 33 | 1. **捕获用户选择**:在页面的任何地方 34 | 2. **保留上下文**:即使通过导航和重新渲染 35 | 3. **提供即时访问**:通过键盘快捷键或右键菜单 36 | 4. **智能预填充**:带有选中文本和合理默认提示的聊天 37 | 38 | ### 技术实现 39 | 40 | #### 1. 选择捕获和存储 41 | ```typescript 42 | class SelectionManager { 43 | private selectedText: string = ''; 44 | private selectionContext: SelectionContext | null = null; 45 | 46 | captureSelection(): void { 47 | const selection = window.getSelection(); 48 | if (selection && selection.toString().trim()) { 49 | this.selectedText = selection.toString().trim(); 50 | this.selectionContext = { 51 | pageUrl: window.location.href, 52 | timestamp: Date.now(), 53 | surroundingContext: this.getSurroundingContext(selection) 54 | }; 55 | } 56 | } 57 | 58 | private getSurroundingContext(selection: Selection): string { 59 | // 获取选择前后的文本以提供更多上下文 60 | const range = selection.getRangeAt(0); 61 | const container = range.commonAncestorContainer; 62 | return container.textContent?.substring( 63 | Math.max(0, range.startOffset - 100), 64 | Math.min(container.textContent.length, range.endOffset + 100) 65 | ) || ''; 66 | } 67 | } 68 | ``` 69 | 70 | #### 2. 键盘快捷键集成 71 | ```typescript 72 | class QuickChatTrigger { 73 | constructor(private selectionManager: SelectionManager) { 74 | this.setupKeyboardShortcuts(); 75 | this.setupContextMenu(); 76 | } 77 | 78 | private setupKeyboardShortcuts(): void { 79 | document.addEventListener('keydown', (e) => { 80 | // Cmd/Ctrl + Shift + Enter 触发快速聊天 81 | if ((e.metaKey || e.ctrlKey) && e.shiftKey && e.key === 'Enter') { 82 | e.preventDefault(); 83 | this.triggerQuickChat(); 84 | } 85 | }); 86 | } 87 | 88 | private triggerQuickChat(): void { 89 | const context = this.selectionManager.getContext(); 90 | if (context.selectedText) { 91 | this.openQuickChatModal(context); 92 | } 93 | } 94 | } 95 | ``` 96 | 97 | #### 3. 上下文感知的聊天预填充 98 | ```vue 99 |