import ollama from 'ollama'

// Single-turn chat: send one user message and print the content of the returned message.
const messages = [{ role: 'user', content: '什么是 JavaScript？' }]
const response = await ollama.chat({ model: 'llama3.2', messages })

const { content } = response.message
console.log(content)

多轮对话

// Multi-turn chat: the earlier user/assistant exchange is sent together with
// the new question, all in a single `messages` array.
const history = [
  { role: 'user', content: '我叫小明' },
  { role: 'assistant', content: '你好小明！' }
]
const question = { role: 'user', content: '我叫什么名字？' }

const response = await ollama.chat({
  model: 'llama3.2',
  messages: [...history, question]
})

const { content } = response.message
console.log(content)

系统提示

// System prompt: a message with role `system` is placed ahead of the user's question.
const systemMessage = { role: 'system', content: '你是一个 JavaScript 专家' }
const userMessage = { role: 'user', content: '什么是闭包？' }

const response = await ollama.chat({
  model: 'llama3.2',
  messages: [systemMessage, userMessage]
})

带参数

// Chat with parameters: extra model settings are passed through the `options` field.
const options = {
  temperature: 0.7,
  num_ctx: 4096,
  top_p: 0.9
}
const messages = [{ role: 'user', content: '写一首诗' }]

const response = await ollama.chat({ model: 'llama3.2', messages, options })

生成接口

基本生成

// Basic generation: send a single prompt and print the `response` field of the result.
const request = {
  model: 'llama3.2',
  prompt: '用 JavaScript 写一个快速排序'
}
const response = await ollama.generate(request)

const { response: text } = response
console.log(text)

带系统提示

// Generation with a system prompt: `system` is supplied alongside `prompt`.
const request = {
  model: 'llama3.2',
  prompt: '写一个函数',
  system: '你是一个 JavaScript 编程专家'
}
const response = await ollama.generate(request)

JSON 格式输出

// JSON output: request `format: 'json'`, then parse the returned text into an object.
const request = {
  model: 'llama3.2',
  prompt: '生成一个用户信息，包含姓名、年龄、邮箱',
  format: 'json'
}
const response = await ollama.generate(request)

// `response.response` is a string; JSON.parse throws if it is not valid JSON.
const { response: rawJson } = response
const user = JSON.parse(rawJson)
console.log(user)

嵌入接口

// Embeddings: request a vector for one piece of text and print its length.
const request = {
  model: 'nomic-embed-text',
  prompt: '这是一段需要向量化的文本'
}
const response = await ollama.embeddings(request)

const { embedding } = response
console.log(`向量维度: ${embedding.length}`)

模型管理

列出模型

// List models: print each model's name with its size divided by 1024^3, to two decimals.
const { models } = await ollama.list()

for (const model of models) {
  const { name, size } = model
  const sizeGB = (size / (1024 ** 3)).toFixed(2)
  console.log(`${name}: ${sizeGB} GB`)
}

拉取模型

// Pull a model with streaming enabled and report download progress as chunks arrive.
const stream = await ollama.pull({ model: 'llama3.2', stream: true })

// True while the cursor sits on an unfinished `\r` progress line.
let progressLineOpen = false

for await (const chunk of stream) {
  // Progress is detected from the byte counters instead of an exact status
  // string: the status text of download chunks embeds the actual layer digest
  // (see the Ollama pull API docs), so comparing against a fixed literal never
  // matches. Requiring a non-zero `total` also avoids printing "NaN%".
  if (chunk.total) {
    const percent = ((chunk.completed ?? 0) / chunk.total * 100).toFixed(1)
    process.stdout.write(`\r下载进度: ${percent}%`)
    progressLineOpen = true
  } else {
    // Finish the in-place progress line before printing a regular status line.
    if (progressLineOpen) {
      process.stdout.write('\n')
      progressLineOpen = false
    }
    console.log(chunk.status)
  }
}

// Leave the terminal on a fresh line if the stream ended on a progress update.
if (progressLineOpen) {
  process.stdout.write('\n')
}

删除模型

// Delete a model by name, then print a confirmation once the call has resolved.
const target = { model: 'my-model' }
await ollama.delete(target)

console.log('模型已删除')

创建模型

// Create a model from an inline Modelfile (base model, system prompt, one parameter).
// NOTE(review): newer ollama-js releases appear to replace `modelfile` with
// structured fields (`from`, `system`, `parameters`) — confirm against the
// installed library version.
const modelfile = `
FROM llama3.2
SYSTEM 你是一个友好的助手
PARAMETER temperature 0.7
`

await ollama.create({ model: 'my-assistant', modelfile })

工具调用

// Tool calling: describe a `get_weather` function to the model, then print
// every tool call found on the returned message.
const weatherTool = {
  type: 'function',
  function: {
    name: 'get_weather',
    description: '获取城市天气',
    parameters: {
      type: 'object',
      properties: {
        city: { type: 'string', description: '城市名称' }
      },
      required: ['city']
    }
  }
}

const response = await ollama.chat({
  model: 'llama3.2',
  messages: [{ role: 'user', content: '北京今天天气怎么样？' }],
  tools: [weatherTool]
})

// A missing (falsy) `tool_calls` is treated as "no calls", so nothing is printed.
const toolCalls = response.message.tool_calls || []
for (const tool of toolCalls) {
  const { name, arguments: args } = tool.function
  console.log(`调用: ${name}`)
  console.log('参数:', args)
}

图片输入

import { readFileSync } from 'fs'

// Image input: read the file contents synchronously and attach them to the
// user message through the `images` array.
const image = readFileSync('image.png')

const imageMessage = {
  role: 'user',
  content: '这张图片里有什么？',
  images: [image]
}
const response = await ollama.chat({ model: 'llava', messages: [imageMessage] })

const { content } = response.message
console.log(content)

封装工具类

/**
 * Small stateful wrapper around `ollama.chat` that keeps the conversation
 * history so each call to `send` includes all previous turns.
 */
class OllamaChat {
  /**
   * @param {string} [model='llama3.2'] - Model name passed to every chat request.
   * @param {?string} [system=null] - Optional system prompt; when truthy it is
   *   stored as the first message of the history.
   */
  constructor(model = 'llama3.2', system = null) {
    this.model = model
    this.messages = []
    if (system) {
      this.messages.push({ role: 'system', content: system })
    }
  }

  /**
   * Sends one user message together with the stored history and records the
   * exchange.
   *
   * The user turn is committed to the history only after the request succeeds,
   * so a failed request leaves the history unchanged and a retry does not
   * duplicate the user message.
   *
   * @param {string} content - Text of the user message.
   * @returns {Promise<string>} Content of the assistant's reply.
   * @throws Whatever `ollama.chat` rejects with; the history is not modified then.
   */
  async send(content) {
    const userMessage = { role: 'user', content }

    const response = await ollama.chat({
      model: this.model,
      // Send a snapshot rather than mutating the history before the outcome is known.
      messages: [...this.messages, userMessage]
    })

    const reply = response.message.content
    this.messages.push(userMessage, { role: 'assistant', content: reply })

    return reply
  }

  /** Drops every message except those with role `system`. */
  clear() {
    this.messages = this.messages.filter(m => m.role === 'system')
  }
}

// Usage: send three prompts one after another through the same session and
// print each reply.
const chat = new OllamaChat('llama3.2', '你是一个友好的助手')

const prompts = ['你好', '我叫小明', '我叫什么名字？']
for (const prompt of prompts) {
  const reply = await chat.send(prompt)
  console.log(reply)
}

上一章：JavaScript SDK 安装与配置

下一章：JavaScript 流式处理