| 1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889 |
- import * as readline from 'node:readline'
- import { stdin, stdout } from 'node:process'
- const API_URL = 'http://127.0.0.1:8080'
- const chat = [
- {
- human: "Hello, Assistant.",
- assistant: "Hello. How may I help you today?"
- },
- {
- human: "Please tell me the largest city in Europe.",
- assistant: "Sure. The largest city in Europe is Moscow, the capital of Russia."
- },
- ]
- const instruction = `A chat between a curious human and an artificial intelligence assistant. The assistant gives helpful, detailed, and polite answers to the human's questions.`
- function format_prompt(question) {
- return `${instruction}\n${
- chat.map(m =>`### Human: ${m.human}\n### Assistant: ${m.assistant}`).join("\n")
- }\n### Human: ${question}\n### Assistant:`
- }
- async function tokenize(content) {
- const result = await fetch(`${API_URL}/tokenize`, {
- method: 'POST',
- body: JSON.stringify({ content })
- })
- if (!result.ok) {
- return []
- }
- return await result.json().tokens
- }
- const n_keep = await tokenize(instruction).length
- async function chat_completion(question) {
- const result = await fetch(`${API_URL}/completion`, {
- method: 'POST',
- body: JSON.stringify({
- prompt: format_prompt(question),
- temperature: 0.2,
- top_k: 40,
- top_p: 0.9,
- n_keep: n_keep,
- n_predict: 256,
- stop: ["\n### Human:"], // stop completion after generating this
- stream: true,
- })
- })
- if (!result.ok) {
- return
- }
- let answer = ''
- for await (var chunk of result.body) {
- const t = Buffer.from(chunk).toString('utf8')
- if (t.startsWith('data: ')) {
- const message = JSON.parse(t.substring(6))
- answer += message.content
- process.stdout.write(message.content)
- if (message.stop) {
- if (message.truncated) {
- chat.shift()
- }
- break
- }
- }
- }
- process.stdout.write('\n')
- chat.push({ human: question, assistant: answer.trimStart() })
- }
- const rl = readline.createInterface({ input: stdin, output: stdout });
- const readlineQuestion = (rl, query, options) => new Promise((resolve, reject) => {
- rl.question(query, options, resolve)
- });
- while(true) {
- const question = await readlineQuestion(rl, '> ')
- await chat_completion(question)
- }
|