chat.ts 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641
  1. import { create } from "zustand";
  2. import { persist } from "zustand/middleware";
  3. import { trimTopic } from "../utils";
  4. import Locale, { getLang } from "../locales";
  5. import { showToast } from "../components/ui-lib";
  6. import { ModelConfig, ModelType, useAppConfig } from "./config";
  7. import { createEmptyMask, Mask } from "./mask";
  8. import {
  9. DEFAULT_INPUT_TEMPLATE,
  10. DEFAULT_SYSTEM_TEMPLATE,
  11. StoreKey,
  12. } from "../constant";
  13. import { api, RequestMessage } from "../client/api";
  14. import { ChatControllerPool } from "../client/controller";
  15. import { prettyObject } from "../utils/format";
  16. import { estimateTokenLength } from "../utils/token";
  17. import { nanoid } from "nanoid";
  /**
   * A chat message as kept in a session: the request payload
   * (`RequestMessage`) extended with bookkeeping fields used by this store.
   */
  export type ChatMessage = RequestMessage & {
    /** Unique identifier; `createMessage` fills it with `nanoid()`. */
    id: string;
    /** Creation time; `createMessage` fills it with `new Date().toLocaleString()`. */
    date: string;
    /** Model recorded on the message (set on bot replies in `onUserInput`). */
    model?: ModelType;
    /** True while the reply is still being streamed. */
    streaming?: boolean;
    /** Set when the request failed; such messages are skipped when building context. */
    isError?: boolean;
  };
  /**
   * Builds a chat message from defaults (fresh id, current local time,
   * role "user", empty content), with any field in `override` taking
   * precedence over the default.
   *
   * @param override Fields that replace the defaults.
   * @returns The assembled message.
   */
  export function createMessage(override: Partial<ChatMessage>): ChatMessage {
    const defaults: ChatMessage = {
      id: nanoid(),
      date: new Date().toLocaleString(),
      role: "user",
      content: "",
    };
    return { ...defaults, ...override };
  }
  /** Running counters kept per session. */
  export interface ChatStat {
    /** Starts at 0; not updated anywhere in this file. */
    tokenCount: number;
    /** Starts at 0; not updated anywhere in this file. */
    wordCount: number;
    /** Sum of `content.length` of messages passed to `updateStat`. */
    charCount: number;
  }
  /** One conversation: its messages plus summary and context bookkeeping. */
  export interface ChatSession {
    /** Unique identifier generated with `nanoid()`. */
    id: string;
    /** Title; starts as `DEFAULT_TOPIC`, later the mask name or a generated topic. */
    topic: string;
    /** Summary of older messages produced by `summarizeSession`; "" when none. */
    memoryPrompt: string;
    /** All messages of the conversation, oldest first. */
    messages: ChatMessage[];
    /** Usage counters for this session. */
    stat: ChatStat;
    /** `Date.now()` timestamp of creation or of the last completed bot reply. */
    lastUpdate: number;
    /** Message count captured when the last memory summary was requested. */
    lastSummarizeIndex: number;
    /** Messages before this index are excluded from the context sent to the model. */
    clearContextIndex?: number;
    /** Mask providing the preset context prompts and the model configuration. */
    mask: Mask;
  }
  /** Localized placeholder title given to sessions that have no topic yet. */
  export const DEFAULT_TOPIC = Locale.Store.DefaultTopic;

  /** Localized greeting message authored by the assistant. */
  export const BOT_HELLO: ChatMessage = createMessage({
    content: Locale.Store.BotHello,
    role: "assistant",
  });
  /**
   * Creates a blank session: new id, default topic, no messages, zeroed
   * statistics, no memory summary and an empty mask.
   */
  function createEmptySession(): ChatSession {
    const id = nanoid();
    const emptyStat: ChatStat = { tokenCount: 0, wordCount: 0, charCount: 0 };
    const createdAt = Date.now();

    const session: ChatSession = {
      id,
      topic: DEFAULT_TOPIC,
      memoryPrompt: "",
      messages: [],
      stat: emptyStat,
      lastUpdate: createdAt,
      lastSummarizeIndex: 0,
      mask: createEmptyMask(),
    };
    return session;
  }
  /** State and actions exposed by the chat store. */
  interface ChatStore {
    // ---- state ----
    /** All sessions; new sessions are inserted at the front. */
    sessions: ChatSession[];
    /** Index into `sessions` of the session currently shown. */
    currentSessionIndex: number;

    // ---- session management ----
    /** Replaces every session with a single empty one. */
    clearSessions: () => void;
    /** Moves a session between positions, keeping the selection on the same session. */
    moveSession: (from: number, to: number) => void;
    /** Makes the session at `index` the current one. */
    selectSession: (index: number) => void;
    /** Prepends a new session (optionally based on `mask`) and selects it. */
    newSession: (mask?: Mask) => void;
    /** Removes the session at `index` and shows a toast offering to undo. */
    deleteSession: (index: number) => void;
    /** Returns the current session, clamping an out-of-range index first. */
    currentSession: () => ChatSession;
    /** Moves the selection by `delta` positions, wrapping around. */
    nextSession: (delta: number) => void;

    // ---- messaging ----
    /** Bookkeeping after a bot reply completes: stats and summarization. */
    onNewMessage: (message: ChatMessage) => void;
    /** Stores the user's input plus a placeholder reply and starts the request. */
    onUserInput: (content: string) => Promise<void>;
    /** Requests a topic and/or a memory summary when the thresholds are met. */
    summarizeSession: () => void;
    /** Adds the message's length to the current session's statistics. */
    updateStat: (message: ChatMessage) => void;
    /** Runs `updater` on the current session and publishes the sessions array. */
    updateCurrentSession: (updater: (session: ChatSession) => void) => void;
    /** Runs `updater` on one message (or `undefined` if absent) and publishes. */
    updateMessage: (
      sessionIndex: number,
      messageIndex: number,
      updater: (message?: ChatMessage) => void,
    ) => void;
    /** Empties the current session's messages and memory summary. */
    resetSession: () => void;
    /** Assembles the context messages to send with the next request. */
    getMessagesWithMemory: () => ChatMessage[];
    /** Wraps the current session's memory summary as a system message. */
    getMemoryPrompt: () => ChatMessage;
    /** Clears `localStorage` and reloads the page. */
    clearAllData: () => void;
  }
  /**
   * Sums the estimated token length of every message's content.
   *
   * @param msgs Messages to measure.
   * @returns Total of `estimateTokenLength(content)` over `msgs`; 0 when empty.
   */
  function countMessages(msgs: ChatMessage[]) {
    let total = 0;
    for (const msg of msgs) {
      total += estimateTokenLength(msg.content);
    }
    return total;
  }
  /**
   * Expands the `{{model}}`, `{{time}}`, `{{lang}}` and `{{input}}`
   * placeholders of the model's input template.
   *
   * If the template lacks `{{input}}`, the placeholder is appended on a new
   * line so the user's text is never dropped.
   *
   * Values are inserted literally. The previous `replaceAll(pattern, value)`
   * call treated `$&`, `$$`, `$1`, ... inside `value` as replacement patterns,
   * which corrupted user input containing such sequences.
   *
   * @param input Raw text typed by the user.
   * @param modelConfig Supplies the model name and the optional template;
   *   `DEFAULT_INPUT_TEMPLATE` is used when `template` is null/undefined.
   * @returns The template with every placeholder substituted.
   */
  function fillTemplateWith(input: string, modelConfig: ModelConfig) {
    const vars = {
      model: modelConfig.model,
      time: new Date().toLocaleString(),
      lang: getLang(),
      input: input,
    };

    let output = modelConfig.template ?? DEFAULT_INPUT_TEMPLATE;

    // The template must contain {{input}}.
    const inputVar = "{{input}}";
    if (!output.includes(inputVar)) {
      output += "\n" + inputVar;
    }

    // `input` is substituted last, so placeholders typed by the user are not
    // expanded by an earlier pass.
    for (const [name, value] of Object.entries(vars)) {
      // split/join performs a literal replace-all: no `$` pattern expansion.
      output = output.split(`{{${name}}}`).join(value);
    }

    return output;
  }
  117. export const useChatStore = create<ChatStore>()(
  118. persist(
  119. (set, get) => ({
  120. sessions: [createEmptySession()],
  121. currentSessionIndex: 0,
  /** Drops every session and starts over with one empty, selected session. */
  clearSessions() {
    set(() => {
      const freshSession = createEmptySession();
      return {
        sessions: [freshSession],
        currentSessionIndex: 0,
      };
    });
  },
  /** Makes the session at `index` current; the index is not range-checked here. */
  selectSession(index: number) {
    const selection = { currentSessionIndex: index };
    set(selection);
  },
  /**
   * Moves the session at position `from` to position `to` and adjusts
   * `currentSessionIndex` so the same session stays selected.
   */
  moveSession(from: number, to: number) {
    set((state) => {
      const { sessions, currentSessionIndex: oldIndex } = state;

      // Reorder on a copy so the previous array is left untouched.
      const reordered = [...sessions];
      const moved = reordered[from];
      reordered.splice(from, 1);
      reordered.splice(to, 0, moved);

      // Work out where the previously selected session ended up.
      let newIndex: number;
      if (oldIndex === from) {
        // The selected session is the one being moved.
        newIndex = to;
      } else if (oldIndex > from && oldIndex <= to) {
        // The moved session jumped over the selection towards the end.
        newIndex = oldIndex - 1;
      } else if (oldIndex < from && oldIndex >= to) {
        // The moved session jumped over the selection towards the front.
        newIndex = oldIndex + 1;
      } else {
        newIndex = oldIndex;
      }

      return {
        currentSessionIndex: newIndex,
        sessions: reordered,
      };
    });
  },
  /**
   * Creates a session, puts it at the front of the list and selects it.
   * When a mask is given, the session adopts it (with the global model
   * config as the base, overridden by the mask's own settings) and takes
   * the mask's name as its topic.
   */
  newSession(mask) {
    const session = createEmptySession();

    if (mask) {
      const { modelConfig: globalModelConfig } = useAppConfig.getState();
      const mergedModelConfig = {
        ...globalModelConfig,
        ...mask.modelConfig,
      };
      session.mask = { ...mask, modelConfig: mergedModelConfig };
      session.topic = mask.name;
    }

    set((state) => ({
      currentSessionIndex: 0,
      sessions: [session, ...state.sessions],
    }));
  },
  /**
   * Shifts the selection by `delta` sessions, wrapping around the ends of
   * the list.
   */
  nextSession(delta) {
    const { sessions, currentSessionIndex } = get();
    const count = sessions.length;
    // Adding `count` before the modulo keeps small negative deltas in range.
    const wrappedIndex = (currentSessionIndex + delta + count) % count;
    get().selectSession(wrappedIndex);
  },
  /**
   * Deletes the session at `index` (no-op if there is none) and shows a
   * toast that lets the user revert the deletion for 5 seconds.
   * Deleting the only session leaves a fresh empty one in its place.
   */
  deleteSession(index) {
    const { sessions: previousSessions, currentSessionIndex: previousIndex } =
      get();

    if (!previousSessions.at(index)) return;

    const deletingLastSession = previousSessions.length === 1;

    const remaining = previousSessions.slice();
    remaining.splice(index, 1);

    // Removing an earlier session shifts the selection down by one; the
    // result is clamped to the last remaining session.
    const shift = Number(index < previousIndex);
    let nextIndex = Math.min(previousIndex - shift, remaining.length - 1);

    if (deletingLastSession) {
      nextIndex = 0;
      remaining.push(createEmptySession());
    }

    // Snapshot used by the toast's undo action.
    const restoreState = {
      currentSessionIndex: previousIndex,
      sessions: previousSessions.slice(),
    };

    set(() => ({
      currentSessionIndex: nextIndex,
      sessions: remaining,
    }));

    const undoAction = {
      text: Locale.Home.Revert,
      onClick() {
        set(() => restoreState);
      },
    };
    showToast(Locale.Home.DeleteToast, undoAction, 5000);
  },
  /**
   * Returns the currently selected session. If the stored index is out of
   * range it is clamped into the valid range and written back first.
   */
  currentSession() {
    const { sessions, currentSessionIndex } = get();
    let index = currentSessionIndex;

    const outOfRange = index < 0 || index >= sessions.length;
    if (outOfRange) {
      index = Math.min(sessions.length - 1, Math.max(0, index));
      set(() => ({ currentSessionIndex: index }));
    }

    return sessions[index];
  },
  /**
   * Called once a bot reply has completed: republishes the message list,
   * stamps the session's last-update time, updates statistics and triggers
   * summarization.
   */
  onNewMessage(message) {
    const { updateCurrentSession, updateStat, summarizeSession } = get();

    updateCurrentSession((current) => {
      // A new array reference signals that the (mutated) messages changed.
      current.messages = current.messages.concat();
      current.lastUpdate = Date.now();
    });
    updateStat(message);
    summarizeSession();
  },
  /**
   * Handles a message typed by the user: stores it together with a
   * placeholder bot reply, then sends the conversation context to the model
   * and streams the answer into that placeholder.
   *
   * The request is sent with the templated text (see `fillTemplateWith`),
   * while the session stores the raw text the user typed.
   *
   * Fixes over the previous version:
   * - On failure the error flag was set on `userMessage`, but the session
   *   stores a copy of it, so the stored user message was never flagged.
   *   The stored copy is now flagged as well.
   * - `botMessage.id ?? messageIndex` had an unreachable fallback (`id` is
   *   always a string); the id is now passed directly.
   *
   * @param content Raw text typed by the user.
   */
  async onUserInput(content) {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;

    const userContent = fillTemplateWith(content, modelConfig);
    console.log("[User Input] after template: ", userContent);

    const userMessage: ChatMessage = createMessage({
      role: "user",
      content: userContent,
    });

    const botMessage: ChatMessage = createMessage({
      role: "assistant",
      streaming: true,
      model: modelConfig.model,
    });

    // Collect the context before the new pair is stored, then append the
    // templated user message as the newest input.
    const recentMessages = get().getMessagesWithMemory();
    const sendMessages = recentMessages.concat(userMessage);

    // The session keeps the raw text the user typed, not the templated one.
    const savedUserMessage: ChatMessage = {
      ...userMessage,
      content,
    };

    // Save the user's message and the bot's placeholder.
    get().updateCurrentSession((current) => {
      current.messages = current.messages.concat([
        savedUserMessage,
        botMessage,
      ]);
    });

    // `botMessage` is mutated in place; publishing a new array reference
    // makes subscribers pick up the change.
    const publishMessages = () => {
      get().updateCurrentSession((current) => {
        current.messages = current.messages.concat();
      });
    };

    // Make the request (not awaited: results arrive through the callbacks).
    api.llm.chat({
      messages: sendMessages,
      config: { ...modelConfig, stream: true },
      onUpdate(message) {
        botMessage.streaming = true;
        if (message) {
          botMessage.content = message;
        }
        publishMessages();
      },
      onFinish(message) {
        botMessage.streaming = false;
        if (message) {
          botMessage.content = message;
          get().onNewMessage(botMessage);
        }
        ChatControllerPool.remove(session.id, botMessage.id);
      },
      onError(error) {
        // A user-initiated abort is not reported as an error.
        const isAborted = error.message.includes("aborted");
        botMessage.content +=
          "\n\n" +
          prettyObject({
            error: true,
            message: error.message,
          });
        botMessage.streaming = false;
        userMessage.isError = !isAborted;
        // Flag the copy that actually lives in the session.
        savedUserMessage.isError = !isAborted;
        botMessage.isError = !isAborted;
        publishMessages();
        ChatControllerPool.remove(session.id, botMessage.id);

        console.error("[Chat] failed ", error);
      },
      onController(controller) {
        // Collect the controller so the request can be stopped or retried.
        ChatControllerPool.addController(
          session.id,
          botMessage.id,
          controller,
        );
      },
    });
  },
  /**
   * Wraps the current session's memory summary in a system message.
   * The content is empty when the session has no summary yet.
   */
  getMemoryPrompt() {
    const { memoryPrompt } = get().currentSession();

    let content = "";
    if (memoryPrompt.length > 0) {
      content = Locale.Store.Prompt.History(memoryPrompt);
    }

    return {
      role: "system",
      content,
      date: "",
    } as ChatMessage;
  },
  /**
   * Assembles the messages that accompany the next request, in this order:
   *   0. system prompt (when enabled in the model config)
   *   1. long-term memory: the summarized history (when applicable)
   *   2. the mask's predefined in-context prompts
   *   3. short-term memory: the most recent messages
   * The newest user input is appended by the caller.
   */
  getMessagesWithMemory() {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;
    const clearContextIndex = session.clearContextIndex ?? 0;
    const messages = session.messages.slice();
    const totalMessageCount = session.messages.length;

    // In-context prompts defined by the mask.
    const contextPrompts = session.mask.context.slice();

    // Optional global system prompt.
    const shouldInjectSystemPrompts = modelConfig.enableInjectSystemPrompts;
    const systemPrompts: ChatMessage[] = [];
    if (shouldInjectSystemPrompts) {
      systemPrompts.push(
        createMessage({
          role: "system",
          content: fillTemplateWith("", {
            ...modelConfig,
            template: DEFAULT_SYSTEM_TEMPLATE,
          }),
        }),
      );
      console.log(
        "[Global System Prompt] ",
        systemPrompts.at(0)?.content ?? "empty",
      );
    }

    // Long-term memory is sent only when enabled, a summary exists, and the
    // summary covers messages after the point where context was cleared.
    const shouldSendLongTermMemory =
      modelConfig.sendMemory &&
      session.memoryPrompt &&
      session.memoryPrompt.length > 0 &&
      session.lastSummarizeIndex > clearContextIndex;
    const longTermMemoryPrompts = shouldSendLongTermMemory
      ? [get().getMemoryPrompt()]
      : [];
    const longTermMemoryStartIndex = session.lastSummarizeIndex;

    // Short-term memory: the last `historyMessageCount` messages.
    const shortTermMemoryStartIndex = Math.max(
      0,
      totalMessageCount - modelConfig.historyMessageCount,
    );

    // With a summary, raw history starts at whichever boundary is earlier.
    const memoryStartIndex = shouldSendLongTermMemory
      ? Math.min(longTermMemoryStartIndex, shortTermMemoryStartIndex)
      : shortTermMemoryStartIndex;

    // Never reach back past the point where the user cleared the context.
    const contextStartIndex = Math.max(clearContextIndex, memoryStartIndex);
    const maxTokenThreshold = modelConfig.max_tokens;

    // Walk backwards from the newest message, collecting as many as fit
    // under the token threshold; failed messages are skipped.
    const newestFirst: ChatMessage[] = [];
    let tokenCount = 0;
    let cursor = totalMessageCount - 1;
    while (cursor >= contextStartIndex && tokenCount < maxTokenThreshold) {
      const msg = messages[cursor];
      cursor -= 1;
      if (!msg || msg.isError) continue;
      tokenCount += estimateTokenLength(msg.content);
      newestFirst.push(msg);
    }

    // Concatenate all parts, restoring chronological order for the history.
    return [
      ...systemPrompts,
      ...longTermMemoryPrompts,
      ...contextPrompts,
      ...newestFirst.reverse(),
    ];
  },
  /**
   * Applies `updater` to the message at the given session/message position
   * and republishes the sessions array. `updater` receives `undefined` when
   * no such session or message exists.
   */
  updateMessage(
    sessionIndex: number,
    messageIndex: number,
    updater: (message?: ChatMessage) => void,
  ) {
    const { sessions } = get();
    const target = sessions.at(sessionIndex)?.messages?.at(messageIndex);
    updater(target);
    set(() => ({ sessions }));
  },
  /** Empties the current session's message list and its memory summary. */
  resetSession() {
    const { updateCurrentSession } = get();
    updateCurrentSession((current) => {
      current.messages = [];
      current.memoryPrompt = "";
    });
  },
  /**
   * Maintains the current session's generated metadata:
   *  1. While the topic is still the default and the conversation is long
   *     enough, asks the model for a topic.
   *  2. When the not-yet-summarized history exceeds the configured
   *     compression threshold (and memory is enabled), asks the model for a
   *     summary, which becomes the session's `memoryPrompt`.
   *
   * Fix: the truncation check used to read
   * `historyMsgLength > modelConfig?.max_tokens ?? 4000`, which parses as
   * `(historyMsgLength > max_tokens) ?? 4000`. The 4000 default was therefore
   * unreachable, and an undefined `max_tokens` disabled truncation entirely.
   */
  summarizeSession() {
    const session = get().currentSession();

    // Error messages are NOT removed here: the topic request below sees
    // every message. They are filtered out only for the memory summary.
    const messages = session.messages;

    // Ask for a topic once the estimated token count reaches this minimum.
    const SUMMARIZE_MIN_LEN = 50;
    if (
      session.topic === DEFAULT_TOPIC &&
      countMessages(messages) >= SUMMARIZE_MIN_LEN
    ) {
      const topicMessages = messages.concat(
        createMessage({
          role: "user",
          content: Locale.Store.Prompt.Topic,
        }),
      );
      api.llm.chat({
        messages: topicMessages,
        config: {
          model: "gpt-3.5-turbo",
        },
        onFinish(message) {
          get().updateCurrentSession(
            (session) =>
              (session.topic =
                message.length > 0 ? trimTopic(message) : DEFAULT_TOPIC),
          );
        },
      });
    }

    const modelConfig = session.mask.modelConfig;

    // Summarize only what follows both the previous summary and the point
    // where the user cleared the context.
    const summarizeIndex = Math.max(
      session.lastSummarizeIndex,
      session.clearContextIndex ?? 0,
    );
    let toBeSummarizedMsgs = messages
      .filter((msg) => !msg.isError)
      .slice(summarizeIndex);

    const historyMsgLength = countMessages(toBeSummarizedMsgs);

    // Too long to send in one request: keep only the newest messages.
    const maxTokens = modelConfig?.max_tokens ?? 4000;
    if (historyMsgLength > maxTokens) {
      const n = toBeSummarizedMsgs.length;
      toBeSummarizedMsgs = toBeSummarizedMsgs.slice(
        Math.max(0, n - modelConfig.historyMessageCount),
      );
    }

    // Put the existing summary first so the new one builds on it.
    toBeSummarizedMsgs.unshift(get().getMemoryPrompt());

    // Captured now; stored as the summary boundary once the request finishes.
    const lastSummarizeIndex = session.messages.length;

    console.log(
      "[Chat History] ",
      toBeSummarizedMsgs,
      historyMsgLength,
      modelConfig.compressMessageLengthThreshold,
    );

    if (
      historyMsgLength > modelConfig.compressMessageLengthThreshold &&
      modelConfig.sendMemory
    ) {
      api.llm.chat({
        messages: toBeSummarizedMsgs.concat(
          createMessage({
            role: "system",
            content: Locale.Store.Prompt.Summarize,
            date: "",
          }),
        ),
        config: { ...modelConfig, stream: true, model: "gpt-3.5-turbo" },
        onUpdate(message) {
          // Written directly on the session object captured above, so the
          // summary lands in the session it was requested for.
          session.memoryPrompt = message;
        },
        onFinish(message) {
          console.log("[Memory] ", message);
          session.lastSummarizeIndex = lastSummarizeIndex;
        },
        onError(err) {
          console.error("[Summarize] ", err);
        },
      });
    }
  },
  /**
   * Adds the message's content length to the current session's character
   * count.
   */
  updateStat(message) {
    const addedChars = message.content.length;
    get().updateCurrentSession((current) => {
      current.stat.charCount += addedChars;
      // TODO: should update chat count and word count
    });
  },
  /**
   * Lets `updater` mutate the session at the current index, then republishes
   * the sessions array through `set`.
   */
  updateCurrentSession(updater) {
    const { sessions, currentSessionIndex } = get();
    updater(sessions[currentSessionIndex]);
    set(() => ({ sessions }));
  },
  /**
   * Clears everything in `localStorage` (not only this store's key) and
   * reloads the page.
   */
  clearAllData() {
    // Clear first, then reload.
    localStorage.clear();
    location.reload();
  },
  511. }),
  512. {
  513. name: StoreKey.Chat,
  514. version: 3.1,
  /**
   * Upgrades persisted state written by an older store version.
   * Works on a deep copy (JSON round-trip) of the persisted state.
   *
   * @param persistedState State as read from storage.
   * @param version Version number that state was saved with.
   * @returns The state upgraded to the current shape.
   */
  migrate(persistedState, version) {
    const state = persistedState as any;
    const newState = JSON.parse(JSON.stringify(state)) as ChatStore;

    // < 2: rebuild every session on top of the current empty-session shape,
    // carrying over only the topic and the messages.
    if (version < 2) {
      newState.sessions = [];

      const oldSessions = state.sessions;
      for (const oldSession of oldSessions) {
        const rebuilt = createEmptySession();
        rebuilt.topic = oldSession.topic;
        rebuilt.messages = [...oldSession.messages];

        const rebuiltConfig = rebuilt.mask.modelConfig;
        rebuiltConfig.sendMemory = true;
        rebuiltConfig.historyMessageCount = 4;
        rebuiltConfig.compressMessageLengthThreshold = 1000;

        newState.sessions.push(rebuilt);
      }
    }

    // < 3: migrate session and message ids to nanoid.
    if (version < 3) {
      for (const s of newState.sessions) {
        s.id = nanoid();
        for (const m of s.messages) {
          m.id = nanoid();
        }
      }
    }

    // < 3.1: enable the `enableInjectSystemPrompts` attribute for old
    // sessions, which otherwise would not have it enabled automatically.
    if (version < 3.1) {
      for (const s of newState.sessions) {
        // Exclude sessions where the user already set the attribute.
        const alreadySet = s.mask.modelConfig.hasOwnProperty(
          "enableInjectSystemPrompts",
        );
        if (alreadySet) continue;

        // Users may have changed this configuration, so their current
        // setting is used instead of the default.
        const config = useAppConfig.getState();
        s.mask.modelConfig.enableInjectSystemPrompts =
          config.modelConfig.enableInjectSystemPrompts;
      }
    }

    return newState;
  },
  556. },
  557. ),
  558. );