chat.ts 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625
  1. import { create } from "zustand";
  2. import { persist } from "zustand/middleware";
  3. import { trimTopic } from "../utils";
  4. import Locale, { getLang } from "../locales";
  5. import { showToast } from "../components/ui-lib";
  6. import { ModelConfig, ModelType, useAppConfig } from "./config";
  7. import { createEmptyMask, Mask } from "./mask";
  8. import {
  9. DEFAULT_INPUT_TEMPLATE,
  10. DEFAULT_SYSTEM_TEMPLATE,
  11. StoreKey,
  12. } from "../constant";
  13. import { api, RequestMessage } from "../client/api";
  14. import { ChatControllerPool } from "../client/controller";
  15. import { prettyObject } from "../utils/format";
  16. import { estimateTokenLength } from "../utils/token";
  /**
   * A message stored in a chat session: the wire-level `RequestMessage`
   * extended with bookkeeping fields used by the store.
   */
  export type ChatMessage = RequestMessage & {
    /** Display timestamp; `createMessage` fills it with `new Date().toLocaleString()`. */
    date: string;
    /** True while the assistant reply is still being streamed. */
    streaming?: boolean;
    /** Set when the request failed; such messages are skipped when building context. */
    isError?: boolean;
    /** Numeric identifier; `createMessage` defaults it to `Date.now()`. */
    id?: number;
    /** Model that was asked to produce this message (set on bot messages). */
    model?: ModelType;
  };
  /**
   * Builds a chat message, filling in defaults for every field the caller
   * leaves out.
   *
   * Defaults: `id` is `Date.now()`, `date` is the current local date/time
   * string, `role` is `"user"` and `content` is the empty string. Any field
   * present in `override` wins over the default.
   *
   * @param override - Fields to set on the new message.
   * @returns The newly created message object.
   */
  export function createMessage(override: Partial<ChatMessage>): ChatMessage {
    const defaults: ChatMessage = {
      id: Date.now(),
      date: new Date().toLocaleString(),
      role: "user",
      content: "",
    };
    return { ...defaults, ...override };
  }
  /** Running counters kept per chat session. */
  export interface ChatStat {
    /** Token counter; initialised to 0 for a new session. */
    tokenCount: number;
    /** Word counter; initialised to 0 for a new session. */
    wordCount: number;
    /** Character counter; `updateStat` adds each new message's content length. */
    charCount: number;
  }
  /** One conversation: its messages plus the state needed to build context. */
  export interface ChatSession {
    /** Session identifier. */
    id: number;
    /** Title of the conversation; starts as `DEFAULT_TOPIC`. */
    topic: string;
    /** Summary of earlier messages, written by `summarizeSession`. */
    memoryPrompt: string;
    /** All messages of the conversation, oldest first. */
    messages: ChatMessage[];
    /** Usage counters for this session. */
    stat: ChatStat;
    /** `Date.now()` timestamp of the last recorded update. */
    lastUpdate: number;
    /** Value of `messages.length` when the memory summary was last requested. */
    lastSummarizeIndex: number;
    /** Messages before this index are excluded from the context sent to the model. */
    clearContextIndex?: number;
    /** Mask (preset prompts and model configuration) applied to this session. */
    mask: Mask;
  }
  /**
   * Localized placeholder topic given to new sessions. `summarizeSession`
   * only auto-generates a topic while the session still carries this value.
   */
  export const DEFAULT_TOPIC = Locale.Store.DefaultTopic;

  /** Assistant greeting message built from the localized hello text. */
  export const BOT_HELLO: ChatMessage = createMessage({
    content: Locale.Store.BotHello,
    role: "assistant",
  });
  /**
   * Creates a session with no messages, zeroed statistics, the default topic
   * and a freshly created empty mask.
   *
   * The id is `Date.now()` plus a random fraction so that sessions created
   * within the same millisecond are unlikely to share an id.
   */
  function createEmptySession(): ChatSession {
    const id = Date.now() + Math.random();
    const stat: ChatStat = { tokenCount: 0, wordCount: 0, charCount: 0 };
    const lastUpdate = Date.now();
    const mask = createEmptyMask();

    return {
      id,
      topic: DEFAULT_TOPIC,
      memoryPrompt: "",
      messages: [],
      stat,
      lastUpdate,
      lastSummarizeIndex: 0,
      mask,
    };
  }
  /** State and actions exposed by the chat store. */
  interface ChatStore {
    /** All sessions; new sessions are inserted at the front. */
    sessions: ChatSession[];
    /** Index into `sessions` of the session currently selected. */
    currentSessionIndex: number;
    /** Counter incremented by `newSession`; its value becomes the new session's id. */
    globalId: number;

    /** Replaces every session with a single empty one and selects it. */
    clearSessions: () => void;
    /** Moves a session from one index to another, keeping the selection on the same session. */
    moveSession: (from: number, to: number) => void;
    /** Selects the session at `index`. */
    selectSession: (index: number) => void;
    /** Creates a session (optionally from a mask), puts it first and selects it. */
    newSession: (mask?: Mask) => void;
    /** Removes the session at `index` and shows a toast offering to revert. */
    deleteSession: (index: number) => void;
    /** Returns the selected session, clamping an out-of-range index first. */
    currentSession: () => ChatSession;
    /** Moves the selection by `delta` positions, wrapping around the list. */
    nextSession: (delta: number) => void;
    /** Records a finished message: refreshes the session, updates stats, triggers summarizing. */
    onNewMessage: (message: ChatMessage) => void;
    /** Stores the user's input plus a bot placeholder and starts the chat request. */
    onUserInput: (content: string) => Promise<void>;
    /** Requests a topic and/or a memory summary when the respective thresholds are met. */
    summarizeSession: () => void;
    /** Adds the message's content length to the current session's character count. */
    updateStat: (message: ChatMessage) => void;
    /** Runs a mutating updater on the current session, then publishes `sessions`. */
    updateCurrentSession: (updater: (session: ChatSession) => void) => void;
    /** Runs a mutating updater on one message (or `undefined` if absent), then publishes `sessions`. */
    updateMessage: (
      sessionIndex: number,
      messageIndex: number,
      updater: (message?: ChatMessage) => void,
    ) => void;
    /** Empties the current session's messages and memory prompt. */
    resetSession: () => void;
    /** Builds the list of context messages to send with the next request. */
    getMessagesWithMemory: () => ChatMessage[];
    /** Returns the memory summary wrapped as a system message. */
    getMemoryPrompt: () => ChatMessage;
    /** Clears `localStorage` and reloads the page. */
    clearAllData: () => void;
  }
  /**
   * Adds up `estimateTokenLength(content)` over all the given messages.
   *
   * @param msgs - Messages to measure.
   * @returns The summed estimate; 0 for an empty list.
   */
  function countMessages(msgs: ChatMessage[]) {
    let total = 0;
    for (const msg of msgs) {
      total += estimateTokenLength(msg.content);
    }
    return total;
  }
  /**
   * Expands a prompt template for the given user input.
   *
   * The template is `modelConfig.template`, falling back to
   * `DEFAULT_INPUT_TEMPLATE`. The placeholders `{{model}}`, `{{time}}`,
   * `{{lang}}` and `{{input}}` are substituted, in that order. If the template
   * has no `{{input}}` placeholder, one is appended on a new line so the
   * user's text is always part of the result.
   *
   * @param input - Raw text substituted for `{{input}}`, inserted verbatim.
   * @param modelConfig - Supplies the model name and the optional template.
   * @returns The template with every known placeholder replaced.
   */
  function fillTemplateWith(input: string, modelConfig: ModelConfig) {
    const vars = {
      model: modelConfig.model,
      time: new Date().toLocaleString(),
      lang: getLang(),
      input: input,
    };

    let output = modelConfig.template ?? DEFAULT_INPUT_TEMPLATE;

    // The template must contain {{input}}.
    const inputVar = "{{input}}";
    if (!output.includes(inputVar)) {
      output += "\n" + inputVar;
    }

    for (const [name, value] of Object.entries(vars)) {
      // Use a replacer function rather than a replacement string: in a string,
      // sequences such as `$&`, `$$` or `$1` are special patterns and would
      // silently rewrite user text that happens to contain them.
      output = output.replaceAll(`{{${name}}}`, () => value);
    }

    return output;
  }
  117. export const useChatStore = create<ChatStore>()(
  118. persist(
  119. (set, get) => ({
  120. sessions: [createEmptySession()],
  121. currentSessionIndex: 0,
  122. globalId: 0,
  /** Drops every session and starts over with one empty, selected session. */
  clearSessions() {
    const freshSession = createEmptySession();
    set(() => ({
      currentSessionIndex: 0,
      sessions: [freshSession],
    }));
  },
  /** Makes the session at `index` the current one; the index is not validated here. */
  selectSession(index: number) {
    set(() => ({ currentSessionIndex: index }));
  },
  /**
   * Moves the session at index `from` to index `to` and adjusts
   * `currentSessionIndex` so it keeps pointing at the same session.
   */
  moveSession(from: number, to: number) {
    set((state) => {
      // Reorder on a copy so the previous array is left untouched.
      const reordered = state.sessions.slice();
      const moved = reordered[from];
      reordered.splice(from, 1);
      reordered.splice(to, 0, moved);

      // Work out where the selected session ended up.
      const current = state.currentSessionIndex;
      let nextCurrent: number;
      if (current === from) {
        // The selected session is the one being moved.
        nextCurrent = to;
      } else if (current > from && current <= to) {
        // A session before the selection moved behind it.
        nextCurrent = current - 1;
      } else if (current < from && current >= to) {
        // A session behind the selection moved in front of it.
        nextCurrent = current + 1;
      } else {
        nextCurrent = current;
      }

      return {
        currentSessionIndex: nextCurrent,
        sessions: reordered,
      };
    });
  },
  /**
   * Creates a new session, inserts it at the front of the list and selects it.
   *
   * The session id is taken from `globalId` after incrementing it. When a mask
   * is given, the session uses it with the global model config as a base that
   * the mask's own model config overrides, and takes the mask name as topic.
   */
  newSession(mask) {
    const session = createEmptySession();

    const nextGlobalId = get().globalId + 1;
    set(() => ({ globalId: nextGlobalId }));
    session.id = get().globalId;

    if (mask) {
      const { modelConfig: globalModelConfig } = useAppConfig.getState();
      session.mask = {
        ...mask,
        modelConfig: { ...globalModelConfig, ...mask.modelConfig },
      };
      session.topic = mask.name;
    }

    set((state) => ({
      currentSessionIndex: 0,
      sessions: [session, ...state.sessions],
    }));
  },
  /**
   * Moves the selection by `delta` sessions, wrapping around the list
   * (one session count is added before the modulo so `-1` from index 0 wraps).
   */
  nextSession(delta) {
    const { sessions, currentSessionIndex } = get();
    const count = sessions.length;
    const target = (currentSessionIndex + delta + count) % count;
    get().selectSession(target);
  },
  /**
   * Deletes the session at `index` and shows a toast offering to revert.
   *
   * Does nothing when no session exists at `index`. If the only session is
   * deleted, a new empty session takes its place. Otherwise the selection is
   * shifted down by one when the removed session was in front of it, and
   * clamped to the last remaining index.
   */
  deleteSession(index) {
    const { sessions: previousSessions, currentSessionIndex: previousIndex } =
      get();
    const deletingLastSession = previousSessions.length === 1;

    if (!previousSessions.at(index)) return;

    const remaining = previousSessions.slice();
    remaining.splice(index, 1);

    let nextIndex: number;
    if (deletingLastSession) {
      nextIndex = 0;
      remaining.push(createEmptySession());
    } else {
      nextIndex = Math.min(
        previousIndex - Number(index < previousIndex),
        remaining.length - 1,
      );
    }

    // Snapshot taken before the delete, used by the toast's revert action.
    const restoreState = {
      currentSessionIndex: previousIndex,
      sessions: previousSessions.slice(),
    };

    set(() => ({
      currentSessionIndex: nextIndex,
      sessions: remaining,
    }));

    showToast(
      Locale.Home.DeleteToast,
      {
        text: Locale.Home.Revert,
        onClick() {
          set(() => restoreState);
        },
      },
      5000,
    );
  },
  /**
   * Returns the currently selected session.
   *
   * If `currentSessionIndex` lies outside the list, it is clamped into
   * `[0, sessions.length - 1]` and the corrected index is written back.
   */
  currentSession() {
    const { sessions, currentSessionIndex } = get();
    const outOfRange =
      currentSessionIndex < 0 || currentSessionIndex >= sessions.length;

    if (!outOfRange) {
      return sessions[currentSessionIndex];
    }

    const clamped = Math.min(
      sessions.length - 1,
      Math.max(0, currentSessionIndex),
    );
    set(() => ({ currentSessionIndex: clamped }));
    return sessions[clamped];
  },
  /**
   * Handles a completed message: replaces the current session's message array
   * with a copy, stamps `lastUpdate`, then updates the statistics and triggers
   * summarizing.
   */
  onNewMessage(message) {
    get().updateCurrentSession((session) => {
      session.messages = session.messages.slice();
      session.lastUpdate = Date.now();
    });
    get().updateStat(message);
    get().summarizeSession();
  },
  /**
   * Sends the user's input to the model and streams the reply into the
   * current session.
   *
   * The request carries the templated user text, whereas the session stores
   * the raw `content`, followed by a bot placeholder message that the stream
   * callbacks fill in.
   *
   * @param content - Raw text typed by the user.
   */
  async onUserInput(content) {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;

    const userContent = fillTemplateWith(content, modelConfig);
    console.log("[User Input] after template: ", userContent);

    const userMessage: ChatMessage = createMessage({
      role: "user",
      content: userContent,
    });

    const botMessage: ChatMessage = createMessage({
      role: "assistant",
      streaming: true,
      id: userMessage.id! + 1,
      model: modelConfig.model,
    });

    // The stored user message keeps the raw input, not the templated text.
    const savedUserMessage: ChatMessage = {
      ...userMessage,
      content,
    };

    // Context is collected BEFORE the new messages are stored, so the new
    // user message is appended here explicitly.
    const recentMessages = get().getMessagesWithMemory();
    const sendMessages = recentMessages.concat(userMessage);
    const sessionIndex = get().currentSessionIndex;
    const messageIndex = get().currentSession().messages.length + 1;

    // Key under which this request's controller is registered.
    const controllerKey = () => botMessage.id ?? messageIndex;
    const releaseController = () =>
      ChatControllerPool.remove(sessionIndex, controllerKey());
    // Swap in a new array so the in-place edits to botMessage are published.
    const republishMessages = () =>
      get().updateCurrentSession((session) => {
        session.messages = session.messages.concat();
      });

    // Save the user's and the bot's message.
    get().updateCurrentSession((session) => {
      session.messages = session.messages.concat([
        savedUserMessage,
        botMessage,
      ]);
    });

    // Make the request.
    api.llm.chat({
      messages: sendMessages,
      config: { ...modelConfig, stream: true },
      onUpdate(message) {
        botMessage.streaming = true;
        if (message) {
          botMessage.content = message;
        }
        republishMessages();
      },
      onFinish(message) {
        botMessage.streaming = false;
        if (message) {
          botMessage.content = message;
          get().onNewMessage(botMessage);
        }
        releaseController();
      },
      onError(error) {
        const isAborted = error.message.includes("aborted");
        botMessage.content =
          "\n\n" +
          prettyObject({
            error: true,
            message: error.message,
          });
        botMessage.streaming = false;
        userMessage.isError = !isAborted;
        // The session holds `savedUserMessage`, a copy of `userMessage`;
        // flag the copy too, otherwise the failed user turn is never marked
        // and is still sent as context on later requests.
        savedUserMessage.isError = !isAborted;
        botMessage.isError = !isAborted;

        republishMessages();
        releaseController();

        console.error("[Chat] failed ", error);
      },
      onController(controller) {
        // Collect the controller for stop/retry.
        ChatControllerPool.addController(
          sessionIndex,
          controllerKey(),
          controller,
        );
      },
    });
  },
  /**
   * Wraps the current session's memory summary in a system message.
   *
   * The content is the localized history prompt built from `memoryPrompt`, or
   * an empty string when there is no summary. `date` is left empty.
   */
  getMemoryPrompt() {
    const { memoryPrompt } = get().currentSession();
    const content =
      memoryPrompt.length > 0 ? Locale.Store.Prompt.History(memoryPrompt) : "";

    return { role: "system", content, date: "" } as ChatMessage;
  },
  /**
   * Builds the context sent to the model for the current session.
   *
   * The result is the concatenation, in order, of:
   *   0. a system prompt (only when the mask defines no context prompts),
   *   1. the long-term memory prompt (summary of older messages),
   *   2. the mask's pre-defined in-context prompts,
   *   3. the most recent messages, oldest first.
   * The newest user input is NOT included; the caller appends it.
   *
   * Messages flagged `isError` are skipped, and messages before
   * `clearContextIndex` are never included.
   *
   * @returns The context messages, oldest first.
   */
  getMessagesWithMemory() {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;
    const clearContextIndex = session.clearContextIndex ?? 0;
    const messages = session.messages.slice();
    const totalMessageCount = session.messages.length;

    // In-context prompts defined by the mask.
    const contextPrompts = session.mask.context.slice();

    // System prompt, to get close to OpenAI Web ChatGPT. It is only injected
    // if the user does not use a mask or the mask sets no context prompts.
    const shouldInjectSystemPrompts = contextPrompts.length === 0;
    const systemPrompts = shouldInjectSystemPrompts
      ? [
          createMessage({
            role: "system",
            content: fillTemplateWith("", {
              ...modelConfig,
              template: DEFAULT_SYSTEM_TEMPLATE,
            }),
          }),
        ]
      : [];
    if (shouldInjectSystemPrompts) {
      console.log(
        "[Global System Prompt] ",
        systemPrompts.at(0)?.content ?? "empty",
      );
    }

    // Long-term memory. It is only sent when the summary was taken AFTER the
    // point where the user cleared the context; a summary taken at or before
    // that point describes messages the user asked to forget.
    const shouldSendLongTermMemory =
      modelConfig.sendMemory &&
      session.memoryPrompt &&
      session.memoryPrompt.length > 0 &&
      session.lastSummarizeIndex > clearContextIndex;
    const longTermMemoryPrompts = shouldSendLongTermMemory
      ? [get().getMemoryPrompt()]
      : [];
    const longTermMemoryStartIndex = session.lastSummarizeIndex;

    // Short-term memory: the latest `historyMessageCount` messages.
    const shortTermMemoryStartIndex = Math.max(
      0,
      totalMessageCount - modelConfig.historyMessageCount,
    );

    // With long-term memory, start at whichever index comes first so no
    // message between the summary and the short-term window is lost.
    const memoryStartIndex = shouldSendLongTermMemory
      ? Math.min(longTermMemoryStartIndex, shortTermMemoryStartIndex)
      : shortTermMemoryStartIndex;
    // If the user has cleared the history, exclude everything before that too.
    const contextStartIndex = Math.max(clearContextIndex, memoryStartIndex);
    const maxTokenThreshold = modelConfig.max_tokens;

    // Collect recent messages newest-first until the start index is reached
    // or the estimated token budget is used up.
    const reversedRecentMessages = [];
    for (
      let i = totalMessageCount - 1, tokenCount = 0;
      i >= contextStartIndex && tokenCount < maxTokenThreshold;
      i -= 1
    ) {
      const msg = messages[i];
      if (!msg || msg.isError) continue;
      tokenCount += estimateTokenLength(msg.content);
      reversedRecentMessages.push(msg);
    }

    // Concatenate all parts, restoring chronological order for the recent ones.
    const recentMessages = [
      ...systemPrompts,
      ...longTermMemoryPrompts,
      ...contextPrompts,
      ...reversedRecentMessages.reverse(),
    ];

    return recentMessages;
  },
  /**
   * Applies a mutating `updater` to one message and publishes `sessions`.
   *
   * The updater receives `undefined` when the session or the message does not
   * exist. Indices are resolved with `Array.prototype.at`.
   */
  updateMessage(
    sessionIndex: number,
    messageIndex: number,
    updater: (message?: ChatMessage) => void,
  ) {
    const { sessions } = get();
    const target = sessions.at(sessionIndex)?.messages?.at(messageIndex);
    updater(target);
    set(() => ({ sessions }));
  },
  /** Empties the current session's message list and its memory summary. */
  resetSession() {
    const wipe = (session: ChatSession) => {
      session.messages = [];
      session.memoryPrompt = "";
    };
    get().updateCurrentSession(wipe);
  },
  /**
   * Maintains the current session's topic and long-term memory.
   *
   * 1. Topic: while the session still has `DEFAULT_TOPIC` and its messages
   *    reach `SUMMARIZE_MIN_LEN` (as measured by `countMessages`), the model
   *    is asked for a topic.
   * 2. Memory: when the not-yet-summarized, non-error messages exceed
   *    `compressMessageLengthThreshold` and `sendMemory` is enabled, the model
   *    is asked for a summary, which is written to `memoryPrompt`.
   */
  summarizeSession() {
    const session = get().currentSession();

    // Note: this list still contains error messages; they are only filtered
    // out below, for the memory summary.
    const messages = session.messages;

    // Only ask for a topic once the conversation has some substance.
    const SUMMARIZE_MIN_LEN = 50;
    if (
      session.topic === DEFAULT_TOPIC &&
      countMessages(messages) >= SUMMARIZE_MIN_LEN
    ) {
      const topicMessages = messages.concat(
        createMessage({
          role: "user",
          content: Locale.Store.Prompt.Topic,
        }),
      );
      api.llm.chat({
        messages: topicMessages,
        config: {
          model: "gpt-3.5-turbo",
        },
        onFinish(message) {
          get().updateCurrentSession(
            (session) =>
              (session.topic =
                message.length > 0 ? trimTopic(message) : DEFAULT_TOPIC),
          );
        },
      });
    }

    const modelConfig = session.mask.modelConfig;
    // Start after whichever is later: the last summary or the context clear.
    const summarizeIndex = Math.max(
      session.lastSummarizeIndex,
      session.clearContextIndex ?? 0,
    );
    let toBeSummarizedMsgs = messages
      .filter((msg) => !msg.isError)
      .slice(summarizeIndex);

    const historyMsgLength = countMessages(toBeSummarizedMsgs);

    // The parentheses are required: `a > b ?? c` parses as `(a > b) ?? c`,
    // which would make the 4000 fallback unreachable.
    if (historyMsgLength > (modelConfig?.max_tokens ?? 4000)) {
      const n = toBeSummarizedMsgs.length;
      toBeSummarizedMsgs = toBeSummarizedMsgs.slice(
        Math.max(0, n - modelConfig.historyMessageCount),
      );
    }

    // Prepend the existing memory so the new summary builds on it.
    toBeSummarizedMsgs.unshift(get().getMemoryPrompt());

    const lastSummarizeIndex = session.messages.length;

    console.log(
      "[Chat History] ",
      toBeSummarizedMsgs,
      historyMsgLength,
      modelConfig.compressMessageLengthThreshold,
    );

    if (
      historyMsgLength > modelConfig.compressMessageLengthThreshold &&
      modelConfig.sendMemory
    ) {
      api.llm.chat({
        messages: toBeSummarizedMsgs.concat({
          role: "system",
          content: Locale.Store.Prompt.Summarize,
          date: "",
        }),
        config: { ...modelConfig, stream: true },
        onUpdate(message) {
          session.memoryPrompt = message;
        },
        onFinish(message) {
          console.log("[Memory] ", message);
          session.lastSummarizeIndex = lastSummarizeIndex;
        },
        onError(err) {
          console.error("[Summarize] ", err);
        },
      });
    }
  },
  /** Adds the message's content length to the current session's `charCount`. */
  updateStat(message) {
    const addedChars = message.content.length;
    get().updateCurrentSession((session) => {
      // TODO: should update chat count and word count
      session.stat.charCount += addedChars;
    });
  },
  /**
   * Runs `updater` on the session at `currentSessionIndex` (mutating it in
   * place), then calls `set` with the same `sessions` array.
   */
  updateCurrentSession(updater) {
    const { sessions, currentSessionIndex } = get();
    updater(sessions[currentSessionIndex]);
    set(() => ({ sessions }));
  },
  /**
   * Clears everything in `localStorage` (not only this store's key) and then
   * reloads the page.
   */
  clearAllData() {
    localStorage.clear();
    location.reload();
  },
  518. }),
  519. {
  520. name: StoreKey.Chat,
  521. version: 2,
  /**
   * Upgrades persisted state to the current schema version.
   *
   * The result is always a deep copy (JSON round-trip) of the persisted state.
   * For versions below 2, `globalId` is reset to 0 and every session is rebuilt
   * from an empty session, carrying over only its topic and messages and
   * setting fixed memory options on its mask's model config.
   */
  migrate(persistedState, version) {
    const state = persistedState as any;
    const newState = JSON.parse(JSON.stringify(state)) as ChatStore;

    // Nothing to migrate unless the stored version predates version 2.
    if (!(version < 2)) {
      return newState;
    }

    newState.globalId = 0;
    newState.sessions = [];

    for (const oldSession of state.sessions) {
      const rebuilt = createEmptySession();
      rebuilt.topic = oldSession.topic;
      rebuilt.messages = [...oldSession.messages];

      const rebuiltConfig = rebuilt.mask.modelConfig;
      rebuiltConfig.sendMemory = true;
      rebuiltConfig.historyMessageCount = 4;
      rebuiltConfig.compressMessageLengthThreshold = 1000;

      newState.sessions.push(rebuilt);
    }

    return newState;
  },
  541. },
  542. ),
  543. );