chat.ts 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592
  1. import { create } from "zustand";
  2. import { persist } from "zustand/middleware";
  3. import { trimTopic } from "../utils";
  4. import Locale, { getLang } from "../locales";
  5. import { showToast } from "../components/ui-lib";
  6. import { ModelConfig, ModelType, useAppConfig } from "./config";
  7. import { createEmptyMask, Mask } from "./mask";
  8. import { DEFAULT_INPUT_TEMPLATE, StoreKey } from "../constant";
  9. import { api, RequestMessage } from "../client/api";
  10. import { ChatControllerPool } from "../client/controller";
  11. import { prettyObject } from "../utils/format";
  12. import { estimateTokenLength } from "../utils/token";
  /**
   * A single chat entry: the wire-level `RequestMessage` extended with
   * client-side bookkeeping fields.
   */
  export type ChatMessage = RequestMessage & {
    /** Display timestamp; `createMessage` fills it with `new Date().toLocaleString()`. */
    date: string;
    /** `true` while the assistant reply is still being streamed in. */
    streaming?: boolean;
    /** Set by the request error handler when the failure was not an abort. */
    isError?: boolean;
    /** Numeric identifier; `createMessage` defaults it to `Date.now()`. */
    id?: number;
    /** Model associated with the message (set on assistant replies). */
    model?: ModelType;
  };
  /**
   * Build a chat message from defaults plus caller-supplied overrides.
   *
   * Defaults: `id` = current epoch milliseconds, `date` = localized "now",
   * `role` = "user", `content` = "". Any key present in `override` wins.
   *
   * @param override Fields that replace the defaults.
   * @returns The assembled message.
   */
  export function createMessage(override: Partial<ChatMessage>): ChatMessage {
    const defaults: ChatMessage = {
      id: Date.now(),
      date: new Date().toLocaleString(),
      role: "user",
      content: "",
    };
    return { ...defaults, ...override };
  }
  /** Per-session usage counters. */
  export interface ChatStat {
    /** Token counter; initialised to 0 for a new session. */
    tokenCount: number;
    /** Word counter; initialised to 0 for a new session. */
    wordCount: number;
    /** Character counter; `updateStat` adds each new message's content length. */
    charCount: number;
  }
  /** One conversation: its messages plus summary and context bookkeeping. */
  export interface ChatSession {
    /** Session identifier; `newSession` assigns it from the store's `globalId`. */
    id: number;
    /** Session title; starts as `DEFAULT_TOPIC`. */
    topic: string;
    /** Running summary of earlier messages, written by `summarizeSession`. */
    memoryPrompt: string;
    /** Messages of the conversation, oldest first. */
    messages: ChatMessage[];
    /** Usage counters for this session. */
    stat: ChatStat;
    /** Epoch milliseconds of the last recorded activity. */
    lastUpdate: number;
    /** `messages.length` captured when the last finished summary was requested. */
    lastSummarizeIndex: number;
    /** When set, messages before this index are left out of the request context. */
    clearContextIndex?: number;
    /** Mask supplying the model config and pre-defined context prompts. */
    mask: Mask;
  }
  /** Topic assigned to every newly created session. */
  export const DEFAULT_TOPIC = Locale.Store.DefaultTopic;

  /** Pre-built assistant greeting message. */
  export const BOT_HELLO: ChatMessage = createMessage({
    content: Locale.Store.BotHello,
    role: "assistant",
  });
  /**
   * Create a blank session: default topic, no messages, zeroed counters and
   * an empty mask.
   *
   * The id is `Date.now()` plus a random fraction.
   */
  function createEmptySession(): ChatSession {
    const id = Date.now() + Math.random();
    const stat: ChatStat = { tokenCount: 0, wordCount: 0, charCount: 0 };
    const lastUpdate = Date.now();
    const mask = createEmptyMask();

    return {
      id,
      topic: DEFAULT_TOPIC,
      memoryPrompt: "",
      messages: [],
      stat,
      lastUpdate,
      lastSummarizeIndex: 0,
      mask,
    };
  }
  /** State and actions exposed by `useChatStore`. */
  interface ChatStore {
    /** All sessions; `newSession` inserts at the front. */
    sessions: ChatSession[];
    /** Index into `sessions` of the active session. */
    currentSessionIndex: number;
    /** Counter incremented by `newSession` to hand out session ids. */
    globalId: number;

    /** Replace all sessions with a single empty one. */
    clearSessions: () => void;
    /** Move the session at `from` to position `to`, keeping the active session selected. */
    moveSession: (from: number, to: number) => void;
    /** Make the session at `index` the active one. */
    selectSession: (index: number) => void;
    /** Create a session (optionally from a mask) and select it. */
    newSession: (mask?: Mask) => void;
    /** Remove the session at `index`, offering an undo toast. */
    deleteSession: (index: number) => void;
    /** Return the active session, clamping an out-of-range index. */
    currentSession: () => ChatSession;
    /** Bookkeeping after a completed reply: stats and summarization. */
    onNewMessage: (message: ChatMessage) => void;
    /** Send user input to the model and stream the reply into the session. */
    onUserInput: (content: string) => Promise<void>;
    /** Generate a topic and/or compress history into `memoryPrompt` when thresholds are met. */
    summarizeSession: () => void;
    /** Add the message's length to the active session's counters. */
    updateStat: (message: ChatMessage) => void;
    /** Run `updater` on the active session, then publish `sessions`. */
    updateCurrentSession: (updater: (session: ChatSession) => void) => void;
    /** Run `updater` on one message (or `undefined` if not found), then publish `sessions`. */
    updateMessage: (
      sessionIndex: number,
      messageIndex: number,
      updater: (message?: ChatMessage) => void,
    ) => void;
    /** Clear the active session's messages and memory prompt. */
    resetSession: () => void;
    /** Assemble the context messages to send with the next request. */
    getMessagesWithMemory: () => ChatMessage[];
    /** Build the system message carrying the session summary. */
    getMemoryPrompt: () => ChatMessage;
    /** Clear local storage and reload the page. */
    clearAllData: () => void;
  }
  /**
   * Sum the estimated token length of every message's content.
   *
   * @param msgs Messages to measure.
   * @returns Total of `estimateTokenLength(content)` over all messages; 0 when empty.
   */
  function countMessages(msgs: ChatMessage[]) {
    let total = 0;
    msgs.forEach((msg) => {
      total += estimateTokenLength(msg.content);
    });
    return total;
  }
  /**
   * Expand the input template of a model config.
   *
   * Supported placeholders: `{{model}}`, `{{time}}`, `{{lang}}`, `{{input}}`.
   * When the template lacks `{{input}}`, it is appended on a new line so the
   * user's text is never dropped.
   *
   * @param input Raw text typed by the user.
   * @param modelConfig Supplies `model` and the optional `template`
   *   (falls back to `DEFAULT_INPUT_TEMPLATE`).
   * @returns The template with every placeholder substituted.
   */
  function fillTemplateWith(input: string, modelConfig: ModelConfig) {
    const vars = {
      model: modelConfig.model,
      time: new Date().toLocaleString(),
      lang: getLang(),
      input: input,
    };

    let output = modelConfig.template ?? DEFAULT_INPUT_TEMPLATE;

    // the template must contain {{input}}
    const inputVar = "{{input}}";
    if (!output.includes(inputVar)) {
      output += "\n" + inputVar;
    }

    for (const [name, value] of Object.entries(vars)) {
      // A replacer function inserts `value` verbatim. A plain string
      // replacement would interpret `$&`, `$$`, `$'`, … inside the value,
      // corrupting user input that happens to contain `$` sequences.
      output = output.replaceAll(`{{${name}}}`, () => value);
    }

    return output;
  }
  112. export const useChatStore = create<ChatStore>()(
  113. persist(
  114. (set, get) => ({
  115. sessions: [createEmptySession()],
  116. currentSessionIndex: 0,
  117. globalId: 0,
  /** Drop every session and start over with one empty session selected. */
  clearSessions() {
    const fresh = createEmptySession();
    set({ sessions: [fresh], currentSessionIndex: 0 });
  },
  /**
   * Make the session at `index` the active one.
   * The index is stored as given; `currentSession` clamps it on read.
   */
  selectSession(index: number) {
    set(() => ({ currentSessionIndex: index }));
  },
  /**
   * Move the session at position `from` to position `to` and adjust
   * `currentSessionIndex` so the same session stays selected.
   */
  moveSession(from: number, to: number) {
    set(({ sessions, currentSessionIndex }) => {
      // relocate the session inside a copy of the list
      const reordered = sessions.slice();
      const moved = reordered[from];
      reordered.splice(from, 1);
      reordered.splice(to, 0, moved);

      // follow the selected session to its new position
      let nextIndex: number;
      if (currentSessionIndex === from) {
        nextIndex = to;
      } else if (currentSessionIndex > from && currentSessionIndex <= to) {
        // an earlier item moved behind the selection: it shifts up by one
        nextIndex = currentSessionIndex - 1;
      } else if (currentSessionIndex < from && currentSessionIndex >= to) {
        // a later item moved in front of the selection: it shifts down by one
        nextIndex = currentSessionIndex + 1;
      } else {
        nextIndex = currentSessionIndex;
      }

      return {
        currentSessionIndex: nextIndex,
        sessions: reordered,
      };
    });
  },
  /**
   * Create a session, put it at the front of the list and select it.
   *
   * The session id comes from the incremented `globalId`. When a mask is
   * given, its model config is layered over the global model config and the
   * mask name becomes the topic.
   */
  newSession(mask) {
    const session = createEmptySession();

    const bumpedId = get().globalId + 1;
    set({ globalId: bumpedId });
    session.id = get().globalId;

    if (mask) {
      const { modelConfig: globalModelConfig } = useAppConfig.getState();
      const mergedModelConfig = {
        ...globalModelConfig,
        ...mask.modelConfig,
      };
      session.mask = { ...mask, modelConfig: mergedModelConfig };
      session.topic = mask.name;
    }

    set(({ sessions }) => ({
      currentSessionIndex: 0,
      sessions: [session, ...sessions],
    }));
  },
  /**
   * Remove the session at `index` and show a toast that can undo the deletion.
   *
   * Does nothing when no session exists at `index`. Deleting the only
   * session leaves a fresh empty one in its place.
   */
  deleteSession(index) {
    const { sessions: before, currentSessionIndex: currentIndex } = get();
    if (!before.at(index)) return;

    // snapshot for the undo action
    const restoreState = {
      currentSessionIndex: currentIndex,
      sessions: before.slice(),
    };

    const remaining = before.slice();
    remaining.splice(index, 1);

    let nextIndex: number;
    if (before.length === 1) {
      // the list must never be empty
      remaining.push(createEmptySession());
      nextIndex = 0;
    } else {
      // a removal in front of the selection shifts it one slot to the left
      const shift = index < currentIndex ? 1 : 0;
      nextIndex = Math.min(currentIndex - shift, remaining.length - 1);
    }

    set({ currentSessionIndex: nextIndex, sessions: remaining });

    showToast(
      Locale.Home.DeleteToast,
      {
        text: Locale.Home.Revert,
        onClick() {
          set(() => restoreState);
        },
      },
      5000,
    );
  },
  /**
   * Return the active session.
   *
   * An out-of-range `currentSessionIndex` is clamped into
   * `[0, sessions.length - 1]` and the corrected value is written back.
   */
  currentSession() {
    const { sessions, currentSessionIndex } = get();

    let index = currentSessionIndex;
    const outOfRange = index < 0 || index >= sessions.length;
    if (outOfRange) {
      index = Math.min(sessions.length - 1, Math.max(0, index));
      set({ currentSessionIndex: index });
    }

    return sessions[index];
  },
  /**
   * Bookkeeping after a reply has been received: refresh the message list
   * reference and `lastUpdate`, update the stats, then try to summarize.
   */
  onNewMessage(message) {
    get().updateCurrentSession((session) => {
      // new array reference, same items
      session.messages = session.messages.slice();
      session.lastUpdate = Date.now();
    });

    get().updateStat(message);
    get().summarizeSession();
  },
  /**
   * Send the user's input to the model and stream the reply into the
   * current session.
   *
   * Steps:
   * 1. Expand the input through the model's template.
   * 2. Gather the context (memory + recent messages) and append the new message.
   * 3. Store the user message (raw input) and a streaming placeholder for the reply.
   * 4. Start the chat request; its callbacks update the placeholder in place.
   *
   * @param content Raw text typed by the user.
   */
  async onUserInput(content) {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;

    const userContent = fillTemplateWith(content, modelConfig);
    console.log("[User Input] fill with template: ", userContent);

    const userMessage: ChatMessage = createMessage({
      role: "user",
      content: userContent,
    });

    const botMessage: ChatMessage = createMessage({
      role: "assistant",
      streaming: true,
      id: userMessage.id! + 1,
      model: modelConfig.model,
    });

    // The session keeps the raw input; only the request carries the
    // template-expanded text.
    const savedUserMessage: ChatMessage = {
      ...userMessage,
      content,
    };

    // get recent messages (before the new pair is stored)
    const recentMessages = get().getMessagesWithMemory();
    const sendMessages = recentMessages.concat(userMessage);
    const sessionIndex = get().currentSessionIndex;
    const messageIndex = get().currentSession().messages.length + 1;

    // save user's and bot's message
    get().updateCurrentSession((session) => {
      session.messages = session.messages.concat([
        savedUserMessage,
        botMessage,
      ]);
    });

    // make request
    console.log("[User Input] ", sendMessages);
    api.llm.chat({
      messages: sendMessages,
      config: { ...modelConfig, stream: true },
      onUpdate(message) {
        botMessage.streaming = true;
        if (message) {
          botMessage.content = message;
        }
        // republish with a new array reference; botMessage was mutated in place
        get().updateCurrentSession((session) => {
          session.messages = session.messages.concat();
        });
      },
      onFinish(message) {
        botMessage.streaming = false;
        if (message) {
          botMessage.content = message;
          get().onNewMessage(botMessage);
        }
        ChatControllerPool.remove(
          sessionIndex,
          botMessage.id ?? messageIndex,
        );
      },
      onError(error) {
        const isAborted = error.message.includes("aborted");
        botMessage.content =
          "\n\n" +
          prettyObject({
            error: true,
            message: error.message,
          });
        botMessage.streaming = false;
        userMessage.isError = !isAborted;
        // The session holds `savedUserMessage` (a copy), so the flag must be
        // set there as well or the stored user message is never marked.
        savedUserMessage.isError = !isAborted;
        botMessage.isError = !isAborted;
        get().updateCurrentSession((session) => {
          session.messages = session.messages.concat();
        });
        ChatControllerPool.remove(
          sessionIndex,
          botMessage.id ?? messageIndex,
        );

        console.error("[Chat] failed ", error);
      },
      onController(controller) {
        // collect controller for stop/retry
        ChatControllerPool.addController(
          sessionIndex,
          botMessage.id ?? messageIndex,
          controller,
        );
      },
    });
  },
  /**
   * Build the system message that carries the session summary.
   *
   * @returns A `system` message whose content is the localized history
   *   prompt wrapping `memoryPrompt`, or an empty string when there is no
   *   summary yet. `date` is left empty.
   */
  getMemoryPrompt() {
    const { memoryPrompt } = get().currentSession();
    const content =
      memoryPrompt.length > 0 ? Locale.Store.Prompt.History(memoryPrompt) : "";

    return { role: "system", content, date: "" } as ChatMessage;
  },
  /**
   * Assemble the context messages for the next request.
   *
   * The result is the concatenation of:
   * 1. long term memory: the summary prompt (when enabled and still valid),
   * 2. the mask's pre-defined in-context prompts,
   * 3. short term memory: the most recent messages, newest last, skipping
   *    error messages and bounded by `max_tokens` (estimated).
   *
   * The newest user input is NOT included; the caller appends it.
   *
   * @returns Context messages in send order.
   */
  getMessagesWithMemory() {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;
    const clearContextIndex = session.clearContextIndex ?? 0;
    const messages = session.messages.slice();
    const totalMessageCount = session.messages.length;

    // in-context prompts
    const contextPrompts = session.mask.context.slice();

    // long term memory
    // The summary is only valid when it covers messages after the point
    // where the user cleared the context; a summary made at or before that
    // point describes history the user asked to forget.
    const shouldSendLongTermMemory =
      modelConfig.sendMemory &&
      session.memoryPrompt &&
      session.memoryPrompt.length > 0 &&
      session.lastSummarizeIndex > clearContextIndex;
    const longTermMemoryPrompts = shouldSendLongTermMemory
      ? [get().getMemoryPrompt()]
      : [];
    const longTermMemoryStartIndex = session.lastSummarizeIndex;

    // short term memory
    const shortTermMemoryStartIndex = Math.max(
      0,
      totalMessageCount - modelConfig.historyMessageCount,
    );

    // When the summary is sent, everything after it must be sent too, so
    // start at whichever index is earlier. Without a summary only the
    // configured number of recent messages is used.
    const memoryStartIndex = shouldSendLongTermMemory
      ? Math.min(longTermMemoryStartIndex, shortTermMemoryStartIndex)
      : shortTermMemoryStartIndex;
    // and if user has cleared history messages, we should exclude the memory too.
    const contextStartIndex = Math.max(clearContextIndex, memoryStartIndex);
    const maxTokenThreshold = modelConfig.max_tokens;

    // get recent messages as much as possible, walking from newest to oldest
    const reversedRecentMessages: ChatMessage[] = [];
    for (
      let i = totalMessageCount - 1, tokenCount = 0;
      i >= contextStartIndex && tokenCount < maxTokenThreshold;
      i -= 1
    ) {
      const msg = messages[i];
      if (!msg || msg.isError) continue;
      tokenCount += estimateTokenLength(msg.content);
      reversedRecentMessages.push(msg);
    }

    // concat all messages
    const recentMessages = [
      ...longTermMemoryPrompts,
      ...contextPrompts,
      ...reversedRecentMessages.reverse(),
    ];

    return recentMessages;
  },
  /**
   * Apply `updater` to one message and publish the sessions.
   *
   * `updater` receives `undefined` when the session or message index does
   * not resolve to a message.
   */
  updateMessage(
    sessionIndex: number,
    messageIndex: number,
    updater: (message?: ChatMessage) => void,
  ) {
    const { sessions } = get();
    const target = sessions.at(sessionIndex)?.messages?.at(messageIndex);
    updater(target);
    set({ sessions });
  },
  /** Empty the active session's messages and forget its summary. */
  resetSession() {
    get().updateCurrentSession((session) => {
      Object.assign(session, { messages: [], memoryPrompt: "" });
    });
  },
  /**
   * Housekeeping for the active session after a reply:
   *
   * 1. Topic: while the session still has the default topic and the
   *    conversation has reached `SUMMARIZE_MIN_LEN` estimated tokens, ask
   *    the model for a title.
   * 2. Memory: when the not-yet-summarized history exceeds
   *    `compressMessageLengthThreshold` and `sendMemory` is on, ask the
   *    model to compress it into `memoryPrompt`.
   */
  summarizeSession() {
    const session = get().currentSession();
    const messages = session.messages;

    // should summarize topic after chatting more than 50 (estimated) tokens
    const SUMMARIZE_MIN_LEN = 50;
    if (
      session.topic === DEFAULT_TOPIC &&
      countMessages(messages) >= SUMMARIZE_MIN_LEN
    ) {
      const topicMessages = messages.concat(
        createMessage({
          role: "user",
          content: Locale.Store.Prompt.Topic,
        }),
      );
      api.llm.chat({
        messages: topicMessages,
        config: {
          model: "gpt-3.5-turbo",
        },
        onFinish(message) {
          get().updateCurrentSession(
            (session) =>
              (session.topic =
                message.length > 0 ? trimTopic(message) : DEFAULT_TOPIC),
          );
        },
      });
    }

    const modelConfig = session.mask.modelConfig;
    const summarizeIndex = Math.max(
      session.lastSummarizeIndex,
      session.clearContextIndex ?? 0,
    );
    // `summarizeIndex` refers to positions in the full message list, so
    // slice first and drop error messages afterwards; filtering first would
    // shift the positions and skip unsummarized messages.
    let toBeSummarizedMsgs = messages
      .slice(summarizeIndex)
      .filter((msg) => !msg.isError);

    const historyMsgLength = countMessages(toBeSummarizedMsgs);

    // Parentheses are required: `a > b ?? c` parses as `(a > b) ?? c`,
    // which would make the 4000 default unreachable.
    if (historyMsgLength > (modelConfig?.max_tokens ?? 4000)) {
      // too long for one request: keep only the most recent messages
      const n = toBeSummarizedMsgs.length;
      toBeSummarizedMsgs = toBeSummarizedMsgs.slice(
        Math.max(0, n - modelConfig.historyMessageCount),
      );
    }

    // add memory prompt
    toBeSummarizedMsgs.unshift(get().getMemoryPrompt());

    // captured now: messages arriving during the request are not summarized
    const lastSummarizeIndex = session.messages.length;

    console.log(
      "[Chat History] ",
      toBeSummarizedMsgs,
      historyMsgLength,
      modelConfig.compressMessageLengthThreshold,
    );

    if (
      historyMsgLength > modelConfig.compressMessageLengthThreshold &&
      modelConfig.sendMemory
    ) {
      api.llm.chat({
        messages: toBeSummarizedMsgs.concat({
          role: "system",
          content: Locale.Store.Prompt.Summarize,
          date: "",
        }),
        config: { ...modelConfig, stream: true },
        onUpdate(message) {
          // NOTE: written on the session object directly, without set()
          session.memoryPrompt = message;
        },
        onFinish(message) {
          console.log("[Memory] ", message);
          session.lastSummarizeIndex = lastSummarizeIndex;
        },
        onError(err) {
          console.error("[Summarize] ", err);
        },
      });
    }
  },
  /** Add the message's content length to the active session's `charCount`. */
  updateStat(message) {
    get().updateCurrentSession(({ stat }) => {
      stat.charCount += message.content.length;
      // TODO: should update chat count and word count
    });
  },
  /**
   * Run `updater` against the active session (mutating it in place) and
   * then publish the `sessions` array through `set`.
   */
  updateCurrentSession(updater) {
    const { sessions, currentSessionIndex } = get();
    updater(sessions[currentSessionIndex]);
    set({ sessions });
  },
  /**
   * Clear the whole of `localStorage` (not only this store's key) and
   * reload the page.
   */
  clearAllData() {
    localStorage.clear();
    location.reload();
  },
  487. }),
  488. {
  489. name: StoreKey.Chat,
  490. version: 2,
  /**
   * Upgrade persisted state to the current schema.
   *
   * The state is deep-copied through JSON. For versions below 2, `globalId`
   * is reset and every session is rebuilt from an empty session, keeping
   * only topic and messages and applying fixed memory settings.
   */
  migrate(persistedState, version) {
    const state = persistedState as any;
    const newState = JSON.parse(JSON.stringify(state)) as ChatStore;

    if (version < 2) {
      newState.globalId = 0;
      newState.sessions = Array.from(
        state.sessions as Iterable<any>,
        (oldSession) => {
          const migrated = createEmptySession();
          migrated.topic = oldSession.topic;
          migrated.messages = [...oldSession.messages];
          Object.assign(migrated.mask.modelConfig, {
            sendMemory: true,
            historyMessageCount: 4,
            compressMessageLengthThreshold: 1000,
          });
          return migrated;
        },
      );
    }

    return newState;
  },
  510. },
  511. ),
  512. );