chat.ts 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599
  1. import { create } from "zustand";
  2. import { persist } from "zustand/middleware";
  3. import { trimTopic } from "../utils";
  4. import Locale, { getLang } from "../locales";
  5. import { showToast } from "../components/ui-lib";
  6. import { ModelConfig, ModelType, useAppConfig } from "./config";
  7. import { createEmptyMask, Mask } from "./mask";
  8. import { DEFAULT_INPUT_TEMPLATE, StoreKey } from "../constant";
  9. import { api, RequestMessage } from "../client/api";
  10. import { ChatControllerPool } from "../client/controller";
  11. import { prettyObject } from "../utils/format";
  12. import { estimateTokenLength } from "../utils/token";
  /**
   * One entry of a conversation: the wire-level request message extended with
   * client-side bookkeeping fields.
   */
  export type ChatMessage = RequestMessage & {
    /** Human-readable timestamp of the message. */
    date: string;

    /** True while the reply text is still arriving from the model. */
    streaming?: boolean;

    /** Flags a failed exchange; flagged messages are left out of context and summaries. */
    isError?: boolean;

    /** Numeric identifier of the message. */
    id?: number;

    /** Model the message was requested from. */
    model?: ModelType;
  };
  /**
   * Builds a chat message from defaults, letting `override` replace any field.
   *
   * Defaults: `id` is the current epoch milliseconds, `date` the current
   * locale-formatted time, `role` is `"user"` and `content` is empty.
   *
   * @param override Fields that take precedence over the defaults.
   * @returns The merged message object.
   */
  export function createMessage(override: Partial<ChatMessage>): ChatMessage {
    const defaults: ChatMessage = {
      id: Date.now(),
      date: new Date().toLocaleString(),
      role: "user",
      content: "",
    };
    // Later sources win, so every key present in `override` replaces its default.
    return Object.assign(defaults, override);
  }
  /** Running counters kept for each chat session. */
  export interface ChatStat {
    /** Number of tokens counted for the session. */
    tokenCount: number;

    /** Number of words counted for the session. */
    wordCount: number;

    /** Number of characters counted for the session. */
    charCount: number;
  }
  /** A single conversation together with its summary state and configuration. */
  export interface ChatSession {
    /** Identifier of the session. */
    id: number;

    /** Title of the conversation. */
    topic: string;

    /** Model-written summary of older messages; empty when none exists yet. */
    memoryPrompt: string;

    /** Every message of the conversation, oldest first. */
    messages: ChatMessage[];

    /** Usage counters for the session. */
    stat: ChatStat;

    /** Epoch-millisecond timestamp of the latest update. */
    lastUpdate: number;

    /** Length of `messages` at the time the last summary was requested. */
    lastSummarizeIndex: number;

    /** Messages before this index are excluded from the context sent to the model. */
    clearContextIndex?: number;

    /** Mask (preset prompts plus model configuration) applied to the session. */
    mask: Mask;
  }
  /** Localized placeholder topic used for sessions that have no title yet. */
  export const DEFAULT_TOPIC = Locale.Store.DefaultTopic;

  /** Assistant message carrying the localized greeting text. */
  export const BOT_HELLO: ChatMessage = createMessage({
    content: Locale.Store.BotHello,
    role: "assistant",
  });
  /**
   * Creates a blank session: default topic, no messages, zeroed statistics and
   * an empty mask.
   *
   * @returns A new session whose id combines the current time with a random
   *   fraction.
   */
  function createEmptySession(): ChatSession {
    const id = Date.now() + Math.random();
    const stat = { tokenCount: 0, wordCount: 0, charCount: 0 };
    const lastUpdate = Date.now();
    const mask = createEmptyMask();

    return {
      id,
      topic: DEFAULT_TOPIC,
      memoryPrompt: "",
      messages: [],
      stat,
      lastUpdate,
      lastSummarizeIndex: 0,
      mask,
    };
  }
  /** State and actions exposed by the chat store. */
  interface ChatStore {
    /** All sessions; newly created sessions are placed at the front. */
    sessions: ChatSession[];

    /** Index into `sessions` of the active session. */
    currentSessionIndex: number;

    /** Counter used to assign ids to newly created sessions. */
    globalId: number;

    /** Replaces every session with a single empty one. */
    clearSessions: () => void;

    /** Moves the session at `from` to position `to`, keeping the active session selected. */
    moveSession: (from: number, to: number) => void;

    /** Makes the session at `index` the active one. */
    selectSession: (index: number) => void;

    /** Creates a session (optionally from a mask) and selects it. */
    newSession: (mask?: Mask) => void;

    /** Removes the session at `index` and shows a toast that can revert the removal. */
    deleteSession: (index: number) => void;

    /** Returns the active session. */
    currentSession: () => ChatSession;

    /** Selects the session `delta` positions away, wrapping around the list. */
    nextSession: (delta: number) => void;

    /** Bookkeeping run after a reply has been received. */
    onNewMessage: (message: ChatMessage) => void;

    /** Stores the user's input and requests a reply from the model. */
    onUserInput: (content: string) => Promise<void>;

    /** Requests a topic and/or a memory summary for the active session when due. */
    summarizeSession: () => void;

    /** Adds the message's size to the active session's statistics. */
    updateStat: (message: ChatMessage) => void;

    /** Applies `updater` to the active session and publishes the change. */
    updateCurrentSession: (updater: (session: ChatSession) => void) => void;

    /** Applies `updater` to one message; it receives `undefined` if the lookup fails. */
    updateMessage: (
      sessionIndex: number,
      messageIndex: number,
      updater: (message?: ChatMessage) => void,
    ) => void;

    /** Clears the messages and memory summary of the active session. */
    resetSession: () => void;

    /** Builds the list of messages to send as context for the next request. */
    getMessagesWithMemory: () => ChatMessage[];

    /** Returns the memory summary wrapped as a system message. */
    getMemoryPrompt: () => ChatMessage;

    /** Clears `localStorage` and reloads the page. */
    clearAllData: () => void;
  }
  /**
   * Sums the estimated token length of every message's content.
   *
   * @param msgs Messages to measure.
   * @returns The total of `estimateTokenLength` over all contents; 0 for an empty list.
   */
  function countMessages(msgs: ChatMessage[]) {
    let total = 0;
    for (const { content } of msgs) {
      total += estimateTokenLength(content);
    }
    return total;
  }
  /**
   * Expands the input template of a model configuration.
   *
   * The template is `modelConfig.template`, or `DEFAULT_INPUT_TEMPLATE` when
   * that is null/undefined. It may reference `{{model}}`, `{{time}}`,
   * `{{lang}}` and `{{input}}`. If the template lacks `{{input}}`, the input is
   * appended on its own line so the user's text is never dropped.
   *
   * @param input Raw text typed by the user.
   * @param modelConfig Configuration supplying the model name and the template.
   * @returns The template with every placeholder substituted.
   */
  function fillTemplateWith(input: string, modelConfig: ModelConfig) {
    const vars = {
      model: modelConfig.model,
      time: new Date().toLocaleString(),
      lang: getLang(),
      input: input,
    };

    let output = modelConfig.template ?? DEFAULT_INPUT_TEMPLATE;

    // The template must contain {{input}}; add it when it is missing.
    const inputVar = "{{input}}";
    if (!output.includes(inputVar)) {
      output += "\n" + inputVar;
    }

    for (const [name, value] of Object.entries(vars)) {
      // Substitute literally. A string passed as the replacement argument of
      // replace/replaceAll is scanned for patterns such as "$$" and "$&", which
      // would corrupt user input containing "$". split/join has no such rules.
      output = output.split(`{{${name}}}`).join(value);
    }

    return output;
  }
  /**
   * Chat store: holds every session plus the actions that create, select,
   * delete and summarize sessions and that exchange messages with the model.
   * The state is persisted under `StoreKey.Chat` (schema version 2).
   */
  export const useChatStore = create<ChatStore>()(
    persist(
      (set, get) => ({
        sessions: [createEmptySession()],
        currentSessionIndex: 0,
        globalId: 0,

        /** Replaces every session with a single empty one and selects it. */
        clearSessions() {
          set(() => ({
            sessions: [createEmptySession()],
            currentSessionIndex: 0,
          }));
        },

        /** Makes the session at `index` the active one. */
        selectSession(index: number) {
          set({
            currentSessionIndex: index,
          });
        },

        /**
         * Moves the session at `from` to position `to` and adjusts the active
         * index so the same session stays selected.
         */
        moveSession(from: number, to: number) {
          set((state) => {
            const { sessions, currentSessionIndex: oldIndex } = state;

            // move the session
            const newSessions = [...sessions];
            const session = newSessions[from];
            newSessions.splice(from, 1);
            newSessions.splice(to, 0, session);

            // The active session either is the moved one, or shifts by one
            // when the moved session crossed over it.
            let newIndex = oldIndex === from ? to : oldIndex;
            if (oldIndex > from && oldIndex <= to) {
              newIndex -= 1;
            } else if (oldIndex < from && oldIndex >= to) {
              newIndex += 1;
            }

            return {
              currentSessionIndex: newIndex,
              sessions: newSessions,
            };
          });
        },

        /**
         * Creates a session, puts it at the front of the list and selects it.
         * When a mask is given, its model config is layered over the global
         * model config and the mask name becomes the topic.
         */
        newSession(mask) {
          const session = createEmptySession();

          // Session ids come from the monotonically increasing global counter.
          set(() => ({ globalId: get().globalId + 1 }));
          session.id = get().globalId;

          if (mask) {
            const config = useAppConfig.getState();
            const globalModelConfig = config.modelConfig;

            session.mask = {
              ...mask,
              modelConfig: {
                ...globalModelConfig,
                ...mask.modelConfig,
              },
            };
            session.topic = mask.name;
          }

          set((state) => ({
            currentSessionIndex: 0,
            sessions: [session].concat(state.sessions),
          }));
        },

        /** Selects the session `delta` positions away, wrapping around the list. */
        nextSession(delta) {
          const n = get().sessions.length;
          // Double modulo keeps the result in [0, n) even when delta < -n.
          const limit = (x: number) => ((x % n) + n) % n;
          const i = get().currentSessionIndex;
          get().selectSession(limit(i + delta));
        },

        /**
         * Removes the session at `index`; does nothing if no session is found
         * there. Deleting the only session leaves a fresh empty one. A toast
         * offers to revert the deletion.
         */
        deleteSession(index) {
          const deletingLastSession = get().sessions.length === 1;
          const deletedSession = get().sessions.at(index);

          if (!deletedSession) return;

          const sessions = get().sessions.slice();
          sessions.splice(index, 1);

          // Keep the same session selected: shift left when an earlier session
          // was removed, and clamp to the new end of the list.
          const currentIndex = get().currentSessionIndex;
          let nextIndex = Math.min(
            currentIndex - Number(index < currentIndex),
            sessions.length - 1,
          );

          if (deletingLastSession) {
            nextIndex = 0;
            sessions.push(createEmptySession());
          }

          // for undo delete action
          const restoreState = {
            currentSessionIndex: get().currentSessionIndex,
            sessions: get().sessions.slice(),
          };

          set(() => ({
            currentSessionIndex: nextIndex,
            sessions,
          }));

          showToast(
            Locale.Home.DeleteToast,
            {
              text: Locale.Home.Revert,
              onClick() {
                set(() => restoreState);
              },
            },
            5000,
          );
        },

        /**
         * Returns the active session, first clamping `currentSessionIndex`
         * into the valid range if it is out of bounds.
         */
        currentSession() {
          let index = get().currentSessionIndex;
          const sessions = get().sessions;

          if (index < 0 || index >= sessions.length) {
            index = Math.min(sessions.length - 1, Math.max(0, index));
            set(() => ({ currentSessionIndex: index }));
          }

          const session = sessions[index];

          return session;
        },

        /**
         * Bookkeeping after a reply arrived: refreshes the message array and
         * timestamp, updates statistics and triggers summarization.
         */
        onNewMessage(message) {
          get().updateCurrentSession((session) => {
            // New array reference for the same messages.
            session.messages = session.messages.concat();
            session.lastUpdate = Date.now();
          });
          get().updateStat(message);
          get().summarizeSession();
        },

        /**
         * Stores the user's input together with a placeholder assistant
         * message, then requests a streamed reply for the templated input plus
         * the recent context.
         */
        async onUserInput(content) {
          const session = get().currentSession();
          const modelConfig = session.mask.modelConfig;

          const userContent = fillTemplateWith(content, modelConfig);
          console.log("[User Input] fill with template: ", userContent);

          // Sent to the model: carries the templated text.
          const userMessage: ChatMessage = createMessage({
            role: "user",
            content: userContent,
          });

          // Kept in history: carries the raw text the user typed.
          const savedUserMessage: ChatMessage = {
            ...userMessage,
            content,
          };

          const botMessage: ChatMessage = createMessage({
            role: "assistant",
            streaming: true,
            id: userMessage.id! + 1,
            model: modelConfig.model,
          });

          // get recent messages
          const recentMessages = get().getMessagesWithMemory();
          const sendMessages = recentMessages.concat(userMessage);
          const sessionIndex = get().currentSessionIndex;
          // Index the bot message will have once both messages are appended.
          const messageIndex = get().currentSession().messages.length + 1;

          // save user's and bot's message
          get().updateCurrentSession((session) => {
            session.messages = session.messages.concat([
              savedUserMessage,
              botMessage,
            ]);
          });

          // make request
          console.log("[User Input] ", sendMessages);
          api.llm.chat({
            messages: sendMessages,
            config: { ...modelConfig, stream: true },
            onUpdate(message) {
              botMessage.streaming = true;
              if (message) {
                botMessage.content = message;
              }
              // botMessage is mutated in place; swap the array reference to
              // publish the change.
              get().updateCurrentSession((session) => {
                session.messages = session.messages.concat();
              });
            },
            onFinish(message) {
              botMessage.streaming = false;
              if (message) {
                botMessage.content = message;
                get().onNewMessage(botMessage);
              }
              ChatControllerPool.remove(
                sessionIndex,
                botMessage.id ?? messageIndex,
              );
            },
            onError(error) {
              const isAborted = error.message.includes("aborted");
              // Append the error after whatever was streamed so far (hence the
              // "\n\n" separator) instead of discarding the partial reply.
              botMessage.content +=
                "\n\n" +
                prettyObject({
                  error: true,
                  message: error.message,
                });
              botMessage.streaming = false;
              userMessage.isError = !isAborted;
              // The history holds savedUserMessage, a copy of userMessage, so
              // the flag must be set on the copy to take effect.
              savedUserMessage.isError = !isAborted;
              botMessage.isError = !isAborted;
              get().updateCurrentSession((session) => {
                session.messages = session.messages.concat();
              });
              ChatControllerPool.remove(
                sessionIndex,
                botMessage.id ?? messageIndex,
              );

              console.error("[Chat] failed ", error);
            },
            onController(controller) {
              // collect controller for stop/retry
              ChatControllerPool.addController(
                sessionIndex,
                botMessage.id ?? messageIndex,
                controller,
              );
            },
          });
        },

        /**
         * Wraps the active session's memory summary in a system message; the
         * content is empty when there is no summary.
         */
        getMemoryPrompt() {
          const session = get().currentSession();

          return {
            role: "system",
            content:
              session.memoryPrompt.length > 0
                ? Locale.Store.Prompt.History(session.memoryPrompt)
                : "",
            date: "",
          } as ChatMessage;
        },

        /**
         * Assembles the context for the next request: the memory summary (when
         * applicable), the mask's preset prompts, then as many recent
         * non-error messages as fit under `max_tokens`.
         */
        getMessagesWithMemory() {
          const session = get().currentSession();
          const modelConfig = session.mask.modelConfig;
          const clearContextIndex = session.clearContextIndex ?? 0;
          const messages = session.messages.slice();
          const totalMessageCount = session.messages.length;

          // in-context prompts
          const contextPrompts = session.mask.context.slice();

          // Long term memory. The summary covers messages before
          // lastSummarizeIndex, so it is only relevant when that point lies
          // after the index where the user cleared the context; otherwise it
          // describes nothing but cleared messages.
          const shouldSendLongTermMemory =
            modelConfig.sendMemory &&
            session.memoryPrompt &&
            session.memoryPrompt.length > 0 &&
            session.lastSummarizeIndex > clearContextIndex;
          const longTermMemoryPrompts = shouldSendLongTermMemory
            ? [get().getMemoryPrompt()]
            : [];
          const longTermMemoryStartIndex = session.lastSummarizeIndex;

          // short term memory
          const shortTermMemoryStartIndex = Math.max(
            0,
            totalMessageCount - modelConfig.historyMessageCount,
          );

          // lets concat send messages, including 4 parts:
          // 1. long term memory: summarized memory messages
          // 2. pre-defined in-context prompts
          // 3. short term memory: latest n messages
          // 4. newest input message
          const memoryStartIndex = shouldSendLongTermMemory
            ? Math.min(longTermMemoryStartIndex, shortTermMemoryStartIndex)
            : shortTermMemoryStartIndex;
          // and if user has cleared history messages, we should exclude the memory too.
          const contextStartIndex = Math.max(clearContextIndex, memoryStartIndex);
          const maxTokenThreshold = modelConfig.max_tokens;

          // Walk backwards from the newest message, collecting until the
          // token budget is used up or the context start is reached.
          const reversedRecentMessages = [];
          for (
            let i = totalMessageCount - 1, tokenCount = 0;
            i >= contextStartIndex && tokenCount < maxTokenThreshold;
            i -= 1
          ) {
            const msg = messages[i];
            if (!msg || msg.isError) continue;
            tokenCount += estimateTokenLength(msg.content);
            reversedRecentMessages.push(msg);
          }

          // concat all messages
          const recentMessages = [
            ...longTermMemoryPrompts,
            ...contextPrompts,
            ...reversedRecentMessages.reverse(),
          ];

          return recentMessages;
        },

        /**
         * Applies `updater` to the addressed message and publishes the change.
         * `updater` receives `undefined` when the session or message lookup
         * fails.
         */
        updateMessage(
          sessionIndex: number,
          messageIndex: number,
          updater: (message?: ChatMessage) => void,
        ) {
          const sessions = get().sessions;
          const session = sessions.at(sessionIndex);
          const messages = session?.messages;
          updater(messages?.at(messageIndex));
          set(() => ({ sessions }));
        },

        /** Clears the messages and the memory summary of the active session. */
        resetSession() {
          get().updateCurrentSession((session) => {
            session.messages = [];
            session.memoryPrompt = "";
          });
        },

        /**
         * Requests a topic for sessions that still use the default topic once
         * enough has been said, and requests a memory summary when the
         * unsummarized history exceeds `compressMessageLengthThreshold`.
         */
        summarizeSession() {
          const session = get().currentSession();
          const messages = session.messages;

          // should summarize topic after chatting for at least 50 (estimated) tokens
          const SUMMARIZE_MIN_LEN = 50;
          if (
            session.topic === DEFAULT_TOPIC &&
            countMessages(messages) >= SUMMARIZE_MIN_LEN
          ) {
            const topicMessages = messages.concat(
              createMessage({
                role: "user",
                content: Locale.Store.Prompt.Topic,
              }),
            );
            api.llm.chat({
              messages: topicMessages,
              config: {
                model: "gpt-3.5-turbo",
              },
              onFinish(message) {
                // NOTE(review): this updates whichever session is active when
                // the reply arrives, which may differ from the one summarized.
                get().updateCurrentSession((session) => {
                  session.topic =
                    message.length > 0 ? trimTopic(message) : DEFAULT_TOPIC;
                });
              },
            });
          }

          const modelConfig = session.mask.modelConfig;
          const summarizeIndex = Math.max(
            session.lastSummarizeIndex,
            session.clearContextIndex ?? 0,
          );
          // Drop error messages, then keep only what has not been summarized yet.
          let toBeSummarizedMsgs = messages
            .filter((msg) => !msg.isError)
            .slice(summarizeIndex);

          const historyMsgLength = countMessages(toBeSummarizedMsgs);

          // Parenthesized on purpose: `a > b ?? c` parses as `(a > b) ?? c`,
          // which would never apply the 4000 fallback.
          if (historyMsgLength > (modelConfig?.max_tokens ?? 4000)) {
            const n = toBeSummarizedMsgs.length;
            toBeSummarizedMsgs = toBeSummarizedMsgs.slice(
              Math.max(0, n - modelConfig.historyMessageCount),
            );
          }

          // add memory prompt
          toBeSummarizedMsgs.unshift(get().getMemoryPrompt());

          const lastSummarizeIndex = session.messages.length;

          console.log(
            "[Chat History] ",
            toBeSummarizedMsgs,
            historyMsgLength,
            modelConfig.compressMessageLengthThreshold,
          );

          if (
            historyMsgLength > modelConfig.compressMessageLengthThreshold &&
            modelConfig.sendMemory
          ) {
            api.llm.chat({
              messages: toBeSummarizedMsgs.concat({
                role: "system",
                content: Locale.Store.Prompt.Summarize,
                date: "",
              }),
              config: { ...modelConfig, stream: true },
              onUpdate(message) {
                session.memoryPrompt = message;
              },
              onFinish(message) {
                console.log("[Memory] ", message);
                session.lastSummarizeIndex = lastSummarizeIndex;
                // The session object was mutated in place; go through set() so
                // the summary and its index are published (and thus persisted)
                // rather than lost on reload.
                set(() => ({ sessions: get().sessions }));
              },
              onError(err) {
                console.error("[Summarize] ", err);
              },
            });
          }
        },

        /** Adds the message's character count to the active session's statistics. */
        updateStat(message) {
          get().updateCurrentSession((session) => {
            session.stat.charCount += message.content.length;
            // TODO: should update chat count and word count
          });
        },

        /**
         * Runs `updater` on the active session (mutating it in place) and then
         * publishes the sessions array through `set`.
         */
        updateCurrentSession(updater) {
          const sessions = get().sessions;
          const index = get().currentSessionIndex;
          updater(sessions[index]);
          set(() => ({ sessions }));
        },

        /** Clears `localStorage` and reloads the page. */
        clearAllData() {
          localStorage.clear();
          location.reload();
        },
      }),
      {
        name: StoreKey.Chat,
        version: 2,
        /**
         * Upgrades persisted state. States older than version 2 have their
         * sessions rebuilt from empty sessions, carrying over topic and
         * messages and enabling memory with fixed defaults.
         */
        migrate(persistedState, version) {
          const state = persistedState as any;
          const newState = JSON.parse(JSON.stringify(state)) as ChatStore;

          if (version < 2) {
            newState.globalId = 0;
            newState.sessions = [];

            // Tolerate old states without a sessions array instead of throwing.
            const oldSessions = Array.isArray(state?.sessions)
              ? state.sessions
              : [];
            for (const oldSession of oldSessions) {
              const newSession = createEmptySession();
              newSession.topic = oldSession.topic;
              newSession.messages = [...(oldSession.messages ?? [])];
              newSession.mask.modelConfig.sendMemory = true;
              newSession.mask.modelConfig.historyMessageCount = 4;
              newSession.mask.modelConfig.compressMessageLengthThreshold = 1000;
              newState.sessions.push(newSession);
            }
          }

          return newState;
        },
      },
    ),
  );