chat.ts 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562
  1. import { create } from "zustand";
  2. import { persist } from "zustand/middleware";
  3. import { trimTopic } from "../utils";
  4. import Locale from "../locales";
  5. import { showToast } from "../components/ui-lib";
  6. import { ModelType } from "./config";
  7. import { createEmptyMask, Mask } from "./mask";
  8. import { StoreKey } from "../constant";
  9. import { api, RequestMessage } from "../client/api";
  10. import { ChatControllerPool } from "../client/controller";
  11. import { prettyObject } from "../utils/format";
  12. import { estimateTokenLength } from "../utils/token";
  /**
   * One entry of a conversation: the request message sent over the wire
   * extended with client-side bookkeeping fields.
   */
  export type ChatMessage = RequestMessage & {
    /** Identifier; `createMessage` defaults it to `Date.now()`. */
    id?: number;
    /** Creation time as a display string (`createMessage` uses `toLocaleString()`). */
    date: string;
    /** Model that produced the message; set on assistant replies. */
    model?: ModelType;
    /** True while the reply is still being streamed in. */
    streaming?: boolean;
    /** Marks a failed exchange; such messages are excluded from later requests. */
    isError?: boolean;
  };
  /**
   * Builds a chat message from default field values, letting `override`
   * replace any of them.
   *
   * @param override - Fields that take precedence over the defaults.
   * @returns A message with `id`, `date`, `role` and `content` always present
   *   unless `override` explicitly replaces them.
   */
  export function createMessage(override: Partial<ChatMessage>): ChatMessage {
    // Defaults: an empty user message stamped with the current time.
    const defaults: ChatMessage = {
      id: Date.now(),
      date: new Date().toLocaleString(),
      role: "user",
      content: "",
    };

    return { ...defaults, ...override };
  }
  /** Running size counters kept for each chat session. */
  export interface ChatStat {
    /** Token counter; initialised to 0 for a new session. */
    tokenCount: number;
    /** Word counter; initialised to 0 for a new session. */
    wordCount: number;
    /** Character counter; grows by the content length of each recorded message. */
    charCount: number;
  }
  /** A single conversation together with its summary state and mask. */
  export interface ChatSession {
    /** Session identifier. */
    id: number;
    /** Title shown for the session; starts as `DEFAULT_TOPIC`. */
    topic: string;
    /** Summary of earlier messages, sent back to the model as long-term memory. */
    memoryPrompt: string;
    /** All messages of the conversation, oldest first. */
    messages: ChatMessage[];
    /** Size counters for this session. */
    stat: ChatStat;
    /** Millisecond timestamp (`Date.now()`) of the last recorded change. */
    lastUpdate: number;
    /** Length of `messages` at the time the last summary was produced. */
    lastSummarizeIndex: number;
    /** Messages before this index are not sent to the model. */
    clearContextIndex?: number;
    /** Mask (preset context and model configuration) used by the session. */
    mask: Mask;
  }
  /** Localised title given to a session that has not been named yet. */
  export const DEFAULT_TOPIC = Locale.Store.DefaultTopic;

  /** Localised assistant greeting, built once when this module is loaded. */
  export const BOT_HELLO: ChatMessage = createMessage({
    content: Locale.Store.BotHello,
    role: "assistant",
  });
  /**
   * Creates a session with no messages, zeroed statistics, the default topic
   * and a fresh empty mask.
   */
  function createEmptySession(): ChatSession {
    // Timestamp plus a random fraction, so sessions created in the same
    // millisecond still get different ids.
    const id = Date.now() + Math.random();
    const stat: ChatStat = { tokenCount: 0, wordCount: 0, charCount: 0 };
    const lastUpdate = Date.now();
    const mask = createEmptyMask();

    return {
      id,
      topic: DEFAULT_TOPIC,
      memoryPrompt: "",
      messages: [],
      stat,
      lastUpdate,
      lastSummarizeIndex: 0,
      mask,
    };
  }
  /** State and actions exposed by the chat store. */
  interface ChatStore {
    /** All sessions; new sessions are inserted at the front. */
    sessions: ChatSession[];
    /** Index into `sessions` of the session currently shown. */
    currentSessionIndex: number;
    /** Counter incremented for every new session and used as its id. */
    globalId: number;

    /** Replaces all sessions with a single empty one. */
    clearSessions: () => void;
    /** Moves a session from one position to another, keeping the selection on the same session. */
    moveSession: (from: number, to: number) => void;
    /** Makes the session at `index` the current one. */
    selectSession: (index: number) => void;
    /** Creates a session (optionally from a mask), puts it first and selects it. */
    newSession: (mask?: Mask) => void;
    /** Removes the session at `index` and offers an undo toast. */
    deleteSession: (index: number) => void;
    /** Returns the current session, clamping an out-of-range index first. */
    currentSession: () => ChatSession;

    /** Records a finished message: refreshes the session, its stats and its summaries. */
    onNewMessage: (message: ChatMessage) => void;
    /** Sends user input to the model and streams the reply into the current session. */
    onUserInput: (content: string) => Promise<void>;
    /** Requests a topic and/or memory summary for the current session when thresholds are met. */
    summarizeSession: () => void;
    /** Adds the message's content length to the current session's character count. */
    updateStat: (message: ChatMessage) => void;
    /** Applies `updater` to the current session in place and publishes the change. */
    updateCurrentSession: (updater: (session: ChatSession) => void) => void;
    /** Applies `updater` to one message (or `undefined` if not found) and publishes the change. */
    updateMessage: (
      sessionIndex: number,
      messageIndex: number,
      updater: (message?: ChatMessage) => void,
    ) => void;
    /** Empties the current session's messages and memory summary. */
    resetSession: () => void;
    /** Returns mask context, optional memory summary and recent messages to send to the model. */
    getMessagesWithMemory: () => ChatMessage[];
    /** Returns the memory summary wrapped as a system message. */
    getMemoryPrompt: () => ChatMessage;
    /** Clears `localStorage` and reloads the page. */
    clearAllData: () => void;
  }
  /**
   * Sums the estimated token length of every message's content.
   *
   * @param msgs - Messages to measure.
   * @returns The total of `estimateTokenLength` over all contents (0 for an empty list).
   */
  function countMessages(msgs: ChatMessage[]) {
    let total = 0;
    msgs.forEach((msg) => {
      total += estimateTokenLength(msg.content);
    });
    return total;
  }
  94. export const useChatStore = create<ChatStore>()(
  95. persist(
  96. (set, get) => ({
  97. sessions: [createEmptySession()],
  98. currentSessionIndex: 0,
  99. globalId: 0,
  // Drop every session and start over with a single empty one selected.
  clearSessions() {
    set(() => {
      const freshSession = createEmptySession();
      return {
        sessions: [freshSession],
        currentSessionIndex: 0,
      };
    });
  },
  // Make the session at `index` the current one (no range check here;
  // currentSession() clamps out-of-range values when it is read).
  selectSession(index: number) {
    set(() => ({ currentSessionIndex: index }));
  },
  // Move a session from position `from` to position `to` and adjust the
  // selected index so it keeps pointing at the same session.
  moveSession(from: number, to: number) {
    set((state) => {
      const selected = state.currentSessionIndex;

      // reorder on a copy so the previous array is left untouched
      const reordered = state.sessions.slice();
      const moved = reordered[from];
      reordered.splice(from, 1);
      reordered.splice(to, 0, moved);

      // the moved session itself stays selected at its new position
      let adjusted = selected;
      if (selected === from) {
        adjusted = to;
      }

      if (from < selected && selected <= to) {
        // a session above the selection moved below it
        adjusted -= 1;
      } else if (to <= selected && selected < from) {
        // a session below the selection moved above it
        adjusted += 1;
      }

      return {
        currentSessionIndex: adjusted,
        sessions: reordered,
      };
    });
  },
  // Create a session (optionally seeded from a mask), give it the next
  // global id, insert it at the front and select it.
  newSession(mask) {
    const created = createEmptySession();

    // bump the counter first, then read it back as this session's id
    set(() => ({ globalId: get().globalId + 1 }));
    created.id = get().globalId;

    if (mask) {
      // shallow copy so later edits to the session's mask do not touch the template
      created.mask = { ...mask };
      created.topic = mask.name;
    }

    set((state) => ({
      currentSessionIndex: 0,
      sessions: [created, ...state.sessions],
    }));
  },
  // Remove the session at `index`, keep a valid selection, and show a toast
  // that can restore the previous state.
  deleteSession(index) {
    const { sessions: previousSessions, currentSessionIndex: previousIndex } =
      get();

    // nothing to do when no session exists at that position
    if (!previousSessions.at(index)) return;

    const wasOnlySession = previousSessions.length === 1;

    const remaining = previousSessions.slice();
    remaining.splice(index, 1);

    // removing a session above the selection shifts the selection up by one
    const shift = Number(index < previousIndex);
    let nextIndex = Math.min(previousIndex - shift, remaining.length - 1);

    if (wasOnlySession) {
      // never leave the store without a session
      nextIndex = 0;
      remaining.push(createEmptySession());
    }

    // for undo delete action
    const restoreState = {
      currentSessionIndex: previousIndex,
      sessions: previousSessions.slice(),
    };

    set(() => ({
      currentSessionIndex: nextIndex,
      sessions: remaining,
    }));

    const undoAction = {
      text: Locale.Home.Revert,
      onClick() {
        set(() => restoreState);
      },
    };
    showToast(Locale.Home.DeleteToast, undoAction, 5000);
  },
  // Return the selected session. An out-of-range index is clamped into
  // [0, sessions.length - 1] and written back to the store first.
  currentSession() {
    const { sessions } = get();
    let index = get().currentSessionIndex;

    const outOfRange = index < 0 || index >= sessions.length;
    if (outOfRange) {
      index = Math.min(sessions.length - 1, Math.max(0, index));
      set(() => ({ currentSessionIndex: index }));
    }

    return sessions[index];
  },
  // Called once a reply is complete: republish the message list, stamp the
  // session, update its stats and trigger summarisation.
  onNewMessage(message) {
    const { updateCurrentSession, updateStat, summarizeSession } = get();

    updateCurrentSession((session) => {
      // new array reference so subscribers notice the in-place message edits
      session.messages = session.messages.concat();
      session.lastUpdate = Date.now();
    });

    updateStat(message);
    summarizeSession();
  },
  /**
   * Sends the user's input to the model and streams the reply into the
   * current session.
   *
   * A user message and a placeholder assistant message are appended to the
   * session immediately; the assistant message object is then mutated in
   * place as the reply arrives and the store is republished after each change.
   *
   * @param content - Text entered by the user.
   */
  async onUserInput(content) {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;

    const userMessage: ChatMessage = createMessage({
      role: "user",
      content,
    });

    // ids are derived from the user message so the three messages stay distinct
    const botMessage: ChatMessage = createMessage({
      role: "assistant",
      streaming: true,
      id: userMessage.id! + 1,
      model: modelConfig.model,
    });

    // Fix: the original template ended with a stray "}" that was sent to the model.
    const systemInfo = createMessage({
      role: "system",
      content: `IMPORTANT: You are a virtual assistant powered by the ${
        modelConfig.model
      } model, now time is ${new Date().toLocaleString()}`,
      id: botMessage.id! + 1,
    });

    // get recent messages
    const systemMessages: ChatMessage[] = [];
    // if user define a mask with context prompts, wont send system info
    if (session.mask.context.length === 0) {
      systemMessages.push(systemInfo);
    }

    const recentMessages = get().getMessagesWithMemory();
    const sendMessages = systemMessages.concat(
      recentMessages.concat(userMessage),
    );

    const sessionIndex = get().currentSessionIndex;
    // fallback controller key, used only if the bot message has no id
    const messageIndex = get().currentSession().messages.length + 1;

    // Republishes the message list with a new array reference so subscribers
    // pick up in-place edits made to userMessage / botMessage.
    const publishMessages = () => {
      get().updateCurrentSession((session) => {
        session.messages = session.messages.concat();
      });
    };

    // save user's and bot's message
    get().updateCurrentSession((session) => {
      session.messages = session.messages.concat([userMessage, botMessage]);
    });

    // make request
    console.log("[User Input] ", sendMessages);
    api.llm.chat({
      messages: sendMessages,
      config: { ...modelConfig, stream: true },
      onUpdate(message) {
        botMessage.streaming = true;
        if (message) {
          botMessage.content = message;
        }
        publishMessages();
      },
      onFinish(message) {
        botMessage.streaming = false;
        if (message) {
          botMessage.content = message;
          get().onNewMessage(botMessage);
        } else {
          // Fix: an empty final message previously left the cleared
          // `streaming` flag unpublished.
          publishMessages();
        }
        ChatControllerPool.remove(
          sessionIndex,
          botMessage.id ?? messageIndex,
        );
      },
      onError(error) {
        // a user-initiated abort is not flagged as an error
        const isAborted = error.message.includes("aborted");
        botMessage.content =
          "\n\n" +
          prettyObject({
            error: true,
            message: error.message,
          });
        botMessage.streaming = false;
        userMessage.isError = !isAborted;
        botMessage.isError = !isAborted;
        publishMessages();
        ChatControllerPool.remove(
          sessionIndex,
          botMessage.id ?? messageIndex,
        );

        console.error("[Chat] failed ", error);
      },
      onController(controller) {
        // collect controller for stop/retry
        ChatControllerPool.addController(
          sessionIndex,
          botMessage.id ?? messageIndex,
          controller,
        );
      },
    });
  },
  // Wrap the current session's memory summary as a system message; the
  // content is an empty string when no summary exists yet.
  getMemoryPrompt() {
    const { memoryPrompt } = get().currentSession();

    let content = "";
    if (memoryPrompt.length > 0) {
      content = Locale.Store.Prompt.History(memoryPrompt);
    }

    return {
      role: "system",
      content,
      date: "",
    } as ChatMessage;
  },
  /**
   * Collects the messages to send with the next request: the mask's context
   * prompts, the memory summary (when enabled and present) and the most
   * recent non-error messages after the cleared-context point.
   *
   * Recent messages are taken newest-first until either the start index is
   * reached or their combined content length reaches twice
   * `compressMessageLengthThreshold`, then returned in chronological order.
   *
   * @returns Context messages followed by the selected recent messages.
   */
  getMessagesWithMemory() {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;
    const clearContextIndex = session.clearContextIndex ?? 0;
    const isSendable = (msg: ChatMessage) => !msg.isError;

    // wont send cleared context messages or failed exchanges
    const messages = session.messages
      .slice(clearContextIndex)
      .filter(isSendable);
    const n = messages.length;

    const context = session.mask.context.slice();

    // long term memory
    if (
      modelConfig.sendMemory &&
      session.memoryPrompt &&
      session.memoryPrompt.length > 0
    ) {
      context.push(get().getMemoryPrompt());
    }

    // get short term and unmemoried long term memory
    const shortTermMemoryMessageIndex = Math.max(
      0,
      n - modelConfig.historyMessageCount,
    );

    // Fix: lastSummarizeIndex is a position in the unfiltered
    // session.messages, while `messages` has been sliced and filtered.
    // Translate it into the same index space by counting the sendable
    // messages between the cleared-context point and the summarised point.
    const longTermMemoryMessageIndex = session.messages
      .slice(
        clearContextIndex,
        Math.max(clearContextIndex, session.lastSummarizeIndex),
      )
      .filter(isSendable).length;

    const mostRecentIndex = Math.max(
      shortTermMemoryMessageIndex,
      longTermMemoryMessageIndex,
    );
    const threshold = modelConfig.compressMessageLengthThreshold * 2;

    // get recent messages as many as possible
    const reversedRecentMessages: ChatMessage[] = [];
    for (
      let i = n - 1, count = 0;
      i >= mostRecentIndex && count < threshold;
      i -= 1
    ) {
      const msg = messages[i];
      if (!msg || msg.isError) continue;
      count += msg.content.length;
      reversedRecentMessages.push(msg);
    }

    // concat
    return context.concat(reversedRecentMessages.reverse());
  },
  // Apply `updater` to one message, addressed by session and message index,
  // then publish the sessions. The updater receives `undefined` when either
  // index does not resolve.
  updateMessage(
    sessionIndex: number,
    messageIndex: number,
    updater: (message?: ChatMessage) => void,
  ) {
    const { sessions } = get();
    const target = sessions.at(sessionIndex)?.messages?.at(messageIndex);
    updater(target);
    set(() => ({ sessions }));
  },
  // Empty the current session: drop its memory summary and all messages.
  resetSession() {
    const { updateCurrentSession } = get();
    updateCurrentSession((session) => {
      session.memoryPrompt = "";
      session.messages = [];
    });
  },
  /**
   * Maintains the two summaries of the current session:
   *
   * 1. Topic: while the session still carries `DEFAULT_TOPIC` and its
   *    messages reach the minimum estimated length, ask the model for a title.
   * 2. Memory: when the not-yet-summarised messages exceed
   *    `compressMessageLengthThreshold` and `sendMemory` is on, ask the model
   *    to compress them into `memoryPrompt`.
   */
  summarizeSession() {
    const session = get().currentSession();
    const messages = session.messages;

    // should summarize topic once the estimated length reaches this minimum
    const SUMMARIZE_MIN_LEN = 50;
    if (
      session.topic === DEFAULT_TOPIC &&
      countMessages(messages) >= SUMMARIZE_MIN_LEN
    ) {
      const topicMessages = messages.concat(
        createMessage({
          role: "user",
          content: Locale.Store.Prompt.Topic,
        }),
      );
      api.llm.chat({
        messages: topicMessages,
        config: {
          model: "gpt-3.5-turbo",
        },
        onFinish(message) {
          get().updateCurrentSession((session) => {
            session.topic =
              message.length > 0 ? trimTopic(message) : DEFAULT_TOPIC;
          });
        },
      });
    }

    const modelConfig = session.mask.modelConfig;
    const summarizeIndex = Math.max(
      session.lastSummarizeIndex,
      session.clearContextIndex ?? 0,
    );

    // Fix: both indices are positions in the unfiltered message list, so
    // slice first and drop error messages afterwards (filtering first shifted
    // the window whenever an error message preceded the index).
    let toBeSummarizedMsgs = messages
      .slice(summarizeIndex)
      .filter((msg) => !msg.isError);

    const historyMsgLength = countMessages(toBeSummarizedMsgs);

    // Fix: `a > b ?? 4000` parses as `(a > b) ?? 4000`, which made the
    // default unreachable; parenthesise so 4000 applies when max_tokens is unset.
    if (historyMsgLength > (modelConfig?.max_tokens ?? 4000)) {
      const n = toBeSummarizedMsgs.length;
      toBeSummarizedMsgs = toBeSummarizedMsgs.slice(
        Math.max(0, n - modelConfig.historyMessageCount),
      );
    }

    // add memory prompt
    toBeSummarizedMsgs.unshift(get().getMemoryPrompt());

    // everything up to here will be covered by the new summary
    const lastSummarizeIndex = session.messages.length;

    console.log(
      "[Chat History] ",
      toBeSummarizedMsgs,
      historyMsgLength,
      modelConfig.compressMessageLengthThreshold,
    );

    if (
      historyMsgLength > modelConfig.compressMessageLengthThreshold &&
      modelConfig.sendMemory
    ) {
      api.llm.chat({
        messages: toBeSummarizedMsgs.concat({
          role: "system",
          content: Locale.Store.Prompt.Summarize,
          date: "",
        }),
        config: { ...modelConfig, stream: true },
        onUpdate(message) {
          session.memoryPrompt = message;
        },
        onFinish(message) {
          console.log("[Memory] ", message);
          session.lastSummarizeIndex = lastSummarizeIndex;
          // Fix: the summary fields are mutated on the captured session
          // outside `set`; publish them the same way updateCurrentSession
          // does so subscribers and the persist middleware see the change.
          set(() => ({ sessions: get().sessions }));
        },
        onError(err) {
          console.error("[Summarize] ", err);
        },
      });
    }
  },
  // Add the message's content length to the current session's character count.
  updateStat(message) {
    const { updateCurrentSession } = get();
    updateCurrentSession((session) => {
      const addedChars = message.content.length;
      session.stat.charCount = session.stat.charCount + addedChars;
      // TODO: should update chat count and word count
    });
  },
  // Let `updater` mutate the selected session in place, then publish the
  // sessions array through `set` so subscribers are notified.
  updateCurrentSession(updater) {
    const { sessions, currentSessionIndex } = get();
    const selected = sessions[currentSessionIndex];
    updater(selected);
    set(() => ({ sessions }));
  },
  // Wipe everything in localStorage (not only this store's key) and reload
  // the page so the app starts from its initial state.
  clearAllData() {
    localStorage.clear();

    location.reload();
  },
  462. }),
  463. {
  464. name: StoreKey.Chat,
  465. version: 2,
  // Upgrade persisted state written by an older store version. States older
  // than version 2 get their sessions rebuilt on top of fresh empty sessions
  // (keeping only topic and messages) and `globalId` reset to 0.
  migrate(persistedState, version) {
    const state = persistedState as any;
    // deep copy via JSON so the persisted object itself is never mutated
    const newState = JSON.parse(JSON.stringify(state)) as ChatStore;

    const needsUpgrade = version < 2;
    if (!needsUpgrade) {
      return newState;
    }

    // Rebuild one legacy session with the fixed memory settings.
    const upgradeSession = (oldSession: any): ChatSession => {
      const upgraded = createEmptySession();
      upgraded.topic = oldSession.topic;
      upgraded.messages = [...oldSession.messages];

      const upgradedConfig = upgraded.mask.modelConfig;
      upgradedConfig.sendMemory = true;
      upgradedConfig.historyMessageCount = 4;
      upgradedConfig.compressMessageLengthThreshold = 1000;
      return upgraded;
    };

    newState.globalId = 0;
    newState.sessions = [];
    for (const oldSession of state.sessions) {
      newState.sessions.push(upgradeSession(oldSession));
    }

    return newState;
  },
  485. },
  486. ),
  487. );