chat.ts 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670
  1. import { trimTopic } from "../utils";
  2. import Locale, { getLang } from "../locales";
  3. import { showToast } from "../components/ui-lib";
  4. import { ModelConfig, ModelType, useAppConfig } from "./config";
  5. import { createEmptyMask, Mask } from "./mask";
  6. import {
  7. DEFAULT_INPUT_TEMPLATE,
  8. DEFAULT_SYSTEM_TEMPLATE,
  9. KnowledgeCutOffDate,
  10. StoreKey,
  11. SUMMARIZE_MODEL,
  12. } from "../constant";
  13. import { api, RequestMessage } from "../client/api";
  14. import { ChatControllerPool } from "../client/controller";
  15. import { prettyObject } from "../utils/format";
  16. import { estimateTokenLength } from "../utils/token";
  17. import { nanoid } from "nanoid";
  18. import { createPersistStore } from "../utils/store";
  /**
   * A message as kept inside a chat session: the wire-level `RequestMessage`
   * extended with the bookkeeping fields below.
   */
  export type ChatMessage = RequestMessage & {
    /** Message identifier; `createMessage` fills it with `nanoid()`. */
    id: string;
    /** Timestamp text; `createMessage` fills it with `new Date().toLocaleString()`. */
    date: string;
    /** Model recorded on the message (set on bot replies in `onUserInput`). */
    model?: ModelType;
    /** True while the reply is still being streamed in. */
    streaming?: boolean;
    /** Set when the request failed; flagged messages are skipped when context is built. */
    isError?: boolean;
  };
  /**
   * Creates a chat message from defaults plus caller-supplied fields.
   *
   * Defaults: a fresh `nanoid()` id, the current local date/time string,
   * role `"user"` and empty content.
   *
   * @param override Fields that replace the defaults (any subset of `ChatMessage`).
   * @returns The merged message.
   */
  export function createMessage(override: Partial<ChatMessage>): ChatMessage {
    const defaults: ChatMessage = {
      id: nanoid(),
      date: new Date().toLocaleString(),
      role: "user",
      content: "",
    };

    // Later spread wins, so anything present in `override` replaces the default.
    return { ...defaults, ...override };
  }
  /**
   * Running counters attached to a session.
   *
   * In this file all three start at 0 and only `charCount` is ever increased
   * (see the TODO in `updateStat`).
   */
  export interface ChatStat {
    /** Number of characters accumulated from message contents. */
    charCount: number;
    /** Word counter (initialised to 0; not updated in this file). */
    wordCount: number;
    /** Token counter (initialised to 0; not updated in this file). */
    tokenCount: number;
  }
  /** One conversation: its messages, its summary state and the mask it runs with. */
  export interface ChatSession {
    /** Session identifier (a `nanoid()` for sessions created in this file). */
    id: string;
    /** Title of the conversation; starts as `DEFAULT_TOPIC`. */
    topic: string;
    /** Mask (including the per-session model config) the session uses. */
    mask: Mask;

    /** All messages of the conversation, oldest first. */
    messages: ChatMessage[];
    /** When set, messages before this index are excluded from the request context. */
    clearContextIndex?: number;

    /** Summary text of older messages, produced by `summarizeSession`. */
    memoryPrompt: string;
    /** Message count at the time the last summary finished. */
    lastSummarizeIndex: number;

    /** Usage counters for the session. */
    stat: ChatStat;
    /** `Date.now()` timestamp of the last recorded update. */
    lastUpdate: number;
  }
  /** Topic given to every newly created session (taken from the active locale). */
  export const DEFAULT_TOPIC = Locale.Store.DefaultTopic;

  /**
   * Ready-made assistant greeting message.
   * It is built once when the module is loaded, so its `id` and `date` are fixed at that time.
   */
  export const BOT_HELLO: ChatMessage = createMessage({
    content: Locale.Store.BotHello,
    role: "assistant",
  });
  /**
   * Builds a blank session: new id, default topic, no messages, no summary,
   * zeroed counters, and an empty mask from `createEmptyMask()`.
   *
   * @returns A fresh `ChatSession` stamped with the current time.
   */
  function createEmptySession(): ChatSession {
    const zeroedStat: ChatStat = { tokenCount: 0, wordCount: 0, charCount: 0 };

    return {
      id: nanoid(),
      topic: DEFAULT_TOPIC,
      memoryPrompt: "",
      messages: [],
      stat: zeroedStat,
      lastUpdate: Date.now(),
      lastSummarizeIndex: 0,
      mask: createEmptyMask(),
    };
  }
  /**
   * Chooses the model used for summarisation requests.
   *
   * @param currentModel Name of the model the session is using.
   * @returns `SUMMARIZE_MODEL` when the name starts with `"gpt"`, otherwise `currentModel` unchanged.
   */
  function getSummarizeModel(currentModel: string) {
    // gpt-* sessions are always summarised with the dedicated summarize model
    if (currentModel.startsWith("gpt")) {
      return SUMMARIZE_MODEL;
    }
    return currentModel;
  }
  /**
   * Shape of the chat store: persisted state plus the actions operating on it.
   * The member list mirrors the `methods` object passed to `createPersistStore` below.
   */
  interface ChatStore {
    // ---- persisted state ----
    sessions: ChatSession[];
    currentSessionIndex: number;

    // ---- session list management ----
    newSession: (mask?: Mask) => void;
    selectSession: (index: number) => void;
    nextSession: (delta: number) => void;
    moveSession: (from: number, to: number) => void;
    deleteSession: (index: number) => void;
    clearSessions: () => void;
    currentSession: () => ChatSession;

    // ---- mutating the current session ----
    updateCurrentSession: (updater: (session: ChatSession) => void) => void;
    updateMessage: (
      sessionIndex: number,
      messageIndex: number,
      updater: (message?: ChatMessage) => void,
    ) => void;
    updateStat: (message: ChatMessage) => void;
    resetSession: () => void;

    // ---- chatting and memory ----
    onUserInput: (content: string) => Promise<void>;
    onNewMessage: (message: ChatMessage) => void;
    summarizeSession: () => void;
    getMessagesWithMemory: () => ChatMessage[];
    getMemoryPrompt: () => ChatMessage;

    // ---- maintenance ----
    clearAllData: () => void;
  }
  /**
   * Sums `estimateTokenLength` over the content of every message.
   *
   * @param msgs Messages to measure.
   * @returns The total estimated length; 0 for an empty list.
   */
  function countMessages(msgs: ChatMessage[]) {
    let total = 0;
    for (const msg of msgs) {
      total += estimateTokenLength(msg.content);
    }
    return total;
  }
  /**
   * Expands a message template by substituting `{{name}}` placeholders.
   *
   * Supported placeholders: `{{cutoff}}`, `{{model}}`, `{{time}}`, `{{lang}}`
   * and `{{input}}`. The template is `modelConfig.template`, falling back to
   * `DEFAULT_INPUT_TEMPLATE`; if it lacks `{{input}}`, the placeholder is
   * appended on a new line so the user's text is never dropped.
   *
   * @param input Raw text typed by the user (inserted verbatim).
   * @param modelConfig Model configuration supplying the model name and template.
   * @returns The template with every known placeholder replaced.
   */
  function fillTemplateWith(input: string, modelConfig: ModelConfig) {
    const cutoff =
      KnowledgeCutOffDate[modelConfig.model] ?? KnowledgeCutOffDate.default;

    const vars = {
      cutoff,
      model: modelConfig.model,
      time: new Date().toLocaleString(),
      lang: getLang(),
      input: input,
    };

    let output = modelConfig.template ?? DEFAULT_INPUT_TEMPLATE;

    // the template must contain {{input}}
    const inputVar = "{{input}}";
    if (!output.includes(inputVar)) {
      output += "\n" + inputVar;
    }

    for (const [name, value] of Object.entries(vars)) {
      // Use a replacer function rather than a replacement string: with a string,
      // sequences such as `$&`, `$$` or "$'" inside the value (e.g. user input
      // that mentions prices or shell variables) are interpreted as replacement
      // patterns and would corrupt the text.
      output = output.replaceAll(`{{${name}}}`, () => value);
    }

    return output;
  }
  /**
   * Initial store state handed to `createPersistStore`:
   * a single empty session, which is also the selected one.
   */
  const DEFAULT_CHAT_STATE = {
    // one blank conversation so there is always a session at index 0
    sessions: [createEmptySession()],
    currentSessionIndex: 0,
  };
  129. export const useChatStore = createPersistStore(
  130. DEFAULT_CHAT_STATE,
  131. (set, _get) => {
  /**
   * Returns the current raw store state (`_get()`) merged with `methods`,
   * so actions can read state and call each other through one object.
   * Method entries win over same-named state entries because they are spread last.
   */
  function get() {
    const state = _get();
    return { ...state, ...methods };
  }
  138. const methods = {
  /** Replaces the whole session list with one new empty session and selects it. */
  clearSessions() {
    set(() => {
      const blank = createEmptySession();
      return {
        sessions: [blank],
        currentSessionIndex: 0,
      };
    });
  },
  /**
   * Makes the session at `index` the current one.
   * The index is stored as given; `currentSession()` clamps out-of-range values when read.
   */
  selectSession(index: number) {
    const patch = { currentSessionIndex: index };
    set(patch);
  },
  /**
   * Moves the session at position `from` to position `to` and adjusts
   * `currentSessionIndex` so the same session stays selected.
   *
   * @param from Current position of the session to move.
   * @param to Position the session should end up at.
   */
  moveSession(from: number, to: number) {
    set((state) => {
      const selected = state.currentSessionIndex;

      // reorder on a copy, never on the stored array
      const reordered = state.sessions.slice();
      const moved = reordered[from];
      reordered.splice(from, 1);
      reordered.splice(to, 0, moved);

      // work out where the previously selected session now lives
      let nextSelected: number;
      if (selected === from) {
        // the selected session itself was moved
        nextSelected = to;
      } else if (selected > from && selected <= to) {
        // a session before it moved behind it: everything in between shifts up
        nextSelected = selected - 1;
      } else if (selected < from && selected >= to) {
        // a session behind it moved in front of it: everything in between shifts down
        nextSelected = selected + 1;
      } else {
        nextSelected = selected;
      }

      return {
        currentSessionIndex: nextSelected,
        sessions: reordered,
      };
    });
  },
  /**
   * Creates a session, puts it at the front of the list and selects it.
   *
   * @param mask Optional mask to start from. When given, the session takes the
   *   mask's name as topic and a model config made of the global model config
   *   overridden by the mask's own settings.
   */
  newSession(mask?: Mask) {
    const created = createEmptySession();

    if (mask) {
      const { modelConfig: globalModelConfig } = useAppConfig.getState();
      created.topic = mask.name;
      created.mask = {
        ...mask,
        // mask settings take precedence over the global ones
        modelConfig: { ...globalModelConfig, ...mask.modelConfig },
      };
    }

    set((state) => ({
      currentSessionIndex: 0,
      sessions: [created, ...state.sessions],
    }));
  },
  /**
   * Selects the session `delta` positions away from the current one,
   * wrapping around at both ends of the list.
   *
   * @param delta Signed step; any magnitude is accepted.
   */
  nextSession(delta: number) {
    const { sessions, currentSessionIndex } = get();
    const n = sessions.length;
    // nothing to cycle through (also avoids `% 0`, which would yield NaN)
    if (n === 0) return;

    // true modulo: `(x + n) % n` alone turns negative once delta < -n
    const wrapped = (((currentSessionIndex + delta) % n) + n) % n;
    get().selectSession(wrapped);
  },
  /**
   * Removes the session at `index`, then shows a toast offering to undo.
   *
   * - Does nothing when there is no session at `index`.
   * - When the only session is deleted, a new empty one takes its place.
   * - The toast's action restores the session list and selection as they were
   *   before the deletion.
   *
   * @param index Position of the session to delete.
   */
  deleteSession(index: number) {
    const before = get();
    const previousSessions = before.sessions;
    const previousIndex = before.currentSessionIndex;

    if (!previousSessions.at(index)) return;

    // snapshot for the undo action
    const restoreState = {
      currentSessionIndex: previousIndex,
      sessions: previousSessions.slice(),
    };

    const sessions = previousSessions.slice();
    sessions.splice(index, 1);

    let nextIndex: number;
    if (previousSessions.length === 1) {
      // never leave the list empty
      sessions.push(createEmptySession());
      nextIndex = 0;
    } else {
      // deleting something in front of the selection shifts it one to the left
      const shifted = index < previousIndex ? previousIndex - 1 : previousIndex;
      nextIndex = Math.min(shifted, sessions.length - 1);
    }

    set(() => ({
      currentSessionIndex: nextIndex,
      sessions,
    }));

    showToast(
      Locale.Home.DeleteToast,
      {
        text: Locale.Home.Revert,
        onClick() {
          set(() => restoreState);
        },
      },
      5000,
    );
  },
  /**
   * Returns the currently selected session.
   * If the stored index lies outside the list, it is clamped into range and the
   * corrected value is written back to the store first.
   */
  currentSession() {
    const { currentSessionIndex, sessions } = get();
    let index = currentSessionIndex;

    const outOfRange = index < 0 || index >= sessions.length;
    if (outOfRange) {
      index = Math.min(sessions.length - 1, Math.max(0, index));
      set(() => ({ currentSessionIndex: index }));
    }

    return sessions[index];
  },
  /**
   * Bookkeeping after a message has been completed: refreshes the message array
   * reference and `lastUpdate`, updates the stats with `message`, then triggers
   * `summarizeSession`.
   *
   * The message itself is not appended here; only a copy of the existing array is stored.
   *
   * @param message The message that was just completed.
   */
  onNewMessage(message: ChatMessage) {
    const store = get();

    store.updateCurrentSession((session) => {
      // new array identity, same elements
      session.messages = session.messages.slice();
      session.lastUpdate = Date.now();
    });
    store.updateStat(message);
    store.summarizeSession();
  },
  /**
   * Handles text submitted by the user: stores the user message and a streaming
   * placeholder for the reply in the current session, then sends the request.
   *
   * The request carries the templated text (`fillTemplateWith`), while the
   * session stores the raw `content` the user typed.
   *
   * @param content Raw text entered by the user.
   */
  async onUserInput(content: string) {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;

    const userContent = fillTemplateWith(content, modelConfig);
    console.log("[User Input] after template: ", userContent);

    // message as sent to the model (templated content)
    const userMessage: ChatMessage = createMessage({
      role: "user",
      content: userContent,
    });

    // placeholder that is filled in while the reply streams
    const botMessage: ChatMessage = createMessage({
      role: "assistant",
      streaming: true,
      model: modelConfig.model,
    });

    // message as stored in the session (raw content, same id/date)
    const savedUserMessage: ChatMessage = {
      ...userMessage,
      content,
    };

    // get recent messages
    const recentMessages = get().getMessagesWithMemory();
    const sendMessages = recentMessages.concat(userMessage);

    // save user's and bot's message
    get().updateCurrentSession((session) => {
      session.messages = session.messages.concat([
        savedUserMessage,
        botMessage,
      ]);
    });

    // make request
    api.llm.chat({
      messages: sendMessages,
      config: { ...modelConfig, stream: true },
      onUpdate(message) {
        botMessage.streaming = true;
        if (message) {
          botMessage.content = message;
        }
        // replace the array so the change to botMessage is picked up
        get().updateCurrentSession((session) => {
          session.messages = session.messages.concat();
        });
      },
      onFinish(message) {
        botMessage.streaming = false;
        if (message) {
          botMessage.content = message;
          get().onNewMessage(botMessage);
        }
        ChatControllerPool.remove(session.id, botMessage.id);
      },
      onError(error) {
        const isAborted = error.message.includes("aborted");
        botMessage.content +=
          "\n\n" +
          prettyObject({
            error: true,
            message: error.message,
          });
        botMessage.streaming = false;
        userMessage.isError = !isAborted;
        // The session holds `savedUserMessage` (a copy), so the flag must be set
        // there as well; otherwise the stored user message is never marked as
        // failed and keeps being sent as context.
        savedUserMessage.isError = !isAborted;
        botMessage.isError = !isAborted;
        get().updateCurrentSession((session) => {
          session.messages = session.messages.concat();
        });
        ChatControllerPool.remove(session.id, botMessage.id);

        console.error("[Chat] failed ", error);
      },
      onController(controller) {
        // collect controller for stop/retry
        ChatControllerPool.addController(
          session.id,
          botMessage.id,
          controller,
        );
      },
    });
  },
  /**
   * Wraps the current session's summary into a system message.
   *
   * @returns A `system` message whose content is
   *   `Locale.Store.Prompt.History(memoryPrompt)`, or an empty string when the
   *   session has no summary yet. The message carries an empty `date` and no `id`.
   */
  getMemoryPrompt() {
    const { memoryPrompt } = get().currentSession();
    const content =
      memoryPrompt.length > 0 ? Locale.Store.Prompt.History(memoryPrompt) : "";

    return {
      role: "system",
      content,
      date: "",
    } as ChatMessage;
  },
  /**
   * Assembles the context that accompanies the next request for the current session.
   *
   * The result is the concatenation, in this order, of:
   *   0. the injected system prompt (when `enableInjectSystemPrompts` is on),
   *   1. the long-term memory prompt (summary of older messages),
   *   2. the mask's pre-defined in-context prompts,
   *   3. the most recent messages that fit the window and the token threshold.
   * The newest user input is appended by the caller.
   *
   * @returns The context messages, oldest first.
   */
  getMessagesWithMemory() {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;
    const clearedUpTo = session.clearContextIndex ?? 0;
    const history = session.messages.slice();
    const historyLength = session.messages.length;

    // 2. in-context prompts defined by the mask
    const maskPrompts = session.mask.context.slice();

    // 0. system prompt, to get close to OpenAI Web ChatGPT
    const systemPrompts: ChatMessage[] = [];
    if (modelConfig.enableInjectSystemPrompts) {
      systemPrompts.push(
        createMessage({
          role: "system",
          content: fillTemplateWith("", {
            ...modelConfig,
            template: DEFAULT_SYSTEM_TEMPLATE,
          }),
        }),
      );
      console.log(
        "[Global System Prompt] ",
        systemPrompts.at(0)?.content ?? "empty",
      );
    }

    // 1. long-term memory: only when enabled, non-empty, and produced after
    //    the point where the user cleared the context
    const useSummary =
      modelConfig.sendMemory &&
      session.memoryPrompt &&
      session.memoryPrompt.length > 0 &&
      session.lastSummarizeIndex > clearedUpTo;
    const summaryPrompts = useSummary ? [get().getMemoryPrompt()] : [];

    // 3. short-term memory: the latest `historyMessageCount` messages
    const recentWindowStart = Math.max(
      0,
      historyLength - modelConfig.historyMessageCount,
    );

    // with a summary in play, start from whichever comes first:
    // the end of the summarised range or the recent window
    const memoryStart = useSummary
      ? Math.min(session.lastSummarizeIndex, recentWindowStart)
      : recentWindowStart;

    // messages before a context clear are never sent
    const firstIndex = Math.max(clearedUpTo, memoryStart);

    // walk backwards from the newest message, collecting until the
    // estimated token total reaches the threshold
    const tokenBudget = modelConfig.max_tokens;
    const newestFirst: ChatMessage[] = [];
    let usedTokens = 0;
    let cursor = historyLength - 1;
    while (cursor >= firstIndex && usedTokens < tokenBudget) {
      const candidate = history[cursor];
      cursor -= 1;
      // failed messages are left out of the context
      if (!candidate || candidate.isError) continue;
      usedTokens += estimateTokenLength(candidate.content);
      newestFirst.push(candidate);
    }

    // concat all parts, restoring chronological order for the recent messages
    return [
      ...systemPrompts,
      ...summaryPrompts,
      ...maskPrompts,
      ...newestFirst.reverse(),
    ];
  },
  /**
   * Lets `updater` modify one message in place, then re-publishes the session list.
   *
   * @param sessionIndex Position of the session (negative values count from the end, as with `Array.prototype.at`).
   * @param messageIndex Position of the message within that session (same `at` semantics).
   * @param updater Called with the message, or with `undefined` when either index does not resolve.
   */
  updateMessage(
    sessionIndex: number,
    messageIndex: number,
    updater: (message?: ChatMessage) => void,
  ) {
    const allSessions = get().sessions;
    const target = allSessions.at(sessionIndex)?.messages?.at(messageIndex);

    updater(target);
    set(() => ({ sessions: allSessions }));
  },
  /** Empties the current session: removes all messages and the summary text. */
  resetSession() {
    get().updateCurrentSession((session) => {
      Object.assign(session, { messages: [], memoryPrompt: "" });
    });
  },
  /**
   * Runs the two background summarisation tasks for the current session.
   *
   * 1. Topic: when auto title generation is enabled, the topic is still the
   *    default and the conversation is at least `SUMMARIZE_MIN_LEN` long
   *    (as measured by `countMessages`), the model is asked for a title.
   * 2. Memory: when the messages not yet summarised exceed
   *    `compressMessageLengthThreshold` and `sendMemory` is on, the model is
   *    asked to summarise them; the result is stored in `memoryPrompt` and
   *    `lastSummarizeIndex` is advanced once the request finishes.
   */
  summarizeSession() {
    const config = useAppConfig.getState();
    const session = get().currentSession();
    const messages = session.messages;

    // should summarize topic after chatting more than 50 words
    const SUMMARIZE_MIN_LEN = 50;
    if (
      config.enableAutoGenerateTitle &&
      session.topic === DEFAULT_TOPIC &&
      countMessages(messages) >= SUMMARIZE_MIN_LEN
    ) {
      const topicMessages = messages.concat(
        createMessage({
          role: "user",
          content: Locale.Store.Prompt.Topic,
        }),
      );
      api.llm.chat({
        messages: topicMessages,
        config: {
          model: getSummarizeModel(session.mask.modelConfig.model),
        },
        onFinish(message) {
          get().updateCurrentSession(
            (session) =>
              (session.topic =
                message.length > 0 ? trimTopic(message) : DEFAULT_TOPIC),
          );
        },
      });
    }

    const modelConfig = session.mask.modelConfig;

    // only consider messages after the last summary and after any context clear
    const summarizeIndex = Math.max(
      session.lastSummarizeIndex,
      session.clearContextIndex ?? 0,
    );

    // remove error messages if any
    let toBeSummarizedMsgs = messages
      .filter((msg) => !msg.isError)
      .slice(summarizeIndex);

    const historyMsgLength = countMessages(toBeSummarizedMsgs);

    // The parentheses matter: `a > b ?? 4000` parses as `(a > b) ?? 4000`,
    // which never applies the 4000 default when `max_tokens` is missing.
    if (historyMsgLength > (modelConfig?.max_tokens ?? 4000)) {
      // too long to summarise in full: keep only the latest messages
      const n = toBeSummarizedMsgs.length;
      toBeSummarizedMsgs = toBeSummarizedMsgs.slice(
        Math.max(0, n - modelConfig.historyMessageCount),
      );
    }

    // add memory prompt
    toBeSummarizedMsgs.unshift(get().getMemoryPrompt());

    // remembered now, applied when the summary request finishes
    const lastSummarizeIndex = session.messages.length;

    console.log(
      "[Chat History] ",
      toBeSummarizedMsgs,
      historyMsgLength,
      modelConfig.compressMessageLengthThreshold,
    );

    if (
      historyMsgLength > modelConfig.compressMessageLengthThreshold &&
      modelConfig.sendMemory
    ) {
      api.llm.chat({
        messages: toBeSummarizedMsgs.concat(
          createMessage({
            role: "system",
            content: Locale.Store.Prompt.Summarize,
            date: "",
          }),
        ),
        config: {
          ...modelConfig,
          stream: true,
          model: getSummarizeModel(session.mask.modelConfig.model),
        },
        onUpdate(message) {
          // NOTE(review): writes to the captured session object directly,
          // without going through `set` — confirm this is persisted as intended.
          session.memoryPrompt = message;
        },
        onFinish(message) {
          console.log("[Memory] ", message);
          session.lastSummarizeIndex = lastSummarizeIndex;
        },
        onError(err) {
          console.error("[Summarize] ", err);
        },
      });
    }
  },
  /**
   * Adds the length of `message.content` to the current session's `charCount`.
   *
   * @param message Message whose content length is counted.
   */
  updateStat(message: ChatMessage) {
    const addedChars = message.content.length;
    get().updateCurrentSession((session) => {
      session.stat.charCount += addedChars;
      // TODO: should update chat count and word count
    });
  },
  /**
   * Applies `updater` to the currently selected session (mutating it in place)
   * and then writes the session list back to the store.
   *
   * @param updater Callback that receives the session at `currentSessionIndex`.
   */
  updateCurrentSession(updater: (session: ChatSession) => void) {
    const { sessions, currentSessionIndex } = get();
    updater(sessions[currentSessionIndex]);
    set(() => ({ sessions }));
  },
  /**
   * Clears all of `localStorage` (not only this store's key) and reloads the page.
   */
  clearAllData() {
    // drop every persisted entry
    localStorage.clear();
    // reload the page after the wipe
    location.reload();
  },
  534. };
  535. return methods;
  536. },
  537. {
  538. name: StoreKey.Chat,
  539. version: 3.1,
  /**
   * Upgrades persisted chat state written by an older store version.
   *
   * Steps are cumulative and run from oldest to newest:
   * - `< 2`: rebuild every session from `createEmptySession()`, keeping topic
   *   and messages and setting fixed memory-related model settings.
   * - `< 3`: give every session and message a fresh `nanoid()` id.
   * - `< 3.1`: fill in `enableInjectSystemPrompts` for sessions that lack it,
   *   using the user's current global setting.
   *
   * @param persistedState State as read from storage.
   * @param version Version number stored alongside that state.
   * @returns The migrated state (a deep copy; the input is not modified).
   */
  migrate(persistedState, version) {
    const state = persistedState as any;
    // deep copy via JSON so the persisted object itself stays untouched
    const newState = JSON.parse(
      JSON.stringify(state),
    ) as typeof DEFAULT_CHAT_STATE;

    if (version < 2) {
      newState.sessions = [];

      for (const oldSession of state.sessions) {
        const rebuilt = createEmptySession();
        rebuilt.topic = oldSession.topic;
        rebuilt.messages = [...oldSession.messages];

        const rebuiltConfig = rebuilt.mask.modelConfig;
        rebuiltConfig.sendMemory = true;
        rebuiltConfig.historyMessageCount = 4;
        rebuiltConfig.compressMessageLengthThreshold = 1000;

        newState.sessions.push(rebuilt);
      }
    }

    if (version < 3) {
      // migrate id to nanoid
      for (const s of newState.sessions) {
        s.id = nanoid();
        for (const m of s.messages) {
          m.id = nanoid();
        }
      }
    }

    // Enable `enableInjectSystemPrompts` attribute for old sessions.
    // Resolve issue of old sessions not automatically enabling.
    if (version < 3.1) {
      for (const s of newState.sessions) {
        const alreadySet = Object.prototype.hasOwnProperty.call(
          s.mask.modelConfig,
          "enableInjectSystemPrompts",
        );
        // Exclude those already set by user
        if (alreadySet) continue;

        // Because users may have changed this configuration,
        // the user's current configuration is used instead of the default
        const config = useAppConfig.getState();
        s.mask.modelConfig.enableInjectSystemPrompts =
          config.modelConfig.enableInjectSystemPrompts;
      }
    }

    return newState as any;
  },
  583. },
  584. );