chat.ts 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673
  1. import { trimTopic } from "../utils";
  2. import Locale, { getLang } from "../locales";
  3. import { showToast } from "../components/ui-lib";
  4. import { ModelConfig, ModelType, useAppConfig } from "./config";
  5. import { createEmptyMask, Mask } from "./mask";
  6. import {
  7. DEFAULT_INPUT_TEMPLATE,
  8. DEFAULT_MODELS,
  9. DEFAULT_SYSTEM_TEMPLATE,
  10. KnowledgeCutOffDate,
  11. ModelProvider,
  12. StoreKey,
  13. SUMMARIZE_MODEL,
  14. } from "../constant";
  15. import { ClientApi, RequestMessage } from "../client/api";
  16. import { ChatControllerPool } from "../client/controller";
  17. import { prettyObject } from "../utils/format";
  18. import { estimateTokenLength } from "../utils/token";
  19. import { nanoid } from "nanoid";
  20. import { createPersistStore } from "../utils/store";
  /**
   * One entry in a chat transcript: the request-level `RequestMessage`
   * extended with the bookkeeping fields this store attaches to it.
   */
  export type ChatMessage = RequestMessage & {
    /** Unique identifier; `createMessage` fills it with `nanoid()`. */
    id: string;
    /** Timestamp text; `createMessage` uses `new Date().toLocaleString()`. */
    date: string;
    /** Model recorded on the message (set on assistant replies in `onUserInput`). */
    model?: ModelType;
    /** True while the reply is still being streamed. */
    streaming?: boolean;
    /** Marks a failed exchange; flagged messages are skipped when context is built. */
    isError?: boolean;
  };
  /**
   * Builds a `ChatMessage` from defaults (fresh id, current local time,
   * role "user", empty content) and then applies `override` on top.
   *
   * @param override Fields that replace the defaults.
   * @returns The merged message.
   */
  export function createMessage(override: Partial<ChatMessage>): ChatMessage {
    const defaults = {
      id: nanoid(),
      date: new Date().toLocaleString(),
      role: "user",
      content: "",
    };
    // Later spread wins, so anything present in `override` replaces a default.
    return { ...defaults, ...override } as ChatMessage;
  }
  /**
   * Per-session counters. Within this file only `charCount` is ever
   * incremented (see `updateStat`); the other two start at 0 and stay there.
   */
  export interface ChatStat {
    /** Accumulated length of message contents passed to `updateStat`. */
    charCount: number;
    /** Word counter (not updated in this file). */
    wordCount: number;
    /** Token counter (not updated in this file). */
    tokenCount: number;
  }
  /** A single conversation together with its summary state and mask. */
  export interface ChatSession {
    /** Unique identifier (a `nanoid()` for sessions created here). */
    id: string;
    /** Display title; starts as `DEFAULT_TOPIC`. */
    topic: string;
    /** Mask (preset) applied to the session, including its model config. */
    mask: Mask;

    /** Transcript, oldest message first. */
    messages: ChatMessage[];
    /** Running counters for the session. */
    stat: ChatStat;
    /** `Date.now()` value of the last recorded update. */
    lastUpdate: number;

    /** Summary text written by `summarizeSession`; empty when none exists. */
    memoryPrompt: string;
    /** `messages.length` captured when the last summary was requested. */
    lastSummarizeIndex: number;
    /** When set, messages before this index are left out of the context. */
    clearContextIndex?: number;
  }
  /** Title carried by a session until it is given another one. */
  export const DEFAULT_TOPIC = Locale.Store.DefaultTopic;

  /** Assistant greeting message built from the locale's hello text. */
  export const BOT_HELLO: ChatMessage = createMessage({
    content: Locale.Store.BotHello,
    role: "assistant",
  });
  /**
   * Creates a blank session: new id, default topic, no messages, zeroed
   * counters, no summary, and an empty mask.
   */
  function createEmptySession(): ChatSession {
    const zeroStat: ChatStat = { tokenCount: 0, wordCount: 0, charCount: 0 };

    const blank: ChatSession = {
      id: nanoid(),
      topic: DEFAULT_TOPIC,
      memoryPrompt: "",
      messages: [],
      stat: zeroStat,
      lastUpdate: Date.now(),
      lastSummarizeIndex: 0,
      mask: createEmptyMask(),
    };
    return blank;
  }
  /**
   * Picks the model used for summarizing: any model whose name starts with
   * "gpt" is replaced by `SUMMARIZE_MODEL`; every other model is used as-is.
   */
  function getSummarizeModel(currentModel: string) {
    if (currentModel.startsWith("gpt")) {
      return SUMMARIZE_MODEL;
    }
    return currentModel;
  }
  /**
   * Sums `estimateTokenLength(content)` over the given messages.
   *
   * @returns The total estimate, or 0 for an empty list.
   */
  function countMessages(msgs: ChatMessage[]) {
    let total = 0;
    msgs.forEach((msg) => {
      total += estimateTokenLength(msg.content);
    });
    return total;
  }
  /**
   * Expands the `{{name}}` placeholders of the model's input template.
   *
   * Supported placeholders: `ServiceProvider`, `cutoff`, `model`, `time`,
   * `lang` and `input`. If the template has no `{{input}}` placeholder, one
   * is appended on a new line so the user's text is never dropped.
   *
   * @param input Text substituted for `{{input}}`.
   * @param modelConfig Supplies the model name and, optionally, the template
   *   (falls back to `DEFAULT_INPUT_TEMPLATE`).
   * @returns The template with every known placeholder replaced.
   * @throws Error when `modelConfig.model` is not listed in `DEFAULT_MODELS`.
   */
  function fillTemplateWith(input: string, modelConfig: ModelConfig) {
    const cutoff =
      KnowledgeCutOffDate[modelConfig.model] ?? KnowledgeCutOffDate.default;

    // The provider name comes from the matching DEFAULT_MODELS entry.
    const modelInfo = DEFAULT_MODELS.find((m) => m.name === modelConfig.model);
    if (!modelInfo) {
      throw new Error(`Model ${modelConfig.model} not found in DEFAULT_MODELS array.`);
    }

    const vars = {
      ServiceProvider: modelInfo.provider.providerName,
      cutoff,
      model: modelConfig.model,
      time: new Date().toLocaleString(),
      lang: getLang(),
      input,
    };

    let output = modelConfig.template ?? DEFAULT_INPUT_TEMPLATE;

    // must contain {{input}}
    const inputVar = "{{input}}";
    if (!output.includes(inputVar)) {
      output += "\n" + inputVar;
    }

    for (const [name, value] of Object.entries(vars)) {
      const placeholder = new RegExp(`{{${name}}}`, "g");
      // A function replacer inserts the value verbatim. A plain string
      // replacement would interpret `$$`, `$&`, `$1`... inside the value,
      // silently corrupting user input that contains a dollar sign.
      output = output.replace(placeholder, () => String(value));
    }

    return output;
  }
  /** Initial store contents: a single blank session, which is selected. */
  const DEFAULT_CHAT_STATE: {
    sessions: ChatSession[];
    currentSessionIndex: number;
  } = {
    sessions: [createEmptySession()],
    currentSessionIndex: 0,
  };
  114. export const useChatStore = createPersistStore(
  115. DEFAULT_CHAT_STATE,
  116. (set, _get) => {
  /**
   * Returns the current persisted state merged with `methods`, so that
   * store methods can read state and call one another through one object.
   */
  function get() {
    const state = _get();
    return { ...state, ...methods };
  }
  123. const methods = {
  /** Replaces all sessions with one blank session and selects it. */
  clearSessions() {
    set(() => {
      const onlySession = createEmptySession();
      return { sessions: [onlySession], currentSessionIndex: 0 };
    });
  },
  /** Makes the session at `index` the current one (no range check here). */
  selectSession(index: number) {
    const currentSessionIndex = index;
    set({ currentSessionIndex });
  },
  /**
   * Moves the session at position `from` to position `to` and adjusts the
   * current-session index so it keeps pointing at the same session.
   */
  moveSession(from: number, to: number) {
    set((state) => {
      const current = state.currentSessionIndex;

      // Reorder on a copy: take the session out, then insert it at `to`.
      const reordered = state.sessions.slice();
      const moved = reordered[from];
      reordered.splice(from, 1);
      reordered.splice(to, 0, moved);

      let nextCurrent: number;
      if (current === from) {
        // the selected session is the one being moved
        nextCurrent = to;
      } else if (current > from && current <= to) {
        // moved from before the selection to at/after it: selection shifts up
        nextCurrent = current - 1;
      } else if (current < from && current >= to) {
        // moved from after the selection to at/before it: selection shifts down
        nextCurrent = current + 1;
      } else {
        nextCurrent = current;
      }

      return {
        currentSessionIndex: nextCurrent,
        sessions: reordered,
      };
    });
  },
  /**
   * Creates a session, puts it at the front of the list and selects it.
   *
   * @param mask Optional mask. When given, the session takes the mask's
   *   name as its topic and uses the mask with its model config layered
   *   over the global model config.
   */
  newSession(mask?: Mask) {
    const session = createEmptySession();

    if (mask) {
      const { modelConfig: globalModelConfig } = useAppConfig.getState();
      // mask-specific settings override the global ones
      const mergedModelConfig = { ...globalModelConfig, ...mask.modelConfig };
      session.mask = { ...mask, modelConfig: mergedModelConfig };
      session.topic = mask.name;
    }

    set((state) => ({
      currentSessionIndex: 0,
      sessions: [session, ...state.sessions],
    }));
  },
  /**
   * Selects the session `delta` positions away from the current one,
   * wrapping around both ends of the list.
   *
   * @param delta Signed step; any magnitude is accepted.
   */
  nextSession(delta: number) {
    const n = get().sessions.length;
    // Nothing to select; also avoids `% 0`, which yields NaN.
    if (n === 0) return;

    const i = get().currentSessionIndex;
    // `%` keeps the sign of the dividend in JavaScript, so normalise twice
    // to stay in [0, n) even when `i + delta` is below `-n`.
    const wrap = (x: number) => ((x % n) + n) % n;
    get().selectSession(wrap(i + delta));
  },
  /**
   * Removes the session at `index`, then shows a toast whose action
   * restores the state as it was before the deletion.
   *
   * Does nothing when no session exists at `index`. When the only session
   * is deleted, a blank one takes its place.
   */
  deleteSession(index: number) {
    const { sessions: previousSessions, currentSessionIndex: currentIndex } =
      get();

    if (!previousSessions.at(index)) return;

    const wasOnlySession = previousSessions.length === 1;

    const sessions = previousSessions.slice();
    sessions.splice(index, 1);

    // Deleting an earlier session shifts the current one down by one;
    // the result is then capped at the last remaining position.
    const shift = index < currentIndex ? 1 : 0;
    let nextIndex = Math.min(currentIndex - shift, sessions.length - 1);

    if (wasOnlySession) {
      nextIndex = 0;
      sessions.push(createEmptySession());
    }

    // for undo delete action
    const restoreState = {
      currentSessionIndex: currentIndex,
      sessions: previousSessions.slice(),
    };

    set(() => ({
      currentSessionIndex: nextIndex,
      sessions,
    }));

    const revertAction = {
      text: Locale.Home.Revert,
      onClick() {
        set(() => restoreState);
      },
    };
    // third argument is passed through to showToast unchanged
    // (presumably the display time in ms, to be confirmed in ui-lib)
    showToast(Locale.Home.DeleteToast, revertAction, 5000);
  },
  /**
   * Returns the currently selected session. If the stored index lies
   * outside the list, it is clamped into range and written back first.
   */
  currentSession() {
    const snapshot = get();
    const sessions = snapshot.sessions;
    let index = snapshot.currentSessionIndex;

    const outOfRange = index < 0 || index >= sessions.length;
    if (outOfRange) {
      index = Math.min(sessions.length - 1, Math.max(0, index));
      set(() => ({ currentSessionIndex: index }));
    }

    return sessions[index];
  },
  /**
   * Bookkeeping after a message has been completed: refreshes the current
   * session's message array reference and timestamp, updates the stats with
   * `message`, then triggers summarization.
   */
  onNewMessage(message: ChatMessage) {
    const touch = (session: ChatSession) => {
      // a new array reference with the same items
      session.messages = session.messages.concat();
      session.lastUpdate = Date.now();
    };

    get().updateCurrentSession(touch);
    get().updateStat(message);
    get().summarizeSession();
  },
  /**
   * Handles a message typed by the user: stores it together with a
   * placeholder assistant message, sends the conversation context to the
   * model, and streams the reply into the placeholder.
   *
   * @param content Raw text typed by the user. The templated version is
   *   sent to the model; the raw version is what gets stored.
   */
  async onUserInput(content: string) {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;

    const userContent = fillTemplateWith(content, modelConfig);
    console.log("[User Input] after template: ", userContent);

    const userMessage: ChatMessage = createMessage({
      role: "user",
      content: userContent,
    });

    const botMessage: ChatMessage = createMessage({
      role: "assistant",
      streaming: true,
      model: modelConfig.model,
    });

    // The stored copy keeps the raw input. It is held in a variable so the
    // error handler below can flag the object that actually lives in the
    // session, not just the request-side `userMessage`.
    const savedUserMessage: ChatMessage = {
      ...userMessage,
      content,
    };

    // get recent messages
    const recentMessages = get().getMessagesWithMemory();
    const sendMessages = recentMessages.concat(userMessage);

    // save user's and bot's message
    get().updateCurrentSession((session) => {
      session.messages = session.messages.concat([
        savedUserMessage,
        botMessage,
      ]);
    });

    const api = new ClientApi(
      modelConfig.model === "gemini-pro"
        ? ModelProvider.GeminiPro
        : ModelProvider.GPT,
    );

    // make request
    api.llm.chat({
      messages: sendMessages,
      config: { ...modelConfig, stream: true },
      onUpdate(message) {
        botMessage.streaming = true;
        if (message) {
          botMessage.content = message;
        }
        // new array reference for the (mutated in place) bot message
        get().updateCurrentSession((session) => {
          session.messages = session.messages.concat();
        });
      },
      onFinish(message) {
        botMessage.streaming = false;
        if (message) {
          botMessage.content = message;
          get().onNewMessage(botMessage);
        }
        ChatControllerPool.remove(session.id, botMessage.id);
      },
      onError(error) {
        const isAborted = error.message.includes("aborted");
        botMessage.content +=
          "\n\n" +
          prettyObject({
            error: true,
            message: error.message,
          });
        botMessage.streaming = false;

        // An abort is not treated as a failure. Otherwise flag both sides
        // of the exchange, including the stored copy of the user message.
        userMessage.isError = !isAborted;
        savedUserMessage.isError = !isAborted;
        botMessage.isError = !isAborted;

        get().updateCurrentSession((session) => {
          session.messages = session.messages.concat();
        });
        ChatControllerPool.remove(session.id, botMessage.id);

        console.error("[Chat] failed ", error);
      },
      onController(controller) {
        // collect controller for stop/retry
        ChatControllerPool.addController(
          session.id,
          botMessage.id,
          controller,
        );
      },
    });
  },
  /**
   * Wraps the current session's summary in a system message.
   *
   * @returns A system message whose content is the locale's history prompt
   *   built from `memoryPrompt`, or an empty string when there is no summary.
   */
  getMemoryPrompt() {
    const { memoryPrompt } = get().currentSession();

    let content = "";
    if (memoryPrompt.length > 0) {
      content = Locale.Store.Prompt.History(memoryPrompt);
    }

    return {
      role: "system",
      content,
      date: "",
    } as ChatMessage;
  },
  /**
   * Assembles the context sent to the model for the current session.
   *
   * The result is the concatenation, in this order, of:
   *   0. an injected system prompt (only for "gpt-" models with
   *      `enableInjectSystemPrompts` on),
   *   1. the long-term memory (summary) prompt, when applicable,
   *   2. the mask's predefined in-context prompts,
   *   3. the most recent non-error messages, oldest first.
   * The newest user input is appended by the caller.
   */
  getMessagesWithMemory() {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;
    const clearContextIndex = session.clearContextIndex ?? 0;
    const messages = session.messages.slice();
    const totalMessageCount = session.messages.length;

    // in-context prompts
    const contextPrompts = session.mask.context.slice();

    // system prompts, to get close to OpenAI Web ChatGPT
    const shouldInjectSystemPrompts =
      modelConfig.enableInjectSystemPrompts &&
      session.mask.modelConfig.model.startsWith("gpt-");

    const systemPrompts: ChatMessage[] = [];
    if (shouldInjectSystemPrompts) {
      const systemContent = fillTemplateWith("", {
        ...modelConfig,
        template: DEFAULT_SYSTEM_TEMPLATE,
      });
      systemPrompts.push(
        createMessage({ role: "system", content: systemContent }),
      );
      console.log(
        "[Global System Prompt] ",
        systemPrompts.at(0)?.content ?? "empty",
      );
    }

    // long term memory: only when enabled, a summary exists, and the
    // summary covers messages after the clear-context marker
    const shouldSendLongTermMemory =
      modelConfig.sendMemory &&
      session.memoryPrompt &&
      session.memoryPrompt.length > 0 &&
      session.lastSummarizeIndex > clearContextIndex;
    const longTermMemoryPrompts = shouldSendLongTermMemory
      ? [get().getMemoryPrompt()]
      : [];

    // short term memory: the latest `historyMessageCount` messages
    const shortTermMemoryStartIndex = Math.max(
      0,
      totalMessageCount - modelConfig.historyMessageCount,
    );

    let memoryStartIndex = shortTermMemoryStartIndex;
    if (shouldSendLongTermMemory) {
      memoryStartIndex = Math.min(
        session.lastSummarizeIndex,
        shortTermMemoryStartIndex,
      );
    }

    // and if user has cleared history messages, we should exclude the memory too.
    const contextStartIndex = Math.max(clearContextIndex, memoryStartIndex);
    const maxTokenThreshold = modelConfig.max_tokens;

    // Walk backwards from the newest message, collecting until the start
    // index is passed or the estimated token total reaches the threshold.
    const newestFirst = [];
    let tokenCount = 0;
    let cursor = totalMessageCount - 1;
    while (cursor >= contextStartIndex && tokenCount < maxTokenThreshold) {
      const msg = messages[cursor];
      cursor -= 1;
      if (!msg || msg.isError) continue;
      tokenCount += estimateTokenLength(msg.content);
      newestFirst.push(msg);
    }

    // concat all messages
    return [
      ...systemPrompts,
      ...longTermMemoryPrompts,
      ...contextPrompts,
      ...newestFirst.reverse(),
    ];
  },
  /**
   * Runs `updater` on one message and then publishes the sessions array.
   *
   * @param sessionIndex Position of the session (looked up with `.at`).
   * @param messageIndex Position of the message (looked up with `.at`).
   * @param updater Receives the message, or `undefined` when either lookup
   *   finds nothing.
   */
  updateMessage(
    sessionIndex: number,
    messageIndex: number,
    updater: (message?: ChatMessage) => void,
  ) {
    const { sessions } = get();
    const target = sessions.at(sessionIndex)?.messages?.at(messageIndex);
    updater(target);
    set(() => ({ sessions }));
  },
  /** Empties the current session's messages and clears its summary. */
  resetSession() {
    const wipe = (session: ChatSession) => {
      session.messages = [];
      session.memoryPrompt = "";
    };
    get().updateCurrentSession(wipe);
  },
  /**
   * Post-message housekeeping for the current session:
   *   1. asks the model for a title while the session still has the default
   *      topic, auto-titling is enabled and enough text has accumulated;
   *   2. asks the model to compress not-yet-summarized history into
   *      `memoryPrompt` once it exceeds the configured threshold and
   *      `sendMemory` is on.
   */
  summarizeSession() {
    const config = useAppConfig.getState();
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;

    const api = new ClientApi(
      modelConfig.model === "gemini-pro"
        ? ModelProvider.GeminiPro
        : ModelProvider.GPT,
    );

    const messages = session.messages;

    // Minimum estimated length (per `countMessages`) before a title is
    // requested.
    const SUMMARIZE_MIN_LEN = 50;
    if (
      config.enableAutoGenerateTitle &&
      session.topic === DEFAULT_TOPIC &&
      countMessages(messages) >= SUMMARIZE_MIN_LEN
    ) {
      const topicMessages = messages.concat(
        createMessage({
          role: "user",
          content: Locale.Store.Prompt.Topic,
        }),
      );
      api.llm.chat({
        messages: topicMessages,
        config: {
          model: getSummarizeModel(session.mask.modelConfig.model),
        },
        onFinish(message) {
          get().updateCurrentSession(
            (session) =>
              (session.topic =
                message.length > 0 ? trimTopic(message) : DEFAULT_TOPIC),
          );
        },
      });
    }

    const summarizeIndex = Math.max(
      session.lastSummarizeIndex,
      session.clearContextIndex ?? 0,
    );
    // `summarizeIndex` is a position in the full message list, so slice
    // first and drop error messages afterwards. Filtering first would shift
    // positions and could skip messages that still need summarizing.
    let toBeSummarizedMsgs = messages
      .slice(summarizeIndex)
      .filter((msg) => !msg.isError);

    const historyMsgLength = countMessages(toBeSummarizedMsgs);

    // Parenthesised on purpose: `a > b ?? c` parses as `(a > b) ?? c`,
    // which would make the 4000 fallback unreachable.
    if (historyMsgLength > (modelConfig?.max_tokens ?? 4000)) {
      const n = toBeSummarizedMsgs.length;
      toBeSummarizedMsgs = toBeSummarizedMsgs.slice(
        Math.max(0, n - modelConfig.historyMessageCount),
      );
    }

    // add memory prompt
    toBeSummarizedMsgs.unshift(get().getMemoryPrompt());

    const lastSummarizeIndex = session.messages.length;

    console.log(
      "[Chat History] ",
      toBeSummarizedMsgs,
      historyMsgLength,
      modelConfig.compressMessageLengthThreshold,
    );

    if (
      historyMsgLength > modelConfig.compressMessageLengthThreshold &&
      modelConfig.sendMemory
    ) {
      api.llm.chat({
        messages: toBeSummarizedMsgs.concat(
          createMessage({
            role: "system",
            content: Locale.Store.Prompt.Summarize,
            date: "",
          }),
        ),
        config: {
          ...modelConfig,
          stream: true,
          model: getSummarizeModel(session.mask.modelConfig.model),
        },
        onUpdate(message) {
          // written straight onto the captured session object while streaming
          session.memoryPrompt = message;
        },
        onFinish(message) {
          console.log("[Memory] ", message);
          get().updateCurrentSession((session) => {
            session.lastSummarizeIndex = lastSummarizeIndex;
            // go through the store so the final summary is persisted
            session.memoryPrompt = message;
          });
        },
        onError(err) {
          console.error("[Summarize] ", err);
        },
      });
    }
  },
  /** Adds the length of `message.content` to the current session's `charCount`. */
  updateStat(message: ChatMessage) {
    const addedChars = message.content.length;
    get().updateCurrentSession((session) => {
      session.stat.charCount += addedChars;
      // TODO: should update chat count and word count
    });
  },
  /**
   * Lets `updater` mutate the current session in place, then publishes the
   * sessions array through `set`.
   *
   * @param updater Receives `sessions[currentSessionIndex]`.
   */
  updateCurrentSession(updater: (session: ChatSession) => void) {
    const { sessions, currentSessionIndex } = get();
    updater(sessions[currentSessionIndex]);
    set(() => ({ sessions }));
  },
  /** Clears everything in `localStorage`, then reloads the page. */
  clearAllData() {
    const storage = localStorage;
    storage.clear();
    location.reload();
  },
  537. };
  538. return methods;
  539. },
  540. {
  541. name: StoreKey.Chat,
  542. version: 3.1,
  /**
   * Upgrades persisted state from an older store version.
   *
   * Works on a JSON deep copy of the input and applies, in order:
   *   - before v2: rebuild every session from a blank one, keeping only
   *     topic and messages, with fixed memory settings;
   *   - before v3: assign fresh nanoid ids to sessions and messages;
   *   - before v3.1: fill in `enableInjectSystemPrompts` where missing.
   *
   * @param persistedState State as read from storage.
   * @param version Version number the state was saved with.
   * @returns The migrated state.
   */
  migrate(persistedState, version) {
    const state = persistedState as any;
    const newState = JSON.parse(
      JSON.stringify(state),
    ) as typeof DEFAULT_CHAT_STATE;

    if (version < 2) {
      newState.sessions = [];
      for (const oldSession of state.sessions) {
        const rebuilt = createEmptySession();
        rebuilt.topic = oldSession.topic;
        rebuilt.messages = [...oldSession.messages];

        const rebuiltConfig = rebuilt.mask.modelConfig;
        rebuiltConfig.sendMemory = true;
        rebuiltConfig.historyMessageCount = 4;
        rebuiltConfig.compressMessageLengthThreshold = 1000;

        newState.sessions.push(rebuilt);
      }
    }

    if (version < 3) {
      // migrate id to nanoid
      for (const s of newState.sessions) {
        s.id = nanoid();
        for (const m of s.messages) {
          m.id = nanoid();
        }
      }
    }

    // Enable `enableInjectSystemPrompts` attribute for old sessions.
    // Resolve issue of old sessions not automatically enabling.
    if (version < 3.1) {
      for (const s of newState.sessions) {
        // Sessions where the user already set the flag are left alone.
        const alreadySet = s.mask.modelConfig.hasOwnProperty(
          "enableInjectSystemPrompts",
        );
        if (alreadySet) continue;

        // Because users may have changed this configuration,
        // the user's current configuration is used instead of the default.
        const config = useAppConfig.getState();
        s.mask.modelConfig.enableInjectSystemPrompts =
          config.modelConfig.enableInjectSystemPrompts;
      }
    }

    return newState as any;
  },
  586. },
  587. );