import { trimTopic, getMessageTextContent, isDalle3 } from "../utils";
import Locale, { getLang } from "../locales";
import { showToast } from "../components/ui-lib";
import { ModelConfig, ModelType, useAppConfig } from "./config";
import { createEmptyMask, Mask } from "./mask";
import {
  DEFAULT_INPUT_TEMPLATE,
  DEFAULT_MODELS,
  DEFAULT_SYSTEM_TEMPLATE,
  KnowledgeCutOffDate,
  StoreKey,
  SUMMARIZE_MODEL,
  GEMINI_SUMMARIZE_MODEL,
} from "../constant";
import { getClientApi } from "../client/api";
import type {
  ClientApi,
  RequestMessage,
  MultimodalContent,
} from "../client/api";
import { ChatControllerPool } from "../client/controller";
import { prettyObject } from "../utils/format";
import { estimateTokenLength } from "../utils/token";
import { nanoid } from "nanoid";
import { createPersistStore } from "../utils/store";
import { collectModelsWithDefaultModel } from "../utils/model";
import { useAccessStore } from "./access";

export type ChatMessage = RequestMessage & {
  date: string;
  streaming?: boolean;
  isError?: boolean;
  id: string;
  model?: ModelType;
};

export function createMessage(override: Partial<ChatMessage>): ChatMessage {
  return {
    id: nanoid(),
    date: new Date().toLocaleString(),
    role: "user",
    content: "",
    ...override,
  };
}

export interface ChatStat {
  tokenCount: number;
  wordCount: number;
  charCount: number;
}

export interface ChatSession {
  id: string;
  topic: string;
  memoryPrompt: string;
  messages: ChatMessage[];
  stat: ChatStat;
  lastUpdate: number;
  lastSummarizeIndex: number;
  clearContextIndex?: number;
  mask: Mask;
}

export const DEFAULT_TOPIC = Locale.Store.DefaultTopic;
export const BOT_HELLO: ChatMessage = createMessage({
  role: "assistant",
  content: Locale.Store.BotHello,
});

function createEmptySession(): ChatSession {
  return {
    id: nanoid(),
    topic: DEFAULT_TOPIC,
    memoryPrompt: "",
    messages: [],
    stat: {
      tokenCount: 0,
      wordCount: 0,
      charCount: 0,
    },
    lastUpdate: Date.now(),
    lastSummarizeIndex: 0,
    mask: createEmptyMask(),
  };
}
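
// Chooses the model used for auto-titling and memory compression:
// gpt-* models fall back to SUMMARIZE_MODEL when it is available in the
// merged model list, gemini-* models to GEMINI_SUMMARIZE_MODEL, and any
// other model summarizes with itself.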
function getSummarizeModel(currentModel: string) {
  // if a gpt-* model is in use, force 4o-mini (SUMMARIZE_MODEL) to summarize
  if (currentModel.startsWith("gpt")) {
    const configStore = useAppConfig.getState();
    const accessStore = useAccessStore.getState();
    const allModel = collectModelsWithDefaultModel(
      configStore.models,
      [configStore.customModels, accessStore.customModels].join(","),
      accessStore.defaultModel,
    );
    const summarizeModel = allModel.find(
      (m) => m.name === SUMMARIZE_MODEL && m.available,
    );
    return summarizeModel?.name ?? currentModel;
  }
  if (currentModel.startsWith("gemini")) {
    return GEMINI_SUMMARIZE_MODEL;
  }
  return currentModel;
}

function countMessages(msgs: ChatMessage[]) {
  return msgs.reduce(
    (pre, cur) => pre + estimateTokenLength(getMessageTextContent(cur)),
    0,
  );
}
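
// Illustrative sketch (the template string below is not from the source):
// given the vars built inside fillTemplateWith, a template such as
//   "You are {{model}} by {{ServiceProvider}}, cutoff {{cutoff}}.\n{{input}}"
// has each {{name}} placeholder replaced, so {{model}} becomes e.g. "gpt-4o"
// and {{input}} becomes the user's message.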
function fillTemplateWith(input: string, modelConfig: ModelConfig) {
  const cutoff =
    KnowledgeCutOffDate[modelConfig.model] ?? KnowledgeCutOffDate.default;
  // Find the model in the DEFAULT_MODELS array that matches modelConfig.model
  const modelInfo = DEFAULT_MODELS.find((m) => m.name === modelConfig.model);

  let serviceProvider = "OpenAI";
  if (modelInfo) {
    // TODO: auto detect the providerName from modelConfig.model
    // Directly use the providerName from the modelInfo
    serviceProvider = modelInfo.provider.providerName;
  }

  const vars = {
    ServiceProvider: serviceProvider,
    cutoff,
    model: modelConfig.model,
    time: new Date().toString(),
    lang: getLang(),
    input: input,
  };

  let output = modelConfig.template ?? DEFAULT_INPUT_TEMPLATE;

  // drop the template when the input already starts with it, to avoid duplication
  if (input.startsWith(output)) {
    output = "";
  }

  // the output must contain the {{input}} placeholder
  const inputVar = "{{input}}";
  if (!output.includes(inputVar)) {
    output += "\n" + inputVar;
  }

  Object.entries(vars).forEach(([name, value]) => {
    const regex = new RegExp(`{{${name}}}`, "g");
    output = output.replace(regex, value.toString()); // ensure value is a string
  });

  return output;
}

const DEFAULT_CHAT_STATE = {
  sessions: [createEmptySession()],
  currentSessionIndex: 0,
};

export const useChatStore = createPersistStore(
  DEFAULT_CHAT_STATE,
  (set, _get) => {
    function get() {
      return {
        ..._get(),
        ...methods,
      };
    }

    const methods = {
      clearSessions() {
        set(() => ({
          sessions: [createEmptySession()],
          currentSessionIndex: 0,
        }));
      },

      selectSession(index: number) {
        set({
          currentSessionIndex: index,
        });
      },

      moveSession(from: number, to: number) {
        set((state) => {
          const { sessions, currentSessionIndex: oldIndex } = state;

          // move the session
          const newSessions = [...sessions];
          const session = newSessions[from];
          newSessions.splice(from, 1);
          newSessions.splice(to, 0, session);

          // adjust the current session index so the same session stays selected
          let newIndex = oldIndex === from ? to : oldIndex;
          if (oldIndex > from && oldIndex <= to) {
            newIndex -= 1;
          } else if (oldIndex < from && oldIndex >= to) {
            newIndex += 1;
          }

          return {
            currentSessionIndex: newIndex,
            sessions: newSessions,
          };
        });
      },
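
      // A session created from a mask inherits the global model config,
      // with the mask's own modelConfig overriding it.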
      newSession(mask?: Mask) {
        const session = createEmptySession();

        if (mask) {
          const config = useAppConfig.getState();
          const globalModelConfig = config.modelConfig;

          session.mask = {
            ...mask,
            modelConfig: {
              ...globalModelConfig,
              ...mask.modelConfig,
            },
          };
          session.topic = mask.name;
        }

        set((state) => ({
          currentSessionIndex: 0,
          sessions: [session].concat(state.sessions),
        }));
      },

      nextSession(delta: number) {
        const n = get().sessions.length;
        const limit = (x: number) => (x + n) % n;
        const i = get().currentSessionIndex;
        get().selectSession(limit(i + delta));
      },

      deleteSession(index: number) {
        const deletingLastSession = get().sessions.length === 1;
        const deletedSession = get().sessions.at(index);

        if (!deletedSession) return;

        const sessions = get().sessions.slice();
        sessions.splice(index, 1);

        const currentIndex = get().currentSessionIndex;
        let nextIndex = Math.min(
          currentIndex - Number(index < currentIndex),
          sessions.length - 1,
        );

        if (deletingLastSession) {
          nextIndex = 0;
          sessions.push(createEmptySession());
        }

        // for undo delete action
        const restoreState = {
          currentSessionIndex: get().currentSessionIndex,
          sessions: get().sessions.slice(),
        };

        set(() => ({
          currentSessionIndex: nextIndex,
          sessions,
        }));

        showToast(
          Locale.Home.DeleteToast,
          {
            text: Locale.Home.Revert,
            onClick() {
              set(() => restoreState);
            },
          },
          5000,
        );
      },
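
      // Clamps an out-of-range index back into bounds and persists the
      // correction, so a stale persisted index self-heals.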
      currentSession() {
        let index = get().currentSessionIndex;
        const sessions = get().sessions;

        if (index < 0 || index >= sessions.length) {
          index = Math.min(sessions.length - 1, Math.max(0, index));
          set(() => ({ currentSessionIndex: index }));
        }

        const session = sessions[index];
        return session;
      },

      onNewMessage(message: ChatMessage) {
        get().updateCurrentSession((session) => {
          session.messages = session.messages.concat();
          session.lastUpdate = Date.now();
        });
        get().updateStat(message);
        get().summarizeSession();
      },
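
      // Sends one user turn: fills the input template, attaches any images as
      // multimodal content, appends the user and (streaming) bot messages to
      // the session, and wires the streaming callbacks to the client API.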
      async onUserInput(content: string, attachImages?: string[]) {
        const session = get().currentSession();
        const modelConfig = session.mask.modelConfig;

        const userContent = fillTemplateWith(content, modelConfig);
        console.log("[User Input] after template: ", userContent);

        let mContent: string | MultimodalContent[] = userContent;

        if (attachImages && attachImages.length > 0) {
          mContent = [
            {
              type: "text",
              text: userContent,
            },
          ];
          mContent = mContent.concat(
            attachImages.map((url) => {
              return {
                type: "image_url",
                image_url: {
                  url: url,
                },
              };
            }),
          );
        }

        const userMessage: ChatMessage = createMessage({
          role: "user",
          content: mContent,
        });

        const botMessage: ChatMessage = createMessage({
          role: "assistant",
          streaming: true,
          model: modelConfig.model,
        });

        // get recent messages
        const recentMessages = get().getMessagesWithMemory();
        const sendMessages = recentMessages.concat(userMessage);
        const messageIndex = get().currentSession().messages.length + 1;

        // save user's and bot's message
        get().updateCurrentSession((session) => {
          const savedUserMessage = {
            ...userMessage,
            content: mContent,
          };
          session.messages = session.messages.concat([
            savedUserMessage,
            botMessage,
          ]);
        });

        const api: ClientApi = getClientApi(modelConfig.providerName);

        // make request
        api.llm.chat({
          messages: sendMessages,
          config: { ...modelConfig, stream: true },
          onUpdate(message) {
            botMessage.streaming = true;
            if (message) {
              botMessage.content = message;
            }
            get().updateCurrentSession((session) => {
              session.messages = session.messages.concat();
            });
          },
          onFinish(message) {
            botMessage.streaming = false;
            if (message) {
              botMessage.content = message;
              get().onNewMessage(botMessage);
            }
            ChatControllerPool.remove(session.id, botMessage.id);
          },
          onError(error) {
            const isAborted = error.message.includes("aborted");
            botMessage.content +=
              "\n\n" +
              prettyObject({
                error: true,
                message: error.message,
              });
            botMessage.streaming = false;
            userMessage.isError = !isAborted;
            botMessage.isError = !isAborted;
            get().updateCurrentSession((session) => {
              session.messages = session.messages.concat();
            });
            ChatControllerPool.remove(
              session.id,
              botMessage.id ?? messageIndex,
            );

            console.error("[Chat] failed ", error);
          },
          onController(controller) {
            // collect controller for stop/retry
            ChatControllerPool.addController(
              session.id,
              botMessage.id ?? messageIndex,
              controller,
            );
          },
        });
      },

      getMemoryPrompt() {
        const session = get().currentSession();

        if (session.memoryPrompt.length) {
          return {
            role: "system",
            content: Locale.Store.Prompt.History(session.memoryPrompt),
            date: "",
          } as ChatMessage;
        }
      },
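
      // Assembles the outgoing context: optional injected system prompt,
      // summarized long-term memory, the mask's in-context prompts, and as
      // many recent messages as fit under the token budget. The caller
      // appends the newest input message itself.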
      getMessagesWithMemory() {
        const session = get().currentSession();
        const modelConfig = session.mask.modelConfig;
        const clearContextIndex = session.clearContextIndex ?? 0;
        const messages = session.messages.slice();
        const totalMessageCount = session.messages.length;

        // in-context prompts
        const contextPrompts = session.mask.context.slice();

        // system prompts, to get close to OpenAI Web ChatGPT
        const shouldInjectSystemPrompts =
          modelConfig.enableInjectSystemPrompts &&
          session.mask.modelConfig.model.startsWith("gpt-");

        const systemPrompts: ChatMessage[] = shouldInjectSystemPrompts
          ? [
              createMessage({
                role: "system",
                content: fillTemplateWith("", {
                  ...modelConfig,
                  template: DEFAULT_SYSTEM_TEMPLATE,
                }),
              }),
            ]
          : [];
        if (shouldInjectSystemPrompts) {
          console.log(
            "[Global System Prompt] ",
            systemPrompts.at(0)?.content ?? "empty",
          );
        }

        const memoryPrompt = get().getMemoryPrompt();
        // long term memory
        const shouldSendLongTermMemory =
          modelConfig.sendMemory &&
          session.memoryPrompt &&
          session.memoryPrompt.length > 0 &&
          session.lastSummarizeIndex > clearContextIndex;
        const longTermMemoryPrompts =
          shouldSendLongTermMemory && memoryPrompt ? [memoryPrompt] : [];
        const longTermMemoryStartIndex = session.lastSummarizeIndex;

        // short term memory
        const shortTermMemoryStartIndex = Math.max(
          0,
          totalMessageCount - modelConfig.historyMessageCount,
        );

        // let's concat the messages to send, in five parts:
        // 0. system prompt: to get close to OpenAI Web ChatGPT
        // 1. long term memory: summarized memory messages
        // 2. pre-defined in-context prompts
        // 3. short term memory: latest n messages
        // 4. newest input message (appended by the caller)
        const memoryStartIndex = shouldSendLongTermMemory
          ? Math.min(longTermMemoryStartIndex, shortTermMemoryStartIndex)
          : shortTermMemoryStartIndex;
        // and if the user has cleared history messages, exclude the memory too
        const contextStartIndex = Math.max(clearContextIndex, memoryStartIndex);
        const maxTokenThreshold = modelConfig.max_tokens;

        // collect as many recent messages as fit under the token threshold
        const reversedRecentMessages = [];
        for (
          let i = totalMessageCount - 1, tokenCount = 0;
          i >= contextStartIndex && tokenCount < maxTokenThreshold;
          i -= 1
        ) {
          const msg = messages[i];
          if (!msg || msg.isError) continue;
          tokenCount += estimateTokenLength(getMessageTextContent(msg));
          reversedRecentMessages.push(msg);
        }

        // concat all messages
        const recentMessages = [
          ...systemPrompts,
          ...longTermMemoryPrompts,
          ...contextPrompts,
          ...reversedRecentMessages.reverse(),
        ];

        return recentMessages;
      },

      updateMessage(
        sessionIndex: number,
        messageIndex: number,
        updater: (message?: ChatMessage) => void,
      ) {
        const sessions = get().sessions;
        const session = sessions.at(sessionIndex);
        const messages = session?.messages;
        updater(messages?.at(messageIndex));
        set(() => ({ sessions }));
      },

      resetSession() {
        get().updateCurrentSession((session) => {
          session.messages = [];
          session.memoryPrompt = "";
        });
      },
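
      // Two jobs: auto-generate a topic once the chat passes the length
      // threshold, and compress older history into session.memoryPrompt when
      // it outgrows compressMessageLengthThreshold.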
      summarizeSession() {
        const config = useAppConfig.getState();
        const session = get().currentSession();
        const modelConfig = session.mask.modelConfig;

        // skip summarization when using dalle3
        if (isDalle3(modelConfig.model)) {
          return;
        }

        const api: ClientApi = getClientApi(modelConfig.providerName);

        // error messages are filtered out below, before summarizing
        const messages = session.messages;

        // summarize the topic only after roughly 50 words have been exchanged
        const SUMMARIZE_MIN_LEN = 50;
        if (
          config.enableAutoGenerateTitle &&
          session.topic === DEFAULT_TOPIC &&
          countMessages(messages) >= SUMMARIZE_MIN_LEN
        ) {
          const topicMessages = messages.concat(
            createMessage({
              role: "user",
              content: Locale.Store.Prompt.Topic,
            }),
          );
          api.llm.chat({
            messages: topicMessages,
            config: {
              model: getSummarizeModel(session.mask.modelConfig.model),
              stream: false,
            },
            onFinish(message) {
              get().updateCurrentSession(
                (session) =>
                  (session.topic =
                    message.length > 0 ? trimTopic(message) : DEFAULT_TOPIC),
              );
            },
          });
        }

        const summarizeIndex = Math.max(
          session.lastSummarizeIndex,
          session.clearContextIndex ?? 0,
        );
        let toBeSummarizedMsgs = messages
          .filter((msg) => !msg.isError)
          .slice(summarizeIndex);

        const historyMsgLength = countMessages(toBeSummarizedMsgs);

        // parentheses are required: without them, `a > b ?? c` parses as
        // `(a > b) ?? c` and the 4000 fallback never applies
        if (historyMsgLength > (modelConfig?.max_tokens ?? 4000)) {
          const n = toBeSummarizedMsgs.length;
          toBeSummarizedMsgs = toBeSummarizedMsgs.slice(
            Math.max(0, n - modelConfig.historyMessageCount),
          );
        }

        const memoryPrompt = get().getMemoryPrompt();
        if (memoryPrompt) {
          // add the previous memory prompt so the summary stays cumulative
          toBeSummarizedMsgs.unshift(memoryPrompt);
        }

        const lastSummarizeIndex = session.messages.length;

        console.log(
          "[Chat History] ",
          toBeSummarizedMsgs,
          historyMsgLength,
          modelConfig.compressMessageLengthThreshold,
        );

        if (
          historyMsgLength > modelConfig.compressMessageLengthThreshold &&
          modelConfig.sendMemory
        ) {
          /**
           * Destructure max_tokens out while summarizing:
           * it would needlessly cap the length of the generated summary.
           */
          const { max_tokens, ...modelcfg } = modelConfig;
          api.llm.chat({
            messages: toBeSummarizedMsgs.concat(
              createMessage({
                role: "system",
                content: Locale.Store.Prompt.Summarize,
                date: "",
              }),
            ),
            config: {
              ...modelcfg,
              stream: true,
              model: getSummarizeModel(session.mask.modelConfig.model),
            },
            onUpdate(message) {
              session.memoryPrompt = message;
            },
            onFinish(message) {
              console.log("[Memory] ", message);
              get().updateCurrentSession((session) => {
                session.lastSummarizeIndex = lastSummarizeIndex;
                session.memoryPrompt = message; // persist the memory prompt to local storage
              });
            },
            onError(err) {
              console.error("[Summarize] ", err);
            },
          });
        }
      },

      updateStat(message: ChatMessage) {
        get().updateCurrentSession((session) => {
          session.stat.charCount += message.content.length;
          // TODO: should update chat count and word count
        });
      },
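
      // Note: the updater mutates the selected session in place; set() then
      // re-publishes the same sessions array so the persisted state is
      // rewritten.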
      updateCurrentSession(updater: (session: ChatSession) => void) {
        const sessions = get().sessions;
        const index = get().currentSessionIndex;
        updater(sessions[index]);
        set(() => ({ sessions }));
      },

      clearAllData() {
        localStorage.clear();
        location.reload();
      },
    };

    return methods;
  },
  {
    name: StoreKey.Chat,
    version: 3.1,
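    // Upgrades persisted state from older schema versions; each block below
    // handles a single version bump.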
    migrate(persistedState, version) {
      const state = persistedState as any;
      const newState = JSON.parse(
        JSON.stringify(state),
      ) as typeof DEFAULT_CHAT_STATE;

      if (version < 2) {
        newState.sessions = [];

        const oldSessions = state.sessions;
        for (const oldSession of oldSessions) {
          const newSession = createEmptySession();
          newSession.topic = oldSession.topic;
          newSession.messages = [...oldSession.messages];
          newSession.mask.modelConfig.sendMemory = true;
          newSession.mask.modelConfig.historyMessageCount = 4;
          newSession.mask.modelConfig.compressMessageLengthThreshold = 1000;
          newState.sessions.push(newSession);
        }
      }

      if (version < 3) {
        // migrate id to nanoid
        newState.sessions.forEach((s) => {
          s.id = nanoid();
          s.messages.forEach((m) => (m.id = nanoid()));
        });
      }

      // Enable the `enableInjectSystemPrompts` attribute for old sessions,
      // so sessions created before the option existed pick it up.
      if (version < 3.1) {
        newState.sessions.forEach((s) => {
          if (
            // exclude sessions where the user has already set it
            !s.mask.modelConfig.hasOwnProperty("enableInjectSystemPrompts")
          ) {
            // the user may have changed this option globally, so use the
            // current configuration instead of the default
            const config = useAppConfig.getState();
            s.mask.modelConfig.enableInjectSystemPrompts =
              config.modelConfig.enableInjectSystemPrompts;
          }
        });
      }

      return newState as any;
    },
  },
);
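
// Minimal usage sketch (illustrative, not part of this file); assumes a React
// component where hooks are allowed:
//
//   const chatStore = useChatStore();
//   chatStore.newSession();                  // create and select a fresh session
//   await chatStore.onUserInput("Hello!");   // stream a reply into the session
//   const topic = chatStore.currentSession().topic;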