chat.ts

import { trimTopic, getMessageTextContent, isDalle3 } from "../utils";

import Locale, { getLang } from "../locales";
import { showToast } from "../components/ui-lib";
import { ModelConfig, ModelType, useAppConfig } from "./config";
import { createEmptyMask, Mask } from "./mask";
import {
  DEFAULT_INPUT_TEMPLATE,
  DEFAULT_MODELS,
  DEFAULT_SYSTEM_TEMPLATE,
  KnowledgeCutOffDate,
  StoreKey,
  SUMMARIZE_MODEL,
  GEMINI_SUMMARIZE_MODEL,
} from "../constant";
import { getClientApi } from "../client/api";
import type {
  ClientApi,
  RequestMessage,
  MultimodalContent,
} from "../client/api";
import { ChatControllerPool } from "../client/controller";
import { prettyObject } from "../utils/format";
import { estimateTokenLength } from "../utils/token";
import { nanoid } from "nanoid";
import { createPersistStore } from "../utils/store";
import { collectModelsWithDefaultModel } from "../utils/model";
import { useAccessStore } from "./access";
export type ChatMessage = RequestMessage & {
  date: string;
  streaming?: boolean;
  isError?: boolean;
  id: string;
  model?: ModelType;
};

export function createMessage(override: Partial<ChatMessage>): ChatMessage {
  return {
    id: nanoid(),
    date: new Date().toLocaleString(),
    role: "user",
    content: "",
    ...override,
  };
}
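
// Usage sketch (editor's addition, not part of the original file): only the
// fields you override change; id and date are generated fresh on every call.
//
//   const hello = createMessage({ role: "assistant", content: "Hi there" });
//   // hello.role === "assistant", hello.content === "Hi there",
//   // hello.id is a new nanoid, hello.date a locale timestamp string.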
export interface ChatStat {
  tokenCount: number;
  wordCount: number;
  charCount: number;
}

export interface ChatSession {
  id: string;
  topic: string;

  memoryPrompt: string;
  messages: ChatMessage[];
  stat: ChatStat;
  lastUpdate: number;
  lastSummarizeIndex: number;
  clearContextIndex?: number;

  mask: Mask;
}

export const DEFAULT_TOPIC = Locale.Store.DefaultTopic;
export const BOT_HELLO: ChatMessage = createMessage({
  role: "assistant",
  content: Locale.Store.BotHello,
});

function createEmptySession(): ChatSession {
  return {
    id: nanoid(),
    topic: DEFAULT_TOPIC,
    memoryPrompt: "",
    messages: [],
    stat: {
      tokenCount: 0,
      wordCount: 0,
      charCount: 0,
    },
    lastUpdate: Date.now(),
    lastSummarizeIndex: 0,
    mask: createEmptyMask(),
  };
}
function getSummarizeModel(currentModel: string) {
  // if a gpt-* model is in use, force 4o-mini for summarizing
  if (currentModel.startsWith("gpt")) {
    const configStore = useAppConfig.getState();
    const accessStore = useAccessStore.getState();
    const allModel = collectModelsWithDefaultModel(
      configStore.models,
      [configStore.customModels, accessStore.customModels].join(","),
      accessStore.defaultModel,
    );
    const summarizeModel = allModel.find(
      (m) => m.name === SUMMARIZE_MODEL && m.available,
    );
    return summarizeModel?.name ?? currentModel;
  }
  if (currentModel.startsWith("gemini")) {
    return GEMINI_SUMMARIZE_MODEL;
  }
  return currentModel;
}
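
// Routing sketch (editor's addition): assuming SUMMARIZE_MODEL names an
// available gpt-4o-mini entry, the expected mapping is:
//
//   getSummarizeModel("gpt-4");         // -> SUMMARIZE_MODEL (e.g. "gpt-4o-mini")
//   getSummarizeModel("gemini-pro");    // -> GEMINI_SUMMARIZE_MODEL
//   getSummarizeModel("claude-3-opus"); // -> "claude-3-opus" (unchanged)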
function countMessages(msgs: ChatMessage[]) {
  return msgs.reduce(
    (pre, cur) => pre + estimateTokenLength(getMessageTextContent(cur)),
    0,
  );
}
function fillTemplateWith(input: string, modelConfig: ModelConfig) {
  const cutoff =
    KnowledgeCutOffDate[modelConfig.model] ?? KnowledgeCutOffDate.default;
  // find the entry in the DEFAULT_MODELS array that matches modelConfig.model
  const modelInfo = DEFAULT_MODELS.find((m) => m.name === modelConfig.model);

  let serviceProvider = "OpenAI";
  if (modelInfo) {
    // TODO: auto-detect the providerName from modelConfig.model
    // for now, use the providerName from the matched modelInfo directly
    serviceProvider = modelInfo.provider.providerName;
  }

  const vars = {
    ServiceProvider: serviceProvider,
    cutoff,
    model: modelConfig.model,
    time: new Date().toString(),
    lang: getLang(),
    input: input,
  };

  let output = modelConfig.template ?? DEFAULT_INPUT_TEMPLATE;

  // remove duplicated input if the user pasted the template itself
  if (input.startsWith(output)) {
    output = "";
  }

  // the template must contain {{input}}
  const inputVar = "{{input}}";
  if (!output.includes(inputVar)) {
    output += "\n" + inputVar;
  }

  Object.entries(vars).forEach(([name, value]) => {
    const regex = new RegExp(`{{${name}}}`, "g");
    output = output.replace(regex, value.toString()); // ensure value is a string
  });

  return output;
}
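
// Substitution sketch (editor's addition), with a hypothetical template
// "You are {{model}} from {{ServiceProvider}}.\n{{input}}":
//
//   fillTemplateWith("Hello", { ...modelConfig, model: "gpt-4" });
//   // -> "You are gpt-4 from OpenAI.\nHello"
//
// If the template lacks {{input}}, it is appended on a new line first.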
const DEFAULT_CHAT_STATE = {
  sessions: [createEmptySession()],
  currentSessionIndex: 0,
};

export const useChatStore = createPersistStore(
  DEFAULT_CHAT_STATE,
  (set, _get) => {
    function get() {
      return {
        ..._get(),
        ...methods,
      };
    }

    const methods = {
      clearSessions() {
        set(() => ({
          sessions: [createEmptySession()],
          currentSessionIndex: 0,
        }));
      },

      selectSession(index: number) {
        set({
          currentSessionIndex: index,
        });
      },

      moveSession(from: number, to: number) {
        set((state) => {
          const { sessions, currentSessionIndex: oldIndex } = state;

          // move the session
          const newSessions = [...sessions];
          const session = newSessions[from];
          newSessions.splice(from, 1);
          newSessions.splice(to, 0, session);

          // keep the current session selected after the move
          let newIndex = oldIndex === from ? to : oldIndex;
          if (oldIndex > from && oldIndex <= to) {
            newIndex -= 1;
          } else if (oldIndex < from && oldIndex >= to) {
            newIndex += 1;
          }

          return {
            currentSessionIndex: newIndex,
            sessions: newSessions,
          };
        });
      },
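
      // Index bookkeeping sketch (editor's addition): with sessions
      // [A, B, C, D] and currentSessionIndex = 2 (C), moveSession(0, 3)
      // yields [B, C, D, A]; since oldIndex (2) > from (0) and <= to (3),
      // newIndex becomes 1 and C stays selected.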
      newSession(mask?: Mask) {
        const session = createEmptySession();

        if (mask) {
          const config = useAppConfig.getState();
          const globalModelConfig = config.modelConfig;

          session.mask = {
            ...mask,
            modelConfig: {
              ...globalModelConfig,
              ...mask.modelConfig,
            },
          };
          session.topic = mask.name;
        }

        set((state) => ({
          currentSessionIndex: 0,
          sessions: [session].concat(state.sessions),
        }));
      },

      nextSession(delta: number) {
        const n = get().sessions.length;
        const limit = (x: number) => (x + n) % n;
        const i = get().currentSessionIndex;
        get().selectSession(limit(i + delta));
      },

      deleteSession(index: number) {
        const deletingLastSession = get().sessions.length === 1;
        const deletedSession = get().sessions.at(index);

        if (!deletedSession) return;

        const sessions = get().sessions.slice();
        sessions.splice(index, 1);

        const currentIndex = get().currentSessionIndex;
        let nextIndex = Math.min(
          currentIndex - Number(index < currentIndex),
          sessions.length - 1,
        );

        if (deletingLastSession) {
          nextIndex = 0;
          sessions.push(createEmptySession());
        }

        // for undo delete action
        const restoreState = {
          currentSessionIndex: get().currentSessionIndex,
          sessions: get().sessions.slice(),
        };

        set(() => ({
          currentSessionIndex: nextIndex,
          sessions,
        }));

        showToast(
          Locale.Home.DeleteToast,
          {
            text: Locale.Home.Revert,
            onClick() {
              set(() => restoreState);
            },
          },
          5000,
        );
      },
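
      // Selection sketch (editor's addition): with sessions [A, B, C] and
      // currentSessionIndex = 2 (C):
      //   deleteSession(0) -> nextIndex = min(2 - 1, 1) = 1, C stays selected;
      //   deleteSession(2) -> nextIndex = min(2 - 0, 1) = 1, selection falls
      //   back to B.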
      currentSession() {
        let index = get().currentSessionIndex;
        const sessions = get().sessions;

        if (index < 0 || index >= sessions.length) {
          index = Math.min(sessions.length - 1, Math.max(0, index));
          set(() => ({ currentSessionIndex: index }));
        }

        const session = sessions[index];
        return session;
      },

      onNewMessage(message: ChatMessage) {
        get().updateCurrentSession((session) => {
          // replace the messages array so subscribers see a new reference
          session.messages = session.messages.concat();
          session.lastUpdate = Date.now();
        });
        get().updateStat(message);
        get().summarizeSession();
      },
      async onUserInput(content: string, attachImages?: string[]) {
        const session = get().currentSession();
        const modelConfig = session.mask.modelConfig;

        const userContent = fillTemplateWith(content, modelConfig);
        console.log("[User Input] after template: ", userContent);

        let mContent: string | MultimodalContent[] = userContent;

        if (attachImages && attachImages.length > 0) {
          mContent = [
            {
              type: "text",
              text: userContent,
            },
          ];
          mContent = mContent.concat(
            attachImages.map((url) => {
              return {
                type: "image_url",
                image_url: {
                  url: url,
                },
              };
            }),
          );
        }

        const userMessage: ChatMessage = createMessage({
          role: "user",
          content: mContent,
        });

        const botMessage: ChatMessage = createMessage({
          role: "assistant",
          streaming: true,
          model: modelConfig.model,
        });

        // get recent messages
        const recentMessages = get().getMessagesWithMemory();
        const sendMessages = recentMessages.concat(userMessage);
        const messageIndex = get().currentSession().messages.length + 1;

        // save user's and bot's message
        get().updateCurrentSession((session) => {
          const savedUserMessage = {
            ...userMessage,
            content: mContent,
          };
          session.messages = session.messages.concat([
            savedUserMessage,
            botMessage,
          ]);
        });

        const api: ClientApi = getClientApi(modelConfig.providerName);

        // make request
        api.llm.chat({
          messages: sendMessages,
          config: { ...modelConfig, stream: true },
          onUpdate(message) {
            botMessage.streaming = true;
            if (message) {
              botMessage.content = message;
            }
            get().updateCurrentSession((session) => {
              session.messages = session.messages.concat();
            });
          },
          onFinish(message) {
            botMessage.streaming = false;
            if (message) {
              botMessage.content = message;
              get().onNewMessage(botMessage);
            }
            ChatControllerPool.remove(session.id, botMessage.id);
          },
          onError(error) {
            const isAborted = error.message.includes("aborted");
            botMessage.content +=
              "\n\n" +
              prettyObject({
                error: true,
                message: error.message,
              });
            botMessage.streaming = false;
            userMessage.isError = !isAborted;
            botMessage.isError = !isAborted;
            get().updateCurrentSession((session) => {
              session.messages = session.messages.concat();
            });
            ChatControllerPool.remove(
              session.id,
              botMessage.id ?? messageIndex,
            );

            console.error("[Chat] failed ", error);
          },
          onController(controller) {
            // collect controller for stop/retry
            ChatControllerPool.addController(
              session.id,
              botMessage.id ?? messageIndex,
              controller,
            );
          },
        });
      },
      getMemoryPrompt() {
        const session = get().currentSession();

        if (session.memoryPrompt.length) {
          return {
            role: "system",
            content: Locale.Store.Prompt.History(session.memoryPrompt),
            date: "",
          } as ChatMessage;
        }
      },
      getMessagesWithMemory() {
        const session = get().currentSession();
        const modelConfig = session.mask.modelConfig;
        const clearContextIndex = session.clearContextIndex ?? 0;
        const messages = session.messages.slice();
        const totalMessageCount = session.messages.length;

        // in-context prompts
        const contextPrompts = session.mask.context.slice();

        // system prompts, to get close to OpenAI Web ChatGPT
        const shouldInjectSystemPrompts =
          modelConfig.enableInjectSystemPrompts &&
          session.mask.modelConfig.model.startsWith("gpt-");

        const systemPrompts: ChatMessage[] = shouldInjectSystemPrompts
          ? [
              createMessage({
                role: "system",
                content: fillTemplateWith("", {
                  ...modelConfig,
                  template: DEFAULT_SYSTEM_TEMPLATE,
                }),
              }),
            ]
          : [];
        if (shouldInjectSystemPrompts) {
          console.log(
            "[Global System Prompt] ",
            systemPrompts.at(0)?.content ?? "empty",
          );
        }

        const memoryPrompt = get().getMemoryPrompt();
        // long term memory
        const shouldSendLongTermMemory =
          modelConfig.sendMemory &&
          session.memoryPrompt &&
          session.memoryPrompt.length > 0 &&
          session.lastSummarizeIndex > clearContextIndex;
        const longTermMemoryPrompts =
          shouldSendLongTermMemory && memoryPrompt ? [memoryPrompt] : [];
        const longTermMemoryStartIndex = session.lastSummarizeIndex;

        // short term memory
        const shortTermMemoryStartIndex = Math.max(
          0,
          totalMessageCount - modelConfig.historyMessageCount,
        );

        // let's concat the messages to send, which consist of 5 parts:
        // 0. system prompt: to get close to OpenAI Web ChatGPT
        // 1. long term memory: summarized memory messages
        // 2. pre-defined in-context prompts
        // 3. short term memory: latest n messages
        // 4. newest input message
        const memoryStartIndex = shouldSendLongTermMemory
          ? Math.min(longTermMemoryStartIndex, shortTermMemoryStartIndex)
          : shortTermMemoryStartIndex;
        // and if the user has cleared history messages, exclude the memory too
        const contextStartIndex = Math.max(clearContextIndex, memoryStartIndex);
        const maxTokenThreshold = modelConfig.max_tokens;

        // get as many recent messages as the token budget allows
        const reversedRecentMessages = [];
        for (
          let i = totalMessageCount - 1, tokenCount = 0;
          i >= contextStartIndex && tokenCount < maxTokenThreshold;
          i -= 1
        ) {
          const msg = messages[i];
          if (!msg || msg.isError) continue;
          tokenCount += estimateTokenLength(getMessageTextContent(msg));
          reversedRecentMessages.push(msg);
        }

        // concat all messages
        const recentMessages = [
          ...systemPrompts,
          ...longTermMemoryPrompts,
          ...contextPrompts,
          ...reversedRecentMessages.reverse(),
        ];

        return recentMessages;
      },
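
      // Assembly sketch (editor's addition): the returned array is ordered as
      //   [injected system prompt?] + [long-term memory summary?] +
      //   [mask context prompts] + [recent messages within the token budget,
      //   oldest first]
      // so for a gpt-* session with memory enabled, the request starts with
      // the system template and ends with the newest message.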
      updateMessage(
        sessionIndex: number,
        messageIndex: number,
        updater: (message?: ChatMessage) => void,
      ) {
        const sessions = get().sessions;
        const session = sessions.at(sessionIndex);
        const messages = session?.messages;
        updater(messages?.at(messageIndex));
        set(() => ({ sessions }));
      },

      resetSession() {
        get().updateCurrentSession((session) => {
          session.messages = [];
          session.memoryPrompt = "";
        });
      },
      summarizeSession() {
        const config = useAppConfig.getState();
        const session = get().currentSession();
        const modelConfig = session.mask.modelConfig;

        // skip summarizing when using dall-e-3
        if (isDalle3(modelConfig.model)) {
          return;
        }

        const providerName = modelConfig.providerName;
        const api: ClientApi = getClientApi(providerName);

        // remove error messages if any
        const messages = session.messages;

        // summarize the topic only after chatting more than 50 words
        const SUMMARIZE_MIN_LEN = 50;
        if (
          config.enableAutoGenerateTitle &&
          session.topic === DEFAULT_TOPIC &&
          countMessages(messages) >= SUMMARIZE_MIN_LEN
        ) {
          const topicMessages = messages.concat(
            createMessage({
              role: "user",
              content: Locale.Store.Prompt.Topic,
            }),
          );
          api.llm.chat({
            messages: topicMessages,
            config: {
              model: getSummarizeModel(session.mask.modelConfig.model),
              stream: false,
              providerName,
            },
            onFinish(message) {
              get().updateCurrentSession(
                (session) =>
                  (session.topic =
                    message.length > 0 ? trimTopic(message) : DEFAULT_TOPIC),
              );
            },
          });
        }

        const summarizeIndex = Math.max(
          session.lastSummarizeIndex,
          session.clearContextIndex ?? 0,
        );
        let toBeSummarizedMsgs = messages
          .filter((msg) => !msg.isError)
          .slice(summarizeIndex);

        const historyMsgLength = countMessages(toBeSummarizedMsgs);

        // note the parentheses: `a > b ?? c` would parse as `(a > b) ?? c`
        if (historyMsgLength > (modelConfig?.max_tokens ?? 4000)) {
          const n = toBeSummarizedMsgs.length;
          toBeSummarizedMsgs = toBeSummarizedMsgs.slice(
            Math.max(0, n - modelConfig.historyMessageCount),
          );
        }

        const memoryPrompt = get().getMemoryPrompt();
        if (memoryPrompt) {
          // add memory prompt
          toBeSummarizedMsgs.unshift(memoryPrompt);
        }

        const lastSummarizeIndex = session.messages.length;

        console.log(
          "[Chat History] ",
          toBeSummarizedMsgs,
          historyMsgLength,
          modelConfig.compressMessageLengthThreshold,
        );

        if (
          historyMsgLength > modelConfig.compressMessageLengthThreshold &&
          modelConfig.sendMemory
        ) {
          /** Destructure max_tokens out while summarizing:
           * the completion limit only gets in the way here.
           **/
          const { max_tokens, ...modelcfg } = modelConfig;
          api.llm.chat({
            messages: toBeSummarizedMsgs.concat(
              createMessage({
                role: "system",
                content: Locale.Store.Prompt.Summarize,
                date: "",
              }),
            ),
            config: {
              ...modelcfg,
              stream: true,
              model: getSummarizeModel(session.mask.modelConfig.model),
            },
            onUpdate(message) {
              session.memoryPrompt = message;
            },
            onFinish(message) {
              console.log("[Memory] ", message);
              get().updateCurrentSession((session) => {
                session.lastSummarizeIndex = lastSummarizeIndex;
                session.memoryPrompt = message; // store the updated memory prompt in local storage
              });
            },
            onError(err) {
              console.error("[Summarize] ", err);
            },
          });
        }
      },
      updateStat(message: ChatMessage) {
        get().updateCurrentSession((session) => {
          session.stat.charCount += message.content.length;
          // TODO: should update chat count and word count
        });
      },

      updateCurrentSession(updater: (session: ChatSession) => void) {
        const sessions = get().sessions;
        const index = get().currentSessionIndex;
        updater(sessions[index]);
        set(() => ({ sessions }));
      },

      clearAllData() {
        localStorage.clear();
        location.reload();
      },
    };

    return methods;
  },
  {
    name: StoreKey.Chat,
    version: 3.1,
    migrate(persistedState, version) {
      const state = persistedState as any;
      const newState = JSON.parse(
        JSON.stringify(state),
      ) as typeof DEFAULT_CHAT_STATE;

      if (version < 2) {
        newState.sessions = [];

        const oldSessions = state.sessions;
        for (const oldSession of oldSessions) {
          const newSession = createEmptySession();
          newSession.topic = oldSession.topic;
          newSession.messages = [...oldSession.messages];
          newSession.mask.modelConfig.sendMemory = true;
          newSession.mask.modelConfig.historyMessageCount = 4;
          newSession.mask.modelConfig.compressMessageLengthThreshold = 1000;
          newState.sessions.push(newSession);
        }
      }

      if (version < 3) {
        // migrate id to nanoid
        newState.sessions.forEach((s) => {
          s.id = nanoid();
          s.messages.forEach((m) => (m.id = nanoid()));
        });
      }

      // Enable the `enableInjectSystemPrompts` attribute for old sessions,
      // which otherwise would never pick it up automatically.
      if (version < 3.1) {
        newState.sessions.forEach((s) => {
          if (
            // skip those already set by the user
            !s.mask.modelConfig.hasOwnProperty("enableInjectSystemPrompts")
          ) {
            // because the user may have changed this configuration,
            // use the user's current configuration instead of the default
            const config = useAppConfig.getState();
            s.mask.modelConfig.enableInjectSystemPrompts =
              config.modelConfig.enableInjectSystemPrompts;
          }
        });
      }

      return newState as any;
    },
  },
);
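
// Consumption sketch (editor's addition): assuming createPersistStore follows
// the usual zustand hook convention in this codebase, a component would use
// the store roughly like this:
//
//   const chatStore = useChatStore();
//   const session = chatStore.currentSession();
//   await chatStore.onUserInput("Hello!");   // send a message
//   chatStore.updateCurrentSession((s) => {
//     s.topic = "Renamed topic";             // mutate, then set() persists
//   });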