import { trimTopic, getMessageTextContent } from "../utils";
import Locale, { getLang } from "../locales";
import { showToast } from "../components/ui-lib";
import { ModelConfig, ModelType, useAppConfig } from "./config";
import { createEmptyMask, Mask } from "./mask";
import {
  DEFAULT_INPUT_TEMPLATE,
  DEFAULT_MODELS,
  DEFAULT_SYSTEM_TEMPLATE,
  KnowledgeCutOffDate,
  ServiceProvider,
  ModelProvider,
  StoreKey,
  SUMMARIZE_MODEL,
  GEMINI_SUMMARIZE_MODEL,
} from "../constant";
import { ClientApi, RequestMessage, MultimodalContent } from "../client/api";
import { ChatControllerPool } from "../client/controller";
import { prettyObject } from "../utils/format";
import { estimateTokenLength } from "../utils/token";
import { nanoid } from "nanoid";
import { createPersistStore } from "../utils/store";
import { collectModelsWithDefaultModel } from "../utils/model";
import { useAccessStore } from "./access";
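
// A ChatMessage extends the wire-format RequestMessage with client-side
// bookkeeping: a stable id, a display date, streaming/error flags, and
// the model that produced it.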
export type ChatMessage = RequestMessage & {
  date: string;
  streaming?: boolean;
  isError?: boolean;
  id: string;
  model?: ModelType;
};

export function createMessage(override: Partial<ChatMessage>): ChatMessage {
  return {
    id: nanoid(),
    date: new Date().toLocaleString(),
    role: "user",
    content: "",
    ...override,
  };
}

export interface ChatStat {
  tokenCount: number;
  wordCount: number;
  charCount: number;
}

export interface ChatSession {
  id: string;
  topic: string;
  memoryPrompt: string;
  messages: ChatMessage[];
  stat: ChatStat;
  lastUpdate: number;
  lastSummarizeIndex: number;
  clearContextIndex?: number;
  mask: Mask;
}

export const DEFAULT_TOPIC = Locale.Store.DefaultTopic;
export const BOT_HELLO: ChatMessage = createMessage({
  role: "assistant",
  content: Locale.Store.BotHello,
});

function createEmptySession(): ChatSession {
  return {
    id: nanoid(),
    topic: DEFAULT_TOPIC,
    memoryPrompt: "",
    messages: [],
    stat: {
      tokenCount: 0,
      wordCount: 0,
      charCount: 0,
    },
    lastUpdate: Date.now(),
    lastSummarizeIndex: 0,
    mask: createEmptyMask(),
  };
}
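
// Prefer a cheaper model for summarization tasks (topic naming and
// memory compression) instead of the session's chat model.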
function getSummarizeModel(currentModel: string) {
  // if a gpt-* model is in use, fall back to the cheaper summarize
  // model (gpt-3.5) when it is available
  if (currentModel.startsWith("gpt")) {
    const configStore = useAppConfig.getState();
    const accessStore = useAccessStore.getState();
    const allModel = collectModelsWithDefaultModel(
      configStore.models,
      [configStore.customModels, accessStore.customModels].join(","),
      accessStore.defaultModel,
    );
    const summarizeModel = allModel.find(
      (m) => m.name === SUMMARIZE_MODEL && m.available,
    );
    return summarizeModel?.name ?? currentModel;
  }
  if (currentModel.startsWith("gemini")) {
    return GEMINI_SUMMARIZE_MODEL;
  }
  return currentModel;
}
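
// Estimate the total token count of a list of messages.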
function countMessages(msgs: ChatMessage[]) {
  return msgs.reduce(
    (pre, cur) => pre + estimateTokenLength(getMessageTextContent(cur)),
    0,
  );
}
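
// Fill the prompt template, substituting the {{ServiceProvider}}, {{cutoff}},
// {{model}}, {{time}}, {{lang}}, and {{input}} variables.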
function fillTemplateWith(input: string, modelConfig: ModelConfig) {
  const cutoff =
    KnowledgeCutOffDate[modelConfig.model] ?? KnowledgeCutOffDate.default;
  // find the entry in DEFAULT_MODELS that matches modelConfig.model
  const modelInfo = DEFAULT_MODELS.find((m) => m.name === modelConfig.model);

  let serviceProvider = "OpenAI";
  if (modelInfo) {
    // TODO: auto detect the providerName from modelConfig.model
    // directly use the providerName from the modelInfo
    serviceProvider = modelInfo.provider.providerName;
  }

  const vars = {
    ServiceProvider: serviceProvider,
    cutoff,
    model: modelConfig.model,
    time: new Date().toString(),
    lang: getLang(),
    input: input,
  };

  let output = modelConfig.template ?? DEFAULT_INPUT_TEMPLATE;

  // if the input already starts with the template, skip applying it again
  if (input.startsWith(output)) {
    output = "";
  }

  // the output must contain {{input}}
  const inputVar = "{{input}}";
  if (!output.includes(inputVar)) {
    output += "\n" + inputVar;
  }

  Object.entries(vars).forEach(([name, value]) => {
    const regex = new RegExp(`{{${name}}}`, "g");
    output = output.replace(regex, value.toString()); // ensure value is a string
  });

  return output;
}

const DEFAULT_CHAT_STATE = {
  sessions: [createEmptySession()],
  currentSessionIndex: 0,
};
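
// The chat store holds all sessions, persists them under StoreKey.Chat,
// and exposes every session/message mutation as a method. The local get()
// wrapper merges the methods into the state so they can call each other.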
export const useChatStore = createPersistStore(
  DEFAULT_CHAT_STATE,
  (set, _get) => {
    function get() {
      return {
        ..._get(),
        ...methods,
      };
    }

    const methods = {
      clearSessions() {
        set(() => ({
          sessions: [createEmptySession()],
          currentSessionIndex: 0,
        }));
      },

      selectSession(index: number) {
        set({
          currentSessionIndex: index,
        });
      },

      moveSession(from: number, to: number) {
        set((state) => {
          const { sessions, currentSessionIndex: oldIndex } = state;

          // move the session
          const newSessions = [...sessions];
          const session = newSessions[from];
          newSessions.splice(from, 1);
          newSessions.splice(to, 0, session);

          // adjust the current session index
          let newIndex = oldIndex === from ? to : oldIndex;
          if (oldIndex > from && oldIndex <= to) {
            newIndex -= 1;
          } else if (oldIndex < from && oldIndex >= to) {
            newIndex += 1;
          }

          return {
            currentSessionIndex: newIndex,
            sessions: newSessions,
          };
        });
      },

      newSession(mask?: Mask) {
        const session = createEmptySession();

        if (mask) {
          const config = useAppConfig.getState();
          const globalModelConfig = config.modelConfig;

          session.mask = {
            ...mask,
            modelConfig: {
              ...globalModelConfig,
              ...mask.modelConfig,
            },
          };
          session.topic = mask.name;
        }

        set((state) => ({
          currentSessionIndex: 0,
          sessions: [session].concat(state.sessions),
        }));
      },

      nextSession(delta: number) {
        const n = get().sessions.length;
        const limit = (x: number) => (x + n) % n;
        const i = get().currentSessionIndex;
        get().selectSession(limit(i + delta));
      },

      deleteSession(index: number) {
        const deletingLastSession = get().sessions.length === 1;
        const deletedSession = get().sessions.at(index);

        if (!deletedSession) return;

        const sessions = get().sessions.slice();
        sessions.splice(index, 1);

        const currentIndex = get().currentSessionIndex;
        let nextIndex = Math.min(
          currentIndex - Number(index < currentIndex),
          sessions.length - 1,
        );

        if (deletingLastSession) {
          nextIndex = 0;
          sessions.push(createEmptySession());
        }

        // for undo delete action
        const restoreState = {
          currentSessionIndex: get().currentSessionIndex,
          sessions: get().sessions.slice(),
        };

        set(() => ({
          currentSessionIndex: nextIndex,
          sessions,
        }));

        showToast(
          Locale.Home.DeleteToast,
          {
            text: Locale.Home.Revert,
            onClick() {
              set(() => restoreState);
            },
          },
          5000,
        );
      },

      currentSession() {
        let index = get().currentSessionIndex;
        const sessions = get().sessions;

        if (index < 0 || index >= sessions.length) {
          index = Math.min(sessions.length - 1, Math.max(0, index));
          set(() => ({ currentSessionIndex: index }));
        }

        const session = sessions[index];
        return session;
      },

      onNewMessage(message: ChatMessage) {
        get().updateCurrentSession((session) => {
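          // reassign a fresh array reference so the persist store and
          // subscribers both see the change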
          session.messages = session.messages.concat();
          session.lastUpdate = Date.now();
        });
        get().updateStat(message);
        get().summarizeSession();
      },

      async onUserInput(content: string, attachImages?: string[]) {
        const session = get().currentSession();
        const modelConfig = session.mask.modelConfig;

        const userContent = fillTemplateWith(content, modelConfig);
        console.log("[User Input] after template: ", userContent);

        let mContent: string | MultimodalContent[] = userContent;
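
        // when images are attached, send multimodal content: the text part
        // followed by one image_url part per attachment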
        if (attachImages && attachImages.length > 0) {
          mContent = [
            {
              type: "text",
              text: userContent,
            },
          ];
          mContent = mContent.concat(
            attachImages.map((url) => {
              return {
                type: "image_url",
                image_url: {
                  url: url,
                },
              };
            }),
          );
        }

        const userMessage: ChatMessage = createMessage({
          role: "user",
          content: mContent,
        });

        const botMessage: ChatMessage = createMessage({
          role: "assistant",
          streaming: true,
          model: modelConfig.model,
        });

        // get recent messages
        const recentMessages = get().getMessagesWithMemory();
        const sendMessages = recentMessages.concat(userMessage);
        const messageIndex = get().currentSession().messages.length + 1;

        // save user's and bot's message
        get().updateCurrentSession((session) => {
          const savedUserMessage = {
            ...userMessage,
            content: mContent,
          };
          session.messages = session.messages.concat([
            savedUserMessage,
            botMessage,
          ]);
        });
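
        // choose the client implementation based on the configured provider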
        let api: ClientApi;
        if (modelConfig.providerName === ServiceProvider.Google) {
          api = new ClientApi(ModelProvider.GeminiPro);
        } else if (modelConfig.providerName === ServiceProvider.Anthropic) {
          api = new ClientApi(ModelProvider.Claude);
        } else if (modelConfig.providerName === ServiceProvider.Baidu) {
          api = new ClientApi(ModelProvider.Ernie);
        } else {
          api = new ClientApi(ModelProvider.GPT);
        }

        // make request
        api.llm.chat({
          messages: sendMessages,
          config: { ...modelConfig, stream: true },
          onUpdate(message) {
            botMessage.streaming = true;
            if (message) {
              botMessage.content = message;
            }
            get().updateCurrentSession((session) => {
              session.messages = session.messages.concat();
            });
          },
          onFinish(message) {
            botMessage.streaming = false;
            if (message) {
              botMessage.content = message;
              get().onNewMessage(botMessage);
            }
            ChatControllerPool.remove(session.id, botMessage.id);
          },
          onError(error) {
            const isAborted = error.message.includes("aborted");
            botMessage.content +=
              "\n\n" +
              prettyObject({
                error: true,
                message: error.message,
              });
            botMessage.streaming = false;
            userMessage.isError = !isAborted;
            botMessage.isError = !isAborted;
            get().updateCurrentSession((session) => {
              session.messages = session.messages.concat();
            });
            ChatControllerPool.remove(
              session.id,
              botMessage.id ?? messageIndex,
            );

            console.error("[Chat] failed ", error);
          },
          onController(controller) {
            // collect controller for stop/retry
            ChatControllerPool.addController(
              session.id,
              botMessage.id ?? messageIndex,
              controller,
            );
          },
        });
      },

      getMemoryPrompt() {
        const session = get().currentSession();

        if (session.memoryPrompt.length) {
          return {
            role: "system",
            content: Locale.Store.Prompt.History(session.memoryPrompt),
            date: "",
          } as ChatMessage;
        }
      },
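
      // Assemble the context to send: optional system prompt, long-term
      // memory summary, the mask's in-context prompts, and as many recent
      // messages as fit under the model's token threshold.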
      getMessagesWithMemory() {
        const session = get().currentSession();
        const modelConfig = session.mask.modelConfig;
        const clearContextIndex = session.clearContextIndex ?? 0;
        const messages = session.messages.slice();
        const totalMessageCount = session.messages.length;

        // in-context prompts
        const contextPrompts = session.mask.context.slice();

        // system prompts, to get close to OpenAI Web ChatGPT
        const shouldInjectSystemPrompts =
          modelConfig.enableInjectSystemPrompts &&
          session.mask.modelConfig.model.startsWith("gpt-");

        const systemPrompts: ChatMessage[] = shouldInjectSystemPrompts
          ? [
              createMessage({
                role: "system",
                content: fillTemplateWith("", {
                  ...modelConfig,
                  template: DEFAULT_SYSTEM_TEMPLATE,
                }),
              }),
            ]
          : [];
        if (shouldInjectSystemPrompts) {
          console.log(
            "[Global System Prompt] ",
            systemPrompts.at(0)?.content ?? "empty",
          );
        }

        const memoryPrompt = get().getMemoryPrompt();

        // long term memory
        const shouldSendLongTermMemory =
          modelConfig.sendMemory &&
          session.memoryPrompt &&
          session.memoryPrompt.length > 0 &&
          session.lastSummarizeIndex > clearContextIndex;
        const longTermMemoryPrompts =
          shouldSendLongTermMemory && memoryPrompt ? [memoryPrompt] : [];
        const longTermMemoryStartIndex = session.lastSummarizeIndex;

        // short term memory
        const shortTermMemoryStartIndex = Math.max(
          0,
          totalMessageCount - modelConfig.historyMessageCount,
        );

        // the final message list is concatenated from four parts:
        // 1. system prompt: to get close to OpenAI Web ChatGPT
        // 2. long term memory: summarized memory messages
        // 3. pre-defined in-context prompts
        // 4. short term memory: the latest n messages
        // (the newest input message is appended by the caller)
        const memoryStartIndex = shouldSendLongTermMemory
          ? Math.min(longTermMemoryStartIndex, shortTermMemoryStartIndex)
          : shortTermMemoryStartIndex;
        // and if the user has cleared history messages, exclude the memory too
        const contextStartIndex = Math.max(clearContextIndex, memoryStartIndex);
        const maxTokenThreshold = modelConfig.max_tokens;

        // collect as many recent messages as fit within the token threshold
        const reversedRecentMessages = [];
        for (
          let i = totalMessageCount - 1, tokenCount = 0;
          i >= contextStartIndex && tokenCount < maxTokenThreshold;
          i -= 1
        ) {
          const msg = messages[i];
          if (!msg || msg.isError) continue;
          tokenCount += estimateTokenLength(getMessageTextContent(msg));
          reversedRecentMessages.push(msg);
        }

        // concat all messages
        const recentMessages = [
          ...systemPrompts,
          ...longTermMemoryPrompts,
          ...contextPrompts,
          ...reversedRecentMessages.reverse(),
        ];

        return recentMessages;
      },

      updateMessage(
        sessionIndex: number,
        messageIndex: number,
        updater: (message?: ChatMessage) => void,
      ) {
        const sessions = get().sessions;
        const session = sessions.at(sessionIndex);
        const messages = session?.messages;
        updater(messages?.at(messageIndex));
        set(() => ({ sessions }));
      },

      resetSession() {
        get().updateCurrentSession((session) => {
          session.messages = [];
          session.memoryPrompt = "";
        });
      },
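
      // Runs after each new message: auto-generates a topic for untitled
      // sessions, and compresses older history into `memoryPrompt` once it
      // exceeds the configured threshold.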
      summarizeSession() {
        const config = useAppConfig.getState();
        const session = get().currentSession();
        const modelConfig = session.mask.modelConfig;

        let api: ClientApi;
        if (modelConfig.providerName === ServiceProvider.Google) {
          api = new ClientApi(ModelProvider.GeminiPro);
        } else if (modelConfig.providerName === ServiceProvider.Anthropic) {
          api = new ClientApi(ModelProvider.Claude);
        } else if (modelConfig.providerName === ServiceProvider.Baidu) {
          api = new ClientApi(ModelProvider.Ernie);
        } else {
          api = new ClientApi(ModelProvider.GPT);
        }

        const messages = session.messages;

        // generate a topic once the chat exceeds ~50 estimated tokens
        const SUMMARIZE_MIN_LEN = 50;
        if (
          config.enableAutoGenerateTitle &&
          session.topic === DEFAULT_TOPIC &&
          countMessages(messages) >= SUMMARIZE_MIN_LEN
        ) {
          const topicMessages = messages.concat(
            createMessage({
              role: "user",
              content: Locale.Store.Prompt.Topic,
            }),
          );
          api.llm.chat({
            messages: topicMessages,
            config: {
              model: getSummarizeModel(session.mask.modelConfig.model),
              stream: false,
            },
            onFinish(message) {
              get().updateCurrentSession(
                (session) =>
                  (session.topic =
                    message.length > 0 ? trimTopic(message) : DEFAULT_TOPIC),
              );
            },
          });
        }

        const summarizeIndex = Math.max(
          session.lastSummarizeIndex,
          session.clearContextIndex ?? 0,
        );

        // skip error messages when summarizing
        let toBeSummarizedMsgs = messages
          .filter((msg) => !msg.isError)
          .slice(summarizeIndex);

        const historyMsgLength = countMessages(toBeSummarizedMsgs);

        if (historyMsgLength > (modelConfig?.max_tokens ?? 4000)) {
          const n = toBeSummarizedMsgs.length;
          toBeSummarizedMsgs = toBeSummarizedMsgs.slice(
            Math.max(0, n - modelConfig.historyMessageCount),
          );
        }

        const memoryPrompt = get().getMemoryPrompt();
        if (memoryPrompt) {
          // add the previous memory prompt so the new summary builds on it
          toBeSummarizedMsgs.unshift(memoryPrompt);
        }

        const lastSummarizeIndex = session.messages.length;

        console.log(
          "[Chat History] ",
          toBeSummarizedMsgs,
          historyMsgLength,
          modelConfig.compressMessageLengthThreshold,
        );

        if (
          historyMsgLength > modelConfig.compressMessageLengthThreshold &&
          modelConfig.sendMemory
        ) {
          // drop max_tokens while summarizing: it would needlessly cap
          // the summary output
          const { max_tokens, ...modelcfg } = modelConfig;
          api.llm.chat({
            messages: toBeSummarizedMsgs.concat(
              createMessage({
                role: "system",
                content: Locale.Store.Prompt.Summarize,
                date: "",
              }),
            ),
            config: {
              ...modelcfg,
              stream: true,
              model: getSummarizeModel(session.mask.modelConfig.model),
            },
            onUpdate(message) {
              session.memoryPrompt = message;
            },
            onFinish(message) {
              console.log("[Memory] ", message);
              get().updateCurrentSession((session) => {
                session.lastSummarizeIndex = lastSummarizeIndex;
                session.memoryPrompt = message; // persist the memory prompt to local storage
              });
            },
            onError(err) {
              console.error("[Summarize] ", err);
            },
          });
        }
      },

      updateStat(message: ChatMessage) {
        get().updateCurrentSession((session) => {
          // count characters of the text content only; for multimodal
          // messages, message.content.length would be the part count
          session.stat.charCount += getMessageTextContent(message).length;
          // TODO: should update chat count and word count
        });
      },

      updateCurrentSession(updater: (session: ChatSession) => void) {
        const sessions = get().sessions;
        const index = get().currentSessionIndex;
        updater(sessions[index]);
        set(() => ({ sessions }));
      },

      clearAllData() {
        localStorage.clear();
        location.reload();
      },
    };

    return methods;
  },
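
  // persist options: storage key, schema version, and migrations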
  {
    name: StoreKey.Chat,
    version: 3.1,

    migrate(persistedState, version) {
      const state = persistedState as any;
      const newState = JSON.parse(
        JSON.stringify(state),
      ) as typeof DEFAULT_CHAT_STATE;

      if (version < 2) {
        newState.sessions = [];

        const oldSessions = state.sessions;
        for (const oldSession of oldSessions) {
          const newSession = createEmptySession();
          newSession.topic = oldSession.topic;
          newSession.messages = [...oldSession.messages];
          newSession.mask.modelConfig.sendMemory = true;
          newSession.mask.modelConfig.historyMessageCount = 4;
          newSession.mask.modelConfig.compressMessageLengthThreshold = 1000;
          newState.sessions.push(newSession);
        }
      }

      if (version < 3) {
        // migrate id to nanoid
        newState.sessions.forEach((s) => {
          s.id = nanoid();
          s.messages.forEach((m) => (m.id = nanoid()));
        });
      }

      // Enable the `enableInjectSystemPrompts` attribute for old sessions.
      // Resolves an issue where old sessions never enabled it automatically.
      if (version < 3.1) {
        newState.sessions.forEach((s) => {
          if (
            // skip sessions where the user has already set it
            !s.mask.modelConfig.hasOwnProperty("enableInjectSystemPrompts")
          ) {
            // the user may have changed this setting, so use the user's
            // current configuration instead of the default
            const config = useAppConfig.getState();
            s.mask.modelConfig.enableInjectSystemPrompts =
              config.modelConfig.enableInjectSystemPrompts;
          }
        });
      }

      return newState as any;
    },
  },
);