chat.ts

import { trimTopic, getMessageTextContent } from "../utils";
import Locale, { getLang } from "../locales";
import { showToast } from "../components/ui-lib";
import { ModelConfig, ModelType, useAppConfig } from "./config";
import { createEmptyMask, Mask } from "./mask";
import {
  DEFAULT_INPUT_TEMPLATE,
  DEFAULT_MODELS,
  DEFAULT_SYSTEM_TEMPLATE,
  KnowledgeCutOffDate,
  StoreKey,
  SUMMARIZE_MODEL,
  GEMINI_SUMMARIZE_MODEL,
  ServiceProvider,
} from "../constant";
import { getClientApi } from "../client/api";
import type {
  ClientApi,
  RequestMessage,
  MultimodalContent,
} from "../client/api";
import { ChatControllerPool } from "../client/controller";
import { prettyObject } from "../utils/format";
import { estimateTokenLength } from "../utils/token";
import { nanoid } from "nanoid";
import { createPersistStore } from "../utils/store";
import { collectModelsWithDefaultModel } from "../utils/model";
import { useAccessStore } from "./access";
import { isDalle3 } from "../utils";

export type ChatMessage = RequestMessage & {
  date: string;
  streaming?: boolean;
  isError?: boolean;
  id: string;
  model?: ModelType;
};
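
// Factory for ChatMessage: id and date are generated, everything else
// defaults to an empty user message. e.g. createMessage({ role: "assistant" })
// yields an empty assistant message with a fresh nanoid.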
export function createMessage(override: Partial<ChatMessage>): ChatMessage {
  return {
    id: nanoid(),
    date: new Date().toLocaleString(),
    role: "user",
    content: "",
    ...override,
  };
}

export interface ChatStat {
  tokenCount: number;
  wordCount: number;
  charCount: number;
}

export interface ChatSession {
  appId: string;
  id: string;
  topic: string;
  memoryPrompt: string;
  messages: ChatMessage[];
  stat: ChatStat;
  lastUpdate: number;
  lastSummarizeIndex: number;
  clearContextIndex?: number;
  mask: Mask;
}

export const DEFAULT_TOPIC = Locale.Store.DefaultTopic;
export const BOT_HELLO: ChatMessage = createMessage({
  role: "assistant",
  content:
    "Hello! Welcome to 建科·小智. Feel free to ask me anything related to this project.",
});

function createEmptySession(): ChatSession {
  return {
    appId: "",
    id: nanoid(),
    topic: DEFAULT_TOPIC,
    memoryPrompt: "",
    messages: [],
    stat: {
      tokenCount: 0,
      wordCount: 0,
      charCount: 0,
    },
    lastUpdate: Date.now(),
    lastSummarizeIndex: 0,
    mask: createEmptyMask(),
  };
}
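
// Chooses the model used for summarization: gpt-* chats fall back to
// SUMMARIZE_MODEL when it is available, gemini-* chats map to
// GEMINI_SUMMARIZE_MODEL, and any other model summarizes with itself.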
function getSummarizeModel(currentModel: string) {
  // if a gpt-* model is in use, force 4o-mini for summarization
  if (currentModel.startsWith("gpt")) {
    const configStore = useAppConfig.getState();
    const accessStore = useAccessStore.getState();
    const allModel = collectModelsWithDefaultModel(
      configStore.models,
      [configStore.customModels, accessStore.customModels].join(","),
      accessStore.defaultModel,
    );
    const summarizeModel = allModel.find(
      (m) => m.name === SUMMARIZE_MODEL && m.available,
    );
    return summarizeModel?.name ?? currentModel;
  }
  if (currentModel.startsWith("gemini")) {
    return GEMINI_SUMMARIZE_MODEL;
  }
  return currentModel;
}

function countMessages(msgs: ChatMessage[]) {
  return msgs.reduce(
    (pre, cur) => pre + estimateTokenLength(getMessageTextContent(cur)),
    0,
  );
}
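
// Expands the configured input template. As a sketch, a hypothetical template
// "{{model}} ({{cutoff}}): {{input}}" with input "Hi" would expand to
// something like "gpt-4o (2023-10): Hi", depending on modelConfig.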
function fillTemplateWith(input: string, modelConfig: ModelConfig) {
  const cutoff =
    KnowledgeCutOffDate[modelConfig.model] ?? KnowledgeCutOffDate.default;
  // find the model in DEFAULT_MODELS that matches modelConfig.model
  const modelInfo = DEFAULT_MODELS.find((m) => m.name === modelConfig.model);

  let serviceProvider = "OpenAI";
  if (modelInfo) {
    // TODO: auto detect the providerName from modelConfig.model
    // directly use the providerName from the modelInfo
    serviceProvider = modelInfo.provider.providerName;
  }

  const vars = {
    ServiceProvider: serviceProvider,
    cutoff,
    model: modelConfig.model,
    time: new Date().toString(),
    lang: getLang(),
    input: input,
  };

  let output = modelConfig.template ?? DEFAULT_INPUT_TEMPLATE;

  // remove duplicates: if the input already starts with the template, drop it
  if (input.startsWith(output)) {
    output = "";
  }

  // the output must contain {{input}}
  const inputVar = "{{input}}";
  if (!output.includes(inputVar)) {
    output += "\n" + inputVar;
  }

  Object.entries(vars).forEach(([name, value]) => {
    const regex = new RegExp(`{{${name}}}`, "g");
    output = output.replace(regex, value.toString()); // ensure value is a string
  });

  return output;
}

const DEFAULT_CHAT_STATE = {
  model: "BigModel" as "BigModel" | "DeepSeek",
  deepSeekStatus: "ONLINE" as "ONLINE" | "LOCAL",
  sessions: [createEmptySession()],
  currentSessionIndex: 0,
  message: {
    content: "",
    role: "assistant",
  },
};

export const useChatStore = createPersistStore(
  DEFAULT_CHAT_STATE,
  (set, _get) => {
    // merge the persisted state with the method table so that
    // methods can call one another through get()
    function get() {
      return {
        ..._get(),
        ...methods,
      };
    }

    const methods = {
      setModel(model: "BigModel" | "DeepSeek") {
        set({ model: model });
      },
      setDeepSeekStatus(status: "ONLINE" | "LOCAL") {
        set({ deepSeekStatus: status });
      },
      clearSessions() {
        set(() => ({
          sessions: [createEmptySession()],
          currentSessionIndex: 0,
        }));
      },
      selectSession(index: number) {
        set({
          currentSessionIndex: index,
        });
      },
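
      // Reorders sessions while keeping the same session selected; e.g. moving
      // session 0 to position 2 while session 1 is selected shifts
      // currentSessionIndex from 1 to 0 (same session, new position).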
      moveSession(from: number, to: number) {
        set((state) => {
          const { sessions, currentSessionIndex: oldIndex } = state;

          // move the session
          const newSessions = [...sessions];
          const session = newSessions[from];
          newSessions.splice(from, 1);
          newSessions.splice(to, 0, session);

          // adjust the current session index
          let newIndex = oldIndex === from ? to : oldIndex;
          if (oldIndex > from && oldIndex <= to) {
            newIndex -= 1;
          } else if (oldIndex < from && oldIndex >= to) {
            newIndex += 1;
          }

          return {
            currentSessionIndex: newIndex,
            sessions: newSessions,
          };
        });
      },
      newSession(mask?: Mask) {
        const session = createEmptySession();

        if (mask) {
          const config = useAppConfig.getState();
          const globalModelConfig = config.modelConfig;

          session.mask = {
            ...mask,
            modelConfig: {
              ...globalModelConfig,
              ...mask.modelConfig,
            },
          };
          session.topic = mask.name;
        }

        set((state) => ({
          currentSessionIndex: 0,
          sessions: [session].concat(state.sessions),
        }));
      },
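
      // Cycles delta steps through the session list with wrap-around;
      // e.g. with 3 sessions, nextSession(-1) at index 0 selects index 2.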
      nextSession(delta: number) {
        const n = get().sessions.length;
        const limit = (x: number) => (x + n) % n;
        const i = get().currentSessionIndex;
        get().selectSession(limit(i + delta));
      },
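
      // Deletes a session but snapshots the previous state first, so the
      // toast's "Revert" action can restore it within the 5-second window.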
      deleteSession(index: number) {
        const deletingLastSession = get().sessions.length === 1;
        const deletedSession = get().sessions.at(index);

        if (!deletedSession) return;

        const sessions = get().sessions.slice();
        sessions.splice(index, 1);

        const currentIndex = get().currentSessionIndex;
        let nextIndex = Math.min(
          currentIndex - Number(index < currentIndex),
          sessions.length - 1,
        );

        if (deletingLastSession) {
          nextIndex = 0;
          sessions.push(createEmptySession());
        }

        // for the undo delete action
        const restoreState = {
          currentSessionIndex: get().currentSessionIndex,
          sessions: get().sessions.slice(),
        };

        set(() => ({
          currentSessionIndex: nextIndex,
          sessions,
        }));

        showToast(
          Locale.Home.DeleteToast,
          {
            text: Locale.Home.Revert,
            onClick() {
              set(() => restoreState);
            },
          },
          5000,
        );
      },
      currentSession() {
        let index = get().currentSessionIndex;
        const sessions = get().sessions;

        // clamp the index if it has drifted out of range
        if (index < 0 || index >= sessions.length) {
          index = Math.min(sessions.length - 1, Math.max(0, index));
          set(() => ({ currentSessionIndex: index }));
        }

        const session = sessions[index];
        return session;
      },
      onNewMessage(message: ChatMessage) {
        get().updateCurrentSession((session) => {
          // concat() with no args clones the array so subscribers see a new reference
          session.messages = session.messages.concat();
          session.lastUpdate = Date.now();
        });
        get().updateStat(message);
        get().summarizeSession();
      },
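
      // Sends one user turn: expands the input template, wraps attached images
      // as multimodal content, appends the user message plus a streaming bot
      // placeholder, then streams the reply in via the selected provider.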
      async onUserInput(content: string, attachImages?: string[]) {
        const session = get().currentSession();
        const modelConfig = session.mask.modelConfig;

        const userContent = fillTemplateWith(content, modelConfig);
        console.log("[User Input] after template: ", userContent);

        let mContent: string | MultimodalContent[] = userContent;

        if (attachImages && attachImages.length > 0) {
          mContent = [
            {
              type: "text",
              text: userContent,
            },
          ];
          mContent = mContent.concat(
            attachImages.map((url) => {
              return {
                type: "image_url",
                image_url: {
                  url: url,
                },
              };
            }),
          );
        }

        const userMessage: ChatMessage = createMessage({
          role: "user",
          content: mContent,
        });

        const botMessage: ChatMessage = createMessage({
          role: "assistant",
          streaming: true,
          model: modelConfig.model,
        });

        // get recent messages
        const recentMessages = get().getMessagesWithMemory();
        const sendMessages = recentMessages.concat(userMessage);
        const messageIndex = get().currentSession().messages.length + 1;

        // save the user's and the bot's message
        get().updateCurrentSession((session) => {
          const savedUserMessage = {
            ...userMessage,
            content: mContent,
          };
          session.messages = session.messages.concat([
            savedUserMessage,
            botMessage,
          ]);
        });

        // use BigModel or DeepSeek
        const model = get().model as ServiceProvider;
        const api: ClientApi = getClientApi(model);
        api.llm.chat({
          messages: sendMessages,
          config: {
            ...modelConfig,
            appId: session.appId,
            stream: true,
          },
          onUpdate(message) {
            botMessage.streaming = true;
            if (message) {
              botMessage.content = message;
            }
            get().updateCurrentSession((session) => {
              session.messages = session.messages.concat();
            });
          },
          onFinish(message) {
            botMessage.streaming = false;
            if (message) {
              botMessage.content = message;
              get().onNewMessage(botMessage);
            }
            ChatControllerPool.remove(session.id, botMessage.id);
          },
          onError(error) {
            const isAborted = error.message.includes("aborted");
            botMessage.content +=
              "\n\n" +
              prettyObject({
                error: true,
                message: error.message,
              });
            botMessage.streaming = false;
            userMessage.isError = !isAborted;
            botMessage.isError = !isAborted;
            get().updateCurrentSession((session) => {
              session.messages = session.messages.concat();
            });
            ChatControllerPool.remove(
              session.id,
              botMessage.id ?? messageIndex,
            );

            console.error("[Chat] failed ", error);
          },
          onController(controller) {
            // collect the controller for stop/retry
            ChatControllerPool.addController(
              session.id,
              botMessage.id ?? messageIndex,
              controller,
            );
          },
        });
      },
      getMemoryPrompt() {
        const session = get().currentSession();

        if (session.memoryPrompt.length) {
          return {
            role: "system",
            content: Locale.Store.Prompt.History(session.memoryPrompt),
            date: "",
          } as ChatMessage;
        }
      },
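
      // Assembles the outgoing context: injected system prompt, summarized
      // long-term memory, the mask's in-context prompts, and finally as many
      // recent messages as fit under modelConfig.max_tokens.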
      getMessagesWithMemory() {
        const session = get().currentSession();
        const modelConfig = session.mask.modelConfig;
        const clearContextIndex = session.clearContextIndex ?? 0;
        const messages = session.messages.slice();
        const totalMessageCount = session.messages.length;

        // in-context prompts
        const contextPrompts = session.mask.context.slice();

        // system prompts, to get close to OpenAI Web ChatGPT
        const shouldInjectSystemPrompts =
          modelConfig.enableInjectSystemPrompts &&
          session.mask.modelConfig.model.startsWith("gpt-");

        const systemPrompts: ChatMessage[] = shouldInjectSystemPrompts
          ? [
              createMessage({
                role: "system",
                content: fillTemplateWith("", {
                  ...modelConfig,
                  template: DEFAULT_SYSTEM_TEMPLATE,
                }),
              }),
            ]
          : [];
        if (shouldInjectSystemPrompts) {
          console.log(
            "[Global System Prompt] ",
            systemPrompts.at(0)?.content ?? "empty",
          );
        }
        const memoryPrompt = get().getMemoryPrompt();

        // long term memory
        const shouldSendLongTermMemory =
          modelConfig.sendMemory &&
          session.memoryPrompt &&
          session.memoryPrompt.length > 0 &&
          session.lastSummarizeIndex > clearContextIndex;
        const longTermMemoryPrompts =
          shouldSendLongTermMemory && memoryPrompt ? [memoryPrompt] : [];
        const longTermMemoryStartIndex = session.lastSummarizeIndex;

        // short term memory
        const shortTermMemoryStartIndex = Math.max(
          0,
          totalMessageCount - modelConfig.historyMessageCount,
        );

        // let's concat the messages to send, in five parts:
        // 1. system prompt: to get close to OpenAI Web ChatGPT
        // 2. long term memory: summarized memory messages
        // 3. pre-defined in-context prompts
        // 4. short term memory: latest n messages
        // 5. newest input message
        const memoryStartIndex = shouldSendLongTermMemory
          ? Math.min(longTermMemoryStartIndex, shortTermMemoryStartIndex)
          : shortTermMemoryStartIndex;
        // and if the user has cleared the history, exclude the memory too
        const contextStartIndex = Math.max(clearContextIndex, memoryStartIndex);
        const maxTokenThreshold = modelConfig.max_tokens;

        // get as many recent messages as possible
        const reversedRecentMessages = [];
        for (
          let i = totalMessageCount - 1, tokenCount = 0;
          i >= contextStartIndex && tokenCount < maxTokenThreshold;
          i -= 1
        ) {
          const msg = messages[i];
          if (!msg || msg.isError) continue;
          tokenCount += estimateTokenLength(getMessageTextContent(msg));
          reversedRecentMessages.push(msg);
        }

        // concat all messages
        const recentMessages = [
          ...systemPrompts,
          ...longTermMemoryPrompts,
          ...contextPrompts,
          ...reversedRecentMessages.reverse(),
        ];

        return recentMessages;
      },
      updateMessage(
        sessionIndex: number,
        messageIndex: number,
        updater: (message?: ChatMessage) => void,
      ) {
        const sessions = get().sessions;
        const session = sessions.at(sessionIndex);
        const messages = session?.messages;
        updater(messages?.at(messageIndex));
        set(() => ({ sessions }));
      },
      resetSession() {
        get().updateCurrentSession((session) => {
          session.messages = [];
          session.memoryPrompt = "";
        });
      },
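
      // Two-stage summarization: auto-title the session once it passes
      // SUMMARIZE_MIN_LEN tokens, and compress older messages into
      // session.memoryPrompt once they exceed compressMessageLengthThreshold.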
      summarizeSession() {
        const config = useAppConfig.getState();
        const session = get().currentSession();
        const modelConfig = session.mask.modelConfig;

        // skip summarization when the model is dall-e-3
        if (isDalle3(modelConfig.model)) {
          return;
        }

        // use BigModel or DeepSeek
        const model = get().model as ServiceProvider;
        const api: ClientApi = getClientApi(model);

        const messages = session.messages;

        // summarize the topic only after chatting for more than 50 tokens
        const SUMMARIZE_MIN_LEN = 50;
        if (
          config.enableAutoGenerateTitle &&
          session.topic === DEFAULT_TOPIC &&
          countMessages(messages) >= SUMMARIZE_MIN_LEN
        ) {
          const topicMessages = messages.concat(
            createMessage({
              role: "user",
              content: Locale.Store.Prompt.Topic,
            }),
          );
          api.llm.chat({
            messages: topicMessages,
            config: {
              model: getSummarizeModel(session.mask.modelConfig.model),
              stream: false,
              providerName: model,
            },
            onFinish(message) {
              get().updateCurrentSession(
                (session) =>
                  (session.topic =
                    message.length > 0 ? trimTopic(message) : DEFAULT_TOPIC),
              );
            },
          });
        }

        const summarizeIndex = Math.max(
          session.lastSummarizeIndex,
          session.clearContextIndex ?? 0,
        );

        // remove error messages if any, then keep everything after the last summary
        let toBeSummarizedMsgs = messages
          .filter((msg) => !msg.isError)
          .slice(summarizeIndex);
        const historyMsgLength = countMessages(toBeSummarizedMsgs);

        if (historyMsgLength > (modelConfig?.max_tokens ?? 4000)) {
          const n = toBeSummarizedMsgs.length;
          toBeSummarizedMsgs = toBeSummarizedMsgs.slice(
            Math.max(0, n - modelConfig.historyMessageCount),
          );
        }
        const memoryPrompt = get().getMemoryPrompt();
        if (memoryPrompt) {
          // add the memory prompt
          toBeSummarizedMsgs.unshift(memoryPrompt);
        }

        const lastSummarizeIndex = session.messages.length;

        if (
          historyMsgLength > modelConfig.compressMessageLengthThreshold &&
          modelConfig.sendMemory
        ) {
          /** Drop max_tokens while summarizing:
           * it would needlessly cap the summary length.
           **/
          const { max_tokens, ...modelcfg } = modelConfig;
          api.llm.chat({
            messages: toBeSummarizedMsgs.concat(
              createMessage({
                role: "system",
                content: Locale.Store.Prompt.Summarize,
                date: "",
              }),
            ),
            config: {
              ...modelcfg,
              stream: true,
              model: getSummarizeModel(session.mask.modelConfig.model),
            },
            onUpdate(message) {
              session.memoryPrompt = message;
            },
            onFinish(message) {
              get().updateCurrentSession((session) => {
                session.lastSummarizeIndex = lastSummarizeIndex;
                session.memoryPrompt = message; // update the memory prompt so it is persisted to local storage
              });
            },
            onError(err) {
              console.error("[Summarize] ", err);
            },
          });
        }
      },
      updateStat(message: ChatMessage) {
        get().updateCurrentSession((session) => {
          // content may be multimodal, so count only its text portion
          session.stat.charCount += getMessageTextContent(message).length;
          // TODO: should update chat count and word count
        });
      },
      updateCurrentSession(updater: (session: ChatSession) => void) {
        const sessions = get().sessions;
        const index = get().currentSessionIndex;
        updater(sessions[index]);
        set(() => ({ sessions }));
      },
      clearAllData() {
        localStorage.clear();
        location.reload();
      },
    };

    return methods;
  },
  {
    name: StoreKey.Chat,
    version: 3.1,
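
    // Version history, as encoded below: v2 rebuilt each session with a fresh
    // mask and memory defaults, v3 switched ids to nanoid, and v3.1 backfilled
    // enableInjectSystemPrompts from the user's current config.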
    migrate(persistedState, version) {
      const state = persistedState as any;
      const newState = JSON.parse(
        JSON.stringify(state),
      ) as typeof DEFAULT_CHAT_STATE;

      if (version < 2) {
        newState.sessions = [];

        const oldSessions = state.sessions;
        for (const oldSession of oldSessions) {
          const newSession = createEmptySession();
          newSession.appId = oldSession.appId;
          newSession.topic = oldSession.topic;
          newSession.messages = [...oldSession.messages];
          newSession.mask.modelConfig.sendMemory = true;
          newSession.mask.modelConfig.historyMessageCount = 4;
          newSession.mask.modelConfig.compressMessageLengthThreshold = 1000;
          newState.sessions.push(newSession);
        }
      }

      if (version < 3) {
        // migrate ids to nanoid
        newState.sessions.forEach((s) => {
          s.id = nanoid();
          s.messages.forEach((m) => (m.id = nanoid()));
        });
      }

      // Enable the `enableInjectSystemPrompts` attribute for old sessions,
      // which otherwise would never enable it automatically.
      if (version < 3.1) {
        newState.sessions.forEach((s) => {
          if (
            // skip sessions where the user has already set it
            !s.mask.modelConfig.hasOwnProperty("enableInjectSystemPrompts")
          ) {
            // the user may have changed this setting, so use the user's
            // current configuration instead of the default
            const config = useAppConfig.getState();
            s.mask.modelConfig.enableInjectSystemPrompts =
              config.modelConfig.enableInjectSystemPrompts;
          }
        });
      }

      return newState as any;
    },
  },
);