chat.ts 22 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742
  1. import { trimTopic, getMessageTextContent } from "../utils";
  2. import Locale, { getLang } from "../locales";
  3. import { showToast } from "../components/ui-lib";
  4. import { ModelConfig, ModelType, useAppConfig } from "./config";
  5. import { createEmptyMask, Mask } from "./mask";
  6. import {
  7. DEFAULT_INPUT_TEMPLATE,
  8. DEFAULT_MODELS,
  9. DEFAULT_SYSTEM_TEMPLATE,
  10. KnowledgeCutOffDate,
  11. StoreKey,
  12. SUMMARIZE_MODEL,
  13. GEMINI_SUMMARIZE_MODEL,
  14. ServiceProvider,
  15. } from "../constant";
  16. import { getClientApi } from "../client/api";
  17. import type {
  18. ClientApi,
  19. RequestMessage,
  20. MultimodalContent,
  21. } from "../client/api";
  22. import { ChatControllerPool } from "../client/controller";
  23. import { prettyObject } from "../utils/format";
  24. import { estimateTokenLength } from "../utils/token";
  25. import { nanoid } from "nanoid";
  26. import { createPersistStore } from "../utils/store";
  27. import { collectModelsWithDefaultModel } from "../utils/model";
  28. import { useAccessStore } from "./access";
  29. import { isDalle3 } from "../utils";
  /**
   * A chat entry: the request-level message plus the bookkeeping fields the
   * store attaches to it.
   */
  export type ChatMessage = RequestMessage & {
    /** Unique identifier of the message. */
    id: string;
    /** Creation time, kept as a string. */
    date: string;
    /** Model associated with the message, when one was recorded. */
    model?: ModelType;
    /** Set while the reply is still being streamed in. */
    streaming?: boolean;
    /** Marks a message that belongs to a failed exchange. */
    isError?: boolean;
  };
  /**
   * Builds a chat message from defaults, letting `override` replace any field.
   *
   * Defaults are a fresh nanoid, the current locale-formatted time, the
   * "user" role and empty content.
   *
   * @param override Fields that take precedence over the defaults.
   * @returns The assembled message.
   */
  export function createMessage(override: Partial<ChatMessage>): ChatMessage {
    const defaults: ChatMessage = {
      id: nanoid(),
      date: new Date().toLocaleString(),
      role: "user",
      content: "",
    };
    return { ...defaults, ...override };
  }
  /** Size counters kept per chat session. */
  export interface ChatStat {
    /** Token counter. */
    tokenCount: number;
    /** Word counter. */
    wordCount: number;
    /** Character counter. */
    charCount: number;
  }
  /** One conversation held by the chat store. */
  export interface ChatSession {
    /** Application id forwarded in the config of chat requests. */
    appId: string;
    /** Unique identifier of the session. */
    id: string;
    /** Title shown for the session. */
    topic: string;
    /** Summary text produced by the summarize request. */
    memoryPrompt: string;
    /** Messages in chronological order. */
    messages: ChatMessage[];
    /** Size counters for the session. */
    stat: ChatStat;
    /** Timestamp (ms since epoch) of the latest update. */
    lastUpdate: number;
    /** Message count at the time the last summary was started. */
    lastSummarizeIndex: number;
    /** Messages before this index are left out of the request context. */
    clearContextIndex?: number;
    /** Mask supplying the model config and in-context prompts. */
    mask: Mask;
  }
  /** Topic assigned to sessions that have not been given a title. */
  export const DEFAULT_TOPIC = Locale.Store.DefaultTopic;

  /** Assistant greeting message. */
  export const BOT_HELLO: ChatMessage = createMessage({
    content: "您好,欢迎使用建科·小智,与本项目相关的问题都可以问我。",
    role: "assistant",
  });
  /**
   * Creates a blank session: fresh id, default topic, no messages, zeroed
   * counters and an empty mask.
   */
  function createEmptySession(): ChatSession {
    const emptyStat: ChatStat = { tokenCount: 0, wordCount: 0, charCount: 0 };
    const session: ChatSession = {
      appId: "",
      id: nanoid(),
      topic: DEFAULT_TOPIC,
      memoryPrompt: "",
      messages: [],
      stat: emptyStat,
      lastUpdate: Date.now(),
      lastSummarizeIndex: 0,
      mask: createEmptyMask(),
    };
    return session;
  }
  /**
   * Picks the model used for summarize requests.
   *
   * - `gemini*` models always use `GEMINI_SUMMARIZE_MODEL`.
   * - `gpt*` models use `SUMMARIZE_MODEL` when it is listed as available,
   *   otherwise the current model.
   * - Any other model summarizes with itself.
   *
   * @param currentModel Name of the model the session is using.
   * @returns Name of the model to summarize with.
   */
  function getSummarizeModel(currentModel: string) {
    if (currentModel.startsWith("gemini")) {
      return GEMINI_SUMMARIZE_MODEL;
    }
    if (!currentModel.startsWith("gpt")) {
      return currentModel;
    }

    const configStore = useAppConfig.getState();
    const accessStore = useAccessStore.getState();
    const customModelList = [
      configStore.customModels,
      accessStore.customModels,
    ].join(",");
    const candidates = collectModelsWithDefaultModel(
      configStore.models,
      customModelList,
      accessStore.defaultModel,
    );
    const preferred = candidates.find(
      (candidate) => candidate.name === SUMMARIZE_MODEL && candidate.available,
    );
    return preferred?.name ?? currentModel;
  }
  /**
   * Sums the estimated token length of the text content of every message.
   *
   * @param msgs Messages to measure.
   * @returns Total estimated length; 0 for an empty list.
   */
  function countMessages(msgs: ChatMessage[]) {
    let total = 0;
    for (const msg of msgs) {
      total += estimateTokenLength(getMessageTextContent(msg));
    }
    return total;
  }
  /**
   * Expands the input template of a model config.
   *
   * Supported placeholders: `{{ServiceProvider}}`, `{{cutoff}}`, `{{model}}`,
   * `{{time}}`, `{{lang}}` and `{{input}}`. When the template lacks
   * `{{input}}` it is appended on a new line, so the user's text is never
   * dropped.
   *
   * @param input Text to insert for `{{input}}`.
   * @param modelConfig Supplies the model name and an optional `template`;
   *   `DEFAULT_INPUT_TEMPLATE` is used when no template is set.
   * @returns The template with every placeholder substituted.
   */
  function fillTemplateWith(input: string, modelConfig: ModelConfig) {
    const cutoff =
      KnowledgeCutOffDate[modelConfig.model] ?? KnowledgeCutOffDate.default;

    // Take the provider name from the matching DEFAULT_MODELS entry and
    // fall back to "OpenAI" when the model is not listed there.
    // TODO: auto detect the providerName from the modelConfig.model
    const modelInfo = DEFAULT_MODELS.find((m) => m.name === modelConfig.model);
    const serviceProvider = modelInfo
      ? modelInfo.provider.providerName
      : "OpenAI";

    const vars = {
      ServiceProvider: serviceProvider,
      cutoff,
      model: modelConfig.model,
      time: new Date().toString(),
      lang: getLang(),
      input: input,
    };

    let output = modelConfig.template ?? DEFAULT_INPUT_TEMPLATE;

    // Avoid duplicating the template when the input already begins with it.
    if (input.startsWith(output)) {
      output = "";
    }

    // The template must contain {{input}}.
    const inputVar = "{{input}}";
    if (!output.includes(inputVar)) {
      output += "\n" + inputVar;
    }

    for (const [name, value] of Object.entries(vars)) {
      // Substitute literally. String.prototype.replace with a string
      // replacement would interpret "$$", "$&", "$1" ... inside the value and
      // corrupt user input that contains a dollar sign.
      output = output.split(`{{${name}}}`).join(String(value));
    }

    return output;
  }
  /**
   * Initial store state: the "BigModel" provider and a single empty session
   * that is selected.
   */
  const DEFAULT_CHAT_STATE = {
    model: "BigModel" as "BigModel" | "DeepSeek",
    sessions: [createEmptySession()],
    currentSessionIndex: 0,
  };
  151. export const useChatStore = createPersistStore(
  152. DEFAULT_CHAT_STATE,
  153. (set, _get) => {
  /** Returns the current store state merged with the store methods. */
  function get() {
    const state = _get();
    return { ...state, ...methods };
  }
  160. const methods = {
  /** Stores the provider ("BigModel" or "DeepSeek") used for chat requests. */
  setModel(model: "BigModel" | "DeepSeek") {
    set({ model });
  },
  /** Replaces all sessions with one empty session and selects it. */
  clearSessions() {
    set(() => {
      return {
        sessions: [createEmptySession()],
        currentSessionIndex: 0,
      };
    });
  },
  /** Makes the session at `index` the current one. */
  selectSession(index: number) {
    set({ currentSessionIndex: index });
  },
  /**
   * Moves the session at position `from` to position `to`, keeping the
   * current selection on the same session.
   */
  moveSession(from: number, to: number) {
    set((state) => {
      const current = state.currentSessionIndex;

      // Reorder on a copy so the previous array is left untouched.
      const reordered = [...state.sessions];
      const moved = reordered[from];
      reordered.splice(from, 1);
      reordered.splice(to, 0, moved);

      // Follow the moved session, or shift by one when the move crossed the
      // currently selected position.
      let nextIndex = current;
      if (current === from) {
        nextIndex = to;
      } else if (from < current && current <= to) {
        nextIndex = current - 1;
      } else if (to <= current && current < from) {
        nextIndex = current + 1;
      }

      return {
        currentSessionIndex: nextIndex,
        sessions: reordered,
      };
    });
  },
  /**
   * Creates a session, puts it first in the list and selects it.
   *
   * @param mask Optional mask; its model config is layered over the global
   *   model config and its name becomes the session topic.
   */
  newSession(mask?: Mask) {
    const session = createEmptySession();

    if (mask) {
      const { modelConfig: globalModelConfig } = useAppConfig.getState();
      const mergedModelConfig = {
        ...globalModelConfig,
        ...mask.modelConfig,
      };
      session.mask = { ...mask, modelConfig: mergedModelConfig };
      session.topic = mask.name;
    }

    set((state) => ({
      currentSessionIndex: 0,
      sessions: [session, ...state.sessions],
    }));
  },
  /**
   * Selects the session `delta` positions away from the current one,
   * wrapping around both ends of the list.
   *
   * @param delta Signed number of positions to move; any magnitude is accepted.
   */
  nextSession(delta: number) {
    const { sessions, currentSessionIndex } = get();
    const n = sessions.length;
    // Nothing to select; also avoids a NaN index from `% 0`.
    if (n === 0) return;
    // `%` keeps the sign of the dividend, so normalize twice to stay within
    // [0, n) even when delta is below -n.
    const wrapped = (((currentSessionIndex + delta) % n) + n) % n;
    get().selectSession(wrapped);
  },
  /**
   * Removes the session at `index` and shows a toast whose action restores
   * the previous session list and selection.
   *
   * When the only session is removed, a fresh empty session takes its place.
   */
  deleteSession(index: number) {
    const previousSessions = get().sessions;
    const previousIndex = get().currentSessionIndex;

    if (!previousSessions.at(index)) return;

    const wasOnlySession = previousSessions.length === 1;
    const remaining = previousSessions.slice();
    remaining.splice(index, 1);

    // Shift the selection left when a session before it was removed, and
    // never point past the end of the shortened list.
    const shift = index < previousIndex ? 1 : 0;
    let nextIndex = Math.min(previousIndex - shift, remaining.length - 1);

    if (wasOnlySession) {
      nextIndex = 0;
      remaining.push(createEmptySession());
    }

    // Snapshot used by the toast's undo action.
    const restoreState = {
      currentSessionIndex: previousIndex,
      sessions: previousSessions.slice(),
    };

    set(() => ({
      currentSessionIndex: nextIndex,
      sessions: remaining,
    }));

    const undoAction = {
      text: Locale.Home.Revert,
      onClick() {
        set(() => restoreState);
      },
    };
    showToast(Locale.Home.DeleteToast, undoAction, 5000);
  },
  /**
   * Returns the selected session. An out-of-range selection index is clamped
   * into the list bounds and written back to the store first.
   */
  currentSession() {
    const sessions = get().sessions;
    let index = get().currentSessionIndex;

    const outOfRange = index < 0 || index >= sessions.length;
    if (outOfRange) {
      index = Math.min(sessions.length - 1, Math.max(0, index));
      set(() => ({ currentSessionIndex: index }));
    }

    return sessions[index];
  },
  /**
   * Post-processing after a reply completes: re-publishes the message list,
   * stamps the session, updates the counters and runs summarization.
   */
  onNewMessage(message: ChatMessage) {
    get().updateCurrentSession((session) => {
      // New array reference with the same elements.
      session.messages = session.messages.slice();
      session.lastUpdate = Date.now();
    });
    get().updateStat(message);
    get().summarizeSession();
  },
  /**
   * Sends the user's input to the selected provider and streams the reply
   * into the current session.
   *
   * The templated input (plus any attached images) is stored as a user
   * message, followed by an assistant placeholder that is filled in as
   * chunks arrive.
   *
   * @param content Raw text typed by the user.
   * @param attachImages Optional image URLs sent as multimodal content.
   */
  async onUserInput(content: string, attachImages?: string[]) {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;

    const userContent = fillTemplateWith(content, modelConfig);
    console.log("[User Input] after template: ", userContent);

    let mContent: string | MultimodalContent[] = userContent;
    if (attachImages && attachImages.length > 0) {
      const parts: MultimodalContent[] = [{ type: "text", text: userContent }];
      for (const url of attachImages) {
        parts.push({ type: "image_url", image_url: { url } });
      }
      mContent = parts;
    }

    const userMessage: ChatMessage = createMessage({
      role: "user",
      content: mContent,
    });

    const botMessage: ChatMessage = createMessage({
      role: "assistant",
      streaming: true,
      model: modelConfig.model,
    });

    // Build the request context before the new messages are stored.
    const recentMessages = get().getMessagesWithMemory();
    const sendMessages = recentMessages.concat(userMessage);

    // Store the very objects that the callbacks below mutate. Storing a copy
    // of the user message meant its `isError` flag, set in onError, never
    // reached the session, so failed prompts were still sent as context.
    get().updateCurrentSession((session) => {
      session.messages = session.messages.concat([userMessage, botMessage]);
    });

    // Use BigModel or DeepSeek, whichever the store currently selects.
    const model = get().model as ServiceProvider;
    const api: ClientApi = getClientApi(model);

    api.llm.chat({
      messages: sendMessages,
      config: {
        ...modelConfig,
        appId: session.appId,
        stream: true,
      },
      onUpdate(message) {
        botMessage.streaming = true;
        if (message) {
          botMessage.content = message;
        }
        // Re-publish the list so the partial reply becomes visible.
        get().updateCurrentSession((session) => {
          session.messages = session.messages.concat();
        });
      },
      onFinish(message) {
        botMessage.streaming = false;
        if (message) {
          botMessage.content = message;
          get().onNewMessage(botMessage);
        }
        ChatControllerPool.remove(session.id, botMessage.id);
      },
      onError(error) {
        // Tolerate error values without a message.
        const errorText = error?.message ?? String(error);
        const isAborted = errorText.includes("aborted");
        botMessage.content +=
          "\n\n" +
          prettyObject({
            error: true,
            message: errorText,
          });
        botMessage.streaming = false;
        // An abort is not flagged as an error.
        userMessage.isError = !isAborted;
        botMessage.isError = !isAborted;
        get().updateCurrentSession((session) => {
          session.messages = session.messages.concat();
        });
        ChatControllerPool.remove(session.id, botMessage.id);

        console.error("[Chat] failed ", error);
      },
      onController(controller) {
        // collect controller for stop/retry
        ChatControllerPool.addController(
          session.id,
          botMessage.id,
          controller,
        );
      },
    });
  },
  /**
   * Wraps the session's memory prompt in a system message.
   *
   * @returns The system message, or `undefined` when the session has no
   *   memory prompt.
   */
  getMemoryPrompt() {
    const { memoryPrompt } = get().currentSession();
    if (!memoryPrompt.length) {
      return;
    }
    return {
      role: "system",
      content: Locale.Store.Prompt.History(memoryPrompt),
      date: "",
    } as ChatMessage;
  },
  /**
   * Assembles the context sent with a request, in this order:
   *
   * 0. system prompt (only for `gpt-` models with injection enabled)
   * 1. long term memory: the summarized memory prompt
   * 2. the mask's pre-defined in-context prompts
   * 3. short term memory: the latest messages within the history/token limits
   *
   * The newest input message is appended by the caller.
   */
  getMessagesWithMemory() {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;
    const clearContextIndex = session.clearContextIndex ?? 0;
    const messages = session.messages.slice();
    const totalMessageCount = session.messages.length;

    // in-context prompts
    const contextPrompts = session.mask.context.slice();

    // system prompts
    const shouldInjectSystemPrompts =
      modelConfig.enableInjectSystemPrompts &&
      session.mask.modelConfig.model.startsWith("gpt-");

    const systemPrompts: ChatMessage[] = [];
    if (shouldInjectSystemPrompts) {
      systemPrompts.push(
        createMessage({
          role: "system",
          content: fillTemplateWith("", {
            ...modelConfig,
            template: DEFAULT_SYSTEM_TEMPLATE,
          }),
        }),
      );
      console.log(
        "[Global System Prompt] ",
        systemPrompts.at(0)?.content ?? "empty",
      );
    }

    // long term memory
    const memoryPrompt = get().getMemoryPrompt();
    const shouldSendLongTermMemory =
      modelConfig.sendMemory &&
      session.memoryPrompt &&
      session.memoryPrompt.length > 0 &&
      session.lastSummarizeIndex > clearContextIndex;
    const longTermMemoryPrompts =
      shouldSendLongTermMemory && memoryPrompt ? [memoryPrompt] : [];

    // short term memory
    const shortTermMemoryStartIndex = Math.max(
      0,
      totalMessageCount - modelConfig.historyMessageCount,
    );

    const memoryStartIndex = shouldSendLongTermMemory
      ? Math.min(session.lastSummarizeIndex, shortTermMemoryStartIndex)
      : shortTermMemoryStartIndex;

    // Messages before a user-requested context clear are excluded too.
    const contextStartIndex = Math.max(clearContextIndex, memoryStartIndex);
    const maxTokenThreshold = modelConfig.max_tokens;

    // Walk backwards from the newest message, collecting until the start
    // index is reached or the token estimate hits the threshold.
    const recentWindow: ChatMessage[] = [];
    let tokenCount = 0;
    let cursor = totalMessageCount - 1;
    while (cursor >= contextStartIndex && tokenCount < maxTokenThreshold) {
      const msg = messages[cursor];
      cursor -= 1;
      if (!msg || msg.isError) continue;
      tokenCount += estimateTokenLength(getMessageTextContent(msg));
      // Prepend so the window ends up in chronological order.
      recentWindow.unshift(msg);
    }

    // concat all messages
    return [
      ...systemPrompts,
      ...longTermMemoryPrompts,
      ...contextPrompts,
      ...recentWindow,
    ];
  },
  /**
   * Runs `updater` on one message and re-publishes the session list.
   *
   * @param sessionIndex Position of the session (resolved with `Array.at`).
   * @param messageIndex Position of the message (resolved with `Array.at`).
   * @param updater Receives the message, or `undefined` when either index
   *   does not resolve.
   */
  updateMessage(
    sessionIndex: number,
    messageIndex: number,
    updater: (message?: ChatMessage) => void,
  ) {
    const sessions = get().sessions;
    const target = sessions.at(sessionIndex)?.messages?.at(messageIndex);
    updater(target);
    set(() => ({ sessions }));
  },
  /** Empties the current session's messages and memory prompt. */
  resetSession() {
    get().updateCurrentSession((session) => {
      session.memoryPrompt = "";
      session.messages = [];
    });
  },
  /**
   * Compresses the current session's history into its memory prompt once
   * the history is long enough and memory is enabled.
   *
   * Nothing is done for dalle3 models. The title-generation step is
   * currently short-circuited; see the review note inside.
   */
  summarizeSession() {
    const config = useAppConfig.getState();
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;
    // skip summarize when using dalle3?
    if (isDalle3(modelConfig.model)) {
      return;
    }

    // Use BigModel or DeepSeek, whichever the store currently selects.
    const model = get().model as ServiceProvider;
    const api: ClientApi = getClientApi(model);

    const messages = session.messages;

    // The topic is only considered once the estimated length of the
    // conversation reaches this value.
    const SUMMARIZE_MIN_LEN = 50;
    if (
      config.enableAutoGenerateTitle &&
      session.topic === DEFAULT_TOPIC &&
      countMessages(messages) >= SUMMARIZE_MIN_LEN
    ) {
      const topicMessages = messages.concat(
        createMessage({
          role: "user",
          content: Locale.Store.Prompt.Topic,
        }),
      );
      // NOTE(review): this early return makes the title request below
      // unreachable AND skips the memory summarization further down for
      // every session that still has the default topic. It is kept to
      // preserve current runtime behavior; confirm whether both effects are
      // intended before removing it.
      return;
      api.llm.chat({
        messages: topicMessages,
        config: {
          model: getSummarizeModel(session.mask.modelConfig.model),
          stream: false,
          providerName: model,
        },
        onFinish(message) {
          get().updateCurrentSession(
            (session) =>
              (session.topic =
                message.length > 0 ? trimTopic(message) : DEFAULT_TOPIC),
          );
        },
      });
    }

    const summarizeIndex = Math.max(
      session.lastSummarizeIndex,
      session.clearContextIndex ?? 0,
    );
    // Drop error messages, then keep only what has not been summarized yet.
    let toBeSummarizedMsgs = messages
      .filter((msg) => !msg.isError)
      .slice(summarizeIndex);

    const historyMsgLength = countMessages(toBeSummarizedMsgs);

    // Parenthesized on purpose: `a > b ?? c` parses as `(a > b) ?? c`, which
    // made the 4000 fallback dead code.
    if (historyMsgLength > (modelConfig?.max_tokens ?? 4000)) {
      const n = toBeSummarizedMsgs.length;
      toBeSummarizedMsgs = toBeSummarizedMsgs.slice(
        Math.max(0, n - modelConfig.historyMessageCount),
      );
    }

    const memoryPrompt = get().getMemoryPrompt();
    if (memoryPrompt) {
      // Put the existing memory prompt first.
      toBeSummarizedMsgs.unshift(memoryPrompt);
    }

    // Captured now so messages arriving during the request are not marked
    // as summarized.
    const lastSummarizeIndex = session.messages.length;

    console.log(
      "[Chat History] ",
      toBeSummarizedMsgs,
      historyMsgLength,
      modelConfig.compressMessageLengthThreshold,
    );

    if (
      historyMsgLength > modelConfig.compressMessageLengthThreshold &&
      modelConfig.sendMemory
    ) {
      // max_tokens is deliberately left out of the summarize request config.
      const { max_tokens, ...modelcfg } = modelConfig;
      api.llm.chat({
        messages: toBeSummarizedMsgs.concat(
          createMessage({
            role: "system",
            content: Locale.Store.Prompt.Summarize,
            date: "",
          }),
        ),
        config: {
          ...modelcfg,
          stream: true,
          model: getSummarizeModel(session.mask.modelConfig.model),
        },
        onUpdate(message) {
          session.memoryPrompt = message;
        },
        onFinish(message) {
          get().updateCurrentSession((session) => {
            session.lastSummarizeIndex = lastSummarizeIndex;
            // Written through the store so the new memory prompt is persisted.
            session.memoryPrompt = message;
          });
        },
        onError(err) {
          console.error("[Summarize] ", err);
        },
      });
    }
  },
  /**
   * Adds the message's text length to the current session's character count.
   *
   * @param message Message whose text content is counted.
   */
  updateStat(message: ChatMessage) {
    // `content` may be an array of multimodal parts, whose `.length` is the
    // number of parts rather than characters; measure the text instead.
    const textLength = getMessageTextContent(message).length;
    get().updateCurrentSession((session) => {
      session.stat.charCount += textLength;
      // TODO: should update chat count and word count
    });
  },
  /**
   * Applies `updater` to the selected session in place, then re-publishes
   * the session list.
   */
  updateCurrentSession(updater: (session: ChatSession) => void) {
    const { sessions, currentSessionIndex } = get();
    updater(sessions[currentSessionIndex]);
    set(() => ({ sessions }));
  },
  /** Clears everything in localStorage, then reloads the page. */
  clearAllData() {
    localStorage.clear();
    location.reload();
  },
  606. };
  607. return methods;
  608. },
  609. {
  610. name: StoreKey.Chat,
  611. version: 3.1,
  /**
   * Upgrades persisted state from an older store version.
   *
   * - below 2: rebuilds every session from an empty one, carrying over app
   *   id, topic and messages and setting the memory-related model config.
   * - below 3: assigns new nanoid ids to sessions and messages.
   * - below 3.1: fills in `enableInjectSystemPrompts` where it is missing.
   *
   * @param persistedState State read from storage.
   * @param version Version the persisted state was written with.
   * @returns The migrated state.
   */
  migrate(persistedState, version) {
    const state = persistedState as any;
    // Work on a deep copy so the persisted object is left untouched.
    const newState = JSON.parse(
      JSON.stringify(state),
    ) as typeof DEFAULT_CHAT_STATE;

    if (version < 2) {
      newState.sessions = [];
      for (const oldSession of state.sessions) {
        const rebuilt = createEmptySession();
        rebuilt.appId = oldSession.appId;
        rebuilt.topic = oldSession.topic;
        rebuilt.messages = [...oldSession.messages];

        const rebuiltConfig = rebuilt.mask.modelConfig;
        rebuiltConfig.sendMemory = true;
        rebuiltConfig.historyMessageCount = 4;
        rebuiltConfig.compressMessageLengthThreshold = 1000;

        newState.sessions.push(rebuilt);
      }
    }

    if (version < 3) {
      // migrate id to nanoid
      for (const s of newState.sessions) {
        s.id = nanoid();
        for (const m of s.messages) {
          m.id = nanoid();
        }
      }
    }

    // Enable `enableInjectSystemPrompts` attribute for old sessions.
    // Resolve issue of old sessions not automatically enabling.
    if (version < 3.1) {
      for (const s of newState.sessions) {
        // Exclude those already set by user
        if (s.mask.modelConfig.hasOwnProperty("enableInjectSystemPrompts")) {
          continue;
        }
        // Because users may have changed this configuration,
        // the user's current configuration is used instead of the default
        const config = useAppConfig.getState();
        s.mask.modelConfig.enableInjectSystemPrompts =
          config.modelConfig.enableInjectSystemPrompts;
      }
    }

    return newState as any;
  },
  656. },
  657. );