chat.ts 21 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721
  1. import { trimTopic, getMessageTextContent } from "../utils";
  2. import Locale, { getLang } from "../locales";
  3. import { showToast } from "../components/ui-lib";
  4. import { ModelConfig, ModelType, useAppConfig } from "./config";
  5. import { createEmptyMask, Mask } from "./mask";
  6. import {
  7. DEFAULT_INPUT_TEMPLATE,
  8. DEFAULT_MODELS,
  9. DEFAULT_SYSTEM_TEMPLATE,
  10. KnowledgeCutOffDate,
  11. ModelProvider,
  12. StoreKey,
  13. SUMMARIZE_MODEL,
  14. GEMINI_SUMMARIZE_MODEL,
  15. } from "../constant";
  16. import { ClientApi, RequestMessage, MultimodalContent } from "../client/api";
  17. import { ChatControllerPool } from "../client/controller";
  18. import { prettyObject } from "../utils/format";
  19. import { estimateTokenLength } from "../utils/token";
  20. import { nanoid } from "nanoid";
  21. import { createPersistStore } from "../utils/store";
  22. import { identifyDefaultClaudeModel } from "../utils/checkers";
  /**
   * A message as stored in a chat session: the wire-level `RequestMessage`
   * extended with the bookkeeping fields this store maintains.
   */
  export type ChatMessage = RequestMessage & {
    /** Unique identifier of the message. */
    id: string;
    /** Creation time, stored as a display string. */
    date: string;
    /** Model associated with the message, when known. */
    model?: ModelType;
    /** True while a reply is still being streamed in. */
    streaming?: boolean;
    /** True when the request behind this message failed. */
    isError?: boolean;
  };
  /**
   * Builds a chat message from defaults (fresh id, current local time,
   * role "user", empty content) and applies `override` on top of them.
   *
   * @param override Fields that replace the defaults.
   * @returns The assembled message.
   */
  export function createMessage(override: Partial<ChatMessage>): ChatMessage {
    const defaults: ChatMessage = {
      id: nanoid(),
      date: new Date().toLocaleString(),
      role: "user",
      content: "",
    };
    return Object.assign(defaults, override);
  }
  /** Running size counters kept for each session. */
  export interface ChatStat {
    /** Number of characters counted so far. */
    charCount: number;
    /** Number of words counted so far. */
    wordCount: number;
    /** Number of tokens counted so far. */
    tokenCount: number;
  }
  /** One conversation: its messages plus the settings and memory attached to it. */
  export interface ChatSession {
    /** Unique identifier of the session. */
    id: string;
    /** Title of the conversation. */
    topic: string;
    /** Mask (preset prompts and model configuration) used by the session. */
    mask: Mask;
    /** Messages of the conversation, oldest first. */
    messages: ChatMessage[];
    /** Summary of earlier messages, sent as long-term memory. */
    memoryPrompt: string;
    /** Length of `messages` at the time of the last summary. */
    lastSummarizeIndex: number;
    /** Messages before this index are excluded from the request context. */
    clearContextIndex?: number;
    /** Size counters of the session. */
    stat: ChatStat;
    /** Timestamp (ms since epoch) of the last update. */
    lastUpdate: number;
  }
  /** Topic given to a session until one is generated or set. */
  export const DEFAULT_TOPIC = Locale.Store.DefaultTopic;

  /** Localized assistant greeting message. */
  export const BOT_HELLO: ChatMessage = createMessage({
    content: Locale.Store.BotHello,
    role: "assistant",
  });
  /**
   * Creates a blank session: fresh id, default topic, no messages, zeroed
   * counters, no memory and an empty mask.
   */
  function createEmptySession(): ChatSession {
    const session: ChatSession = {
      id: nanoid(),
      topic: DEFAULT_TOPIC,
      memoryPrompt: "",
      messages: [],
      stat: { tokenCount: 0, wordCount: 0, charCount: 0 },
      lastUpdate: Date.now(),
      lastSummarizeIndex: 0,
      mask: createEmptyMask(),
    };
    return session;
  }
  /**
   * Picks the model used for summarizing.
   *
   * Models whose name starts with "gpt" use `SUMMARIZE_MODEL`, models whose
   * name starts with "gemini-pro" use `GEMINI_SUMMARIZE_MODEL`, and every
   * other model summarizes with itself.
   */
  function getSummarizeModel(currentModel: string) {
    const isGpt = currentModel.startsWith("gpt");
    const isGeminiPro = currentModel.startsWith("gemini-pro");
    return isGpt
      ? SUMMARIZE_MODEL
      : isGeminiPro
        ? GEMINI_SUMMARIZE_MODEL
        : currentModel;
  }
  /**
   * Sums the estimated token length of the text content of `msgs`.
   *
   * @returns The total estimate, or 0 for an empty list.
   */
  function countMessages(msgs: ChatMessage[]) {
    let total = 0;
    for (const msg of msgs) {
      total += estimateTokenLength(getMessageTextContent(msg));
    }
    return total;
  }
  /**
   * Expands the input template of `modelConfig` with runtime values.
   *
   * Supported placeholders: `{{ServiceProvider}}`, `{{cutoff}}`, `{{model}}`,
   * `{{time}}`, `{{lang}}` and `{{input}}`. When the template has no
   * `{{input}}` placeholder, one is appended on a new line. When `input`
   * already starts with the template, the template is dropped so it is not
   * applied twice.
   *
   * Values are inserted literally: `$`-sequences in the user's input
   * (`$&`, `$$`, `$1`, ...) are NOT treated as replacement patterns.
   *
   * @param input User text to insert at `{{input}}`.
   * @param modelConfig Supplies the model name and, optionally, the template.
   * @returns The expanded text.
   */
  function fillTemplateWith(input: string, modelConfig: ModelConfig) {
    const cutoff =
      KnowledgeCutOffDate[modelConfig.model] ?? KnowledgeCutOffDate.default;

    // Use the provider of the matching default model; fall back to "OpenAI".
    // TODO: auto detect the providerName from the modelConfig.model
    const modelInfo = DEFAULT_MODELS.find((m) => m.name === modelConfig.model);
    const serviceProvider = modelInfo?.provider?.providerName ?? "OpenAI";

    // `input` is deliberately last: placeholders that appear inside the
    // user's text must not be expanded by an earlier substitution.
    const vars = {
      ServiceProvider: serviceProvider,
      cutoff,
      model: modelConfig.model,
      time: new Date().toString(),
      lang: getLang(),
      input: input,
    };

    let output = modelConfig.template ?? DEFAULT_INPUT_TEMPLATE;

    // remove duplicate
    if (input.startsWith(output)) {
      output = "";
    }

    // must contain {{input}}
    const inputVar = "{{input}}";
    if (!output.includes(inputVar)) {
      output += "\n" + inputVar;
    }

    for (const [name, value] of Object.entries(vars)) {
      // split/join substitutes every occurrence literally; String.replace
      // with a string replacement would interpret "$&", "$$", etc. in value.
      output = output.split(`{{${name}}}`).join(String(value));
    }

    return output;
  }
  /** Initial store contents: a single empty session, selected. */
  const initialSessions: ChatSession[] = [createEmptySession()];
  const DEFAULT_CHAT_STATE = {
    sessions: initialSessions,
    currentSessionIndex: 0,
  };
  131. export const useChatStore = createPersistStore(
  132. DEFAULT_CHAT_STATE,
  133. (set, _get) => {
  /**
   * Returns the current store state merged with the action methods, so the
   * methods can reach both state and one another through a single accessor.
   */
  function get() {
    const state = _get();
    return { ...state, ...methods };
  }
  140. const methods = {
  /** Replaces all sessions with a single empty one and selects it. */
  clearSessions() {
    set(() => {
      const freshSessions = [createEmptySession()];
      return { sessions: freshSessions, currentSessionIndex: 0 };
    });
  },
  /** Makes the session at `index` the current one. */
  selectSession(index: number) {
    const selection = { currentSessionIndex: index };
    set(selection);
  },
  /**
   * Moves the session at position `from` to position `to` and adjusts the
   * current index so it keeps pointing at the same session.
   */
  moveSession(from: number, to: number) {
    set((state) => {
      const oldIndex = state.currentSessionIndex;

      // Work on a copy; take the entry out and re-insert it at the target.
      const reordered = Array.from(state.sessions);
      const moved = reordered[from];
      reordered.splice(from, 1);
      reordered.splice(to, 0, moved);

      // The current session either is the moved one, or shifts by one slot
      // when the move crosses over it; otherwise it stays where it was.
      let newIndex = oldIndex;
      if (oldIndex === from) {
        newIndex = to;
      } else if (from < oldIndex && oldIndex <= to) {
        newIndex = oldIndex - 1;
      } else if (to <= oldIndex && oldIndex < from) {
        newIndex = oldIndex + 1;
      }

      return {
        currentSessionIndex: newIndex,
        sessions: reordered,
      };
    });
  },
  /**
   * Creates a session, puts it first in the list and selects it.
   *
   * @param mask Optional mask; its model configuration is layered over the
   *   global one and its name becomes the session topic.
   */
  newSession(mask?: Mask) {
    const session = createEmptySession();

    if (mask) {
      const { modelConfig: globalModelConfig } = useAppConfig.getState();
      const mergedModelConfig = {
        ...globalModelConfig,
        ...mask.modelConfig,
      };
      session.mask = { ...mask, modelConfig: mergedModelConfig };
      session.topic = mask.name;
    }

    set((state) => ({
      currentSessionIndex: 0,
      sessions: [session, ...state.sessions],
    }));
  },
  /**
   * Selects the session `delta` positions away from the current one,
   * wrapping around at both ends of the list.
   *
   * @param delta Signed step; any magnitude is accepted.
   */
  nextSession(delta: number) {
    const { sessions, currentSessionIndex } = get();
    const n = sessions.length;
    // Nothing to select; also avoids a NaN index from `% 0`.
    if (n === 0) return;
    // True modulo: JavaScript's `%` keeps the sign of the dividend, so a
    // single `(x + n) % n` would go negative for delta < -n.
    const wrapped = (((currentSessionIndex + delta) % n) + n) % n;
    get().selectSession(wrapped);
  },
  /**
   * Removes the session at `index` and shows a toast offering to undo.
   *
   * Does nothing when no session exists at `index`. When the only session is
   * deleted, an empty one takes its place.
   */
  deleteSession(index: number) {
    const before = get();
    const wasOnlySession = before.sessions.length === 1;

    const target = before.sessions.at(index);
    if (!target) return;

    // Snapshot for the undo action, taken before anything changes.
    const restoreState = {
      currentSessionIndex: before.currentSessionIndex,
      sessions: before.sessions.slice(),
    };

    const remaining = before.sessions.slice();
    remaining.splice(index, 1);

    // Deleting an entry in front of the current one shifts it down by one;
    // the result is also capped at the new last position.
    const currentIndex = before.currentSessionIndex;
    const shift = index < currentIndex ? 1 : 0;
    let nextIndex = Math.min(currentIndex - shift, remaining.length - 1);

    if (wasOnlySession) {
      nextIndex = 0;
      remaining.push(createEmptySession());
    }

    set(() => ({
      currentSessionIndex: nextIndex,
      sessions: remaining,
    }));

    const undoAction = {
      text: Locale.Home.Revert,
      onClick() {
        set(() => restoreState);
      },
    };
    showToast(Locale.Home.DeleteToast, undoAction, 5000);
  },
  /**
   * Returns the currently selected session.
   *
   * An out-of-range selection index is clamped into the list and the
   * corrected value is written back to the store.
   */
  currentSession() {
    const { sessions } = get();
    let index = get().currentSessionIndex;

    const outOfRange = index < 0 || index >= sessions.length;
    if (outOfRange) {
      index = Math.min(sessions.length - 1, Math.max(0, index));
      set(() => ({ currentSessionIndex: index }));
    }

    return sessions[index];
  },
  /**
   * Bookkeeping after a message has been completed: refreshes the current
   * session, updates its statistics and triggers summarization.
   */
  onNewMessage(message: ChatMessage) {
    const touch = (session: ChatSession) => {
      // New array instance so the message list is seen as changed.
      session.messages = session.messages.slice();
      session.lastUpdate = Date.now();
    };

    get().updateCurrentSession(touch);
    get().updateStat(message);
    get().summarizeSession();
  },
  /**
   * Sends the user's input to the model of the current session and streams
   * the reply into a new assistant message.
   *
   * @param content Raw text typed by the user; the input template is applied.
   * @param attachImages Optional image URLs sent along as multimodal parts.
   */
  async onUserInput(content: string, attachImages?: string[]) {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;

    const userContent = fillTemplateWith(content, modelConfig);
    console.log("[User Input] after template: ", userContent);

    // Plain text by default; a text part followed by one part per image
    // when images are attached.
    let mContent: string | MultimodalContent[] = userContent;
    if (attachImages && attachImages.length > 0) {
      const textPart: MultimodalContent = { type: "text", text: userContent };
      const imageParts = attachImages.map(
        (url): MultimodalContent => ({
          type: "image_url",
          image_url: { url: url },
        }),
      );
      mContent = [textPart, ...imageParts];
    }

    const userMessage: ChatMessage = createMessage({
      role: "user",
      content: mContent,
    });
    const botMessage: ChatMessage = createMessage({
      role: "assistant",
      streaming: true,
      model: modelConfig.model,
    });

    // Context is collected BEFORE the new messages are stored, so the new
    // user message is appended to it exactly once.
    const recentMessages = get().getMessagesWithMemory();
    const sendMessages = recentMessages.concat(userMessage);
    const messageIndex = get().currentSession().messages.length + 1;

    // Store the user's message (as a copy) and the pending bot message.
    get().updateCurrentSession((session) => {
      const savedUserMessage = { ...userMessage, content: mContent };
      session.messages = session.messages.concat([savedUserMessage, botMessage]);
    });

    // Pick the client that matches the configured model.
    let provider = ModelProvider.GPT;
    if (modelConfig.model.startsWith("gemini")) {
      provider = ModelProvider.GeminiPro;
    } else if (identifyDefaultClaudeModel(modelConfig.model)) {
      provider = ModelProvider.Claude;
    }
    const api = new ClientApi(provider);

    // Re-assigns the message array so in-place edits of botMessage are seen.
    const refreshMessages = () => {
      get().updateCurrentSession((session) => {
        session.messages = session.messages.concat();
      });
    };

    // make request
    api.llm.chat({
      messages: sendMessages,
      config: { ...modelConfig, stream: true },
      onUpdate(message) {
        botMessage.streaming = true;
        if (message) {
          botMessage.content = message;
        }
        refreshMessages();
      },
      onFinish(message) {
        botMessage.streaming = false;
        if (message) {
          botMessage.content = message;
          get().onNewMessage(botMessage);
        }
        ChatControllerPool.remove(session.id, botMessage.id);
      },
      onError(error) {
        // An abort is not flagged as an error.
        const isAborted = error.message.includes("aborted");
        const errorReport = prettyObject({
          error: true,
          message: error.message,
        });
        botMessage.content += "\n\n" + errorReport;
        botMessage.streaming = false;
        userMessage.isError = !isAborted;
        botMessage.isError = !isAborted;
        refreshMessages();
        ChatControllerPool.remove(session.id, botMessage.id ?? messageIndex);

        console.error("[Chat] failed ", error);
      },
      onController(controller) {
        // collect controller for stop/retry
        ChatControllerPool.addController(
          session.id,
          botMessage.id ?? messageIndex,
          controller,
        );
      },
    });
  },
  /**
   * Wraps the current session's memory summary in a system message.
   * The content is empty when the session has no memory yet.
   */
  getMemoryPrompt() {
    const { memoryPrompt } = get().currentSession();
    const content =
      memoryPrompt.length > 0 ? Locale.Store.Prompt.History(memoryPrompt) : "";

    return {
      role: "system",
      content,
      date: "",
    } as ChatMessage;
  },
  /**
   * Assembles the context sent with a request, in this order:
   *   0. system prompt (only for "gpt-" models with injection enabled)
   *   1. long term memory: the summary of earlier messages
   *   2. the mask's pre-defined in-context prompts
   *   3. short term memory: the most recent messages
   * The newest user input is appended by the caller.
   */
  getMessagesWithMemory() {
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;
    const clearContextIndex = session.clearContextIndex ?? 0;
    const messages = session.messages.slice();
    const totalMessageCount = session.messages.length;

    // in-context prompts
    const contextPrompts = session.mask.context.slice();

    // system prompts, to get close to OpenAI Web ChatGPT
    const shouldInjectSystemPrompts =
      modelConfig.enableInjectSystemPrompts &&
      session.mask.modelConfig.model.startsWith("gpt-");

    const systemPrompts: ChatMessage[] = [];
    if (shouldInjectSystemPrompts) {
      systemPrompts.push(
        createMessage({
          role: "system",
          content: fillTemplateWith("", {
            ...modelConfig,
            template: DEFAULT_SYSTEM_TEMPLATE,
          }),
        }),
      );
      console.log(
        "[Global System Prompt] ",
        systemPrompts.at(0)?.content ?? "empty",
      );
    }

    // long term memory: only when enabled, present, and newer than the
    // point where the user cleared the context
    const hasMemory = session.memoryPrompt && session.memoryPrompt.length > 0;
    const shouldSendLongTermMemory =
      modelConfig.sendMemory &&
      hasMemory &&
      session.lastSummarizeIndex > clearContextIndex;
    const longTermMemoryPrompts = shouldSendLongTermMemory
      ? [get().getMemoryPrompt()]
      : [];

    // short term memory: the latest `historyMessageCount` messages
    const shortTermMemoryStartIndex = Math.max(
      0,
      totalMessageCount - modelConfig.historyMessageCount,
    );

    // With a summary in play, start from whichever point is earlier.
    let memoryStartIndex = shortTermMemoryStartIndex;
    if (shouldSendLongTermMemory) {
      memoryStartIndex = Math.min(
        session.lastSummarizeIndex,
        shortTermMemoryStartIndex,
      );
    }

    // and if user has cleared history messages, we should exclude the memory too.
    const contextStartIndex = Math.max(clearContextIndex, memoryStartIndex);
    const maxTokenThreshold = modelConfig.max_tokens;

    // Walk backwards from the newest message, collecting as many as fit
    // under the token threshold; failed messages are skipped.
    const recentWindow: ChatMessage[] = [];
    let tokenCount = 0;
    let i = totalMessageCount - 1;
    while (i >= contextStartIndex && tokenCount < maxTokenThreshold) {
      const msg = messages[i];
      i -= 1;
      if (!msg || msg.isError) continue;
      tokenCount += estimateTokenLength(getMessageTextContent(msg));
      // Prepending keeps the window in chronological order.
      recentWindow.unshift(msg);
    }

    // concat all messages
    return [
      ...systemPrompts,
      ...longTermMemoryPrompts,
      ...contextPrompts,
      ...recentWindow,
    ];
  },
  /**
   * Applies `updater` to one message and writes the session list back.
   *
   * `updater` receives `undefined` when the session or the message does not
   * exist.
   */
  updateMessage(
    sessionIndex: number,
    messageIndex: number,
    updater: (message?: ChatMessage) => void,
  ) {
    const { sessions } = get();
    const target = sessions.at(sessionIndex)?.messages?.at(messageIndex);
    updater(target);
    set(() => ({ sessions }));
  },
  /**
   * Empties the current session: removes all messages and the memory
   * summary, and resets the indices that pointed into the old message list.
   */
  resetSession() {
    get().updateCurrentSession((session) => {
      session.messages = [];
      session.memoryPrompt = "";
      // Both indices refer to positions in the message list that was just
      // cleared. Left stale, they would keep new messages out of the request
      // context and out of summaries until the list grew past them.
      session.lastSummarizeIndex = 0;
      session.clearContextIndex = undefined;
    });
  },
  /**
   * Maintains the derived data of the current session:
   *   - generates a topic once enough has been said and the topic is still
   *     the default (when auto-titles are enabled);
   *   - compresses not-yet-summarized messages into the memory prompt once
   *     they exceed the configured length threshold (when memory is enabled).
   */
  summarizeSession() {
    const config = useAppConfig.getState();
    const session = get().currentSession();
    const modelConfig = session.mask.modelConfig;

    // Pick the client that matches the configured model.
    let api: ClientApi;
    if (modelConfig.model.startsWith("gemini")) {
      api = new ClientApi(ModelProvider.GeminiPro);
    } else if (identifyDefaultClaudeModel(modelConfig.model)) {
      api = new ClientApi(ModelProvider.Claude);
    } else {
      api = new ClientApi(ModelProvider.GPT);
    }

    const messages = session.messages;

    // should summarize topic after chatting more than 50 words
    const SUMMARIZE_MIN_LEN = 50;
    if (
      config.enableAutoGenerateTitle &&
      session.topic === DEFAULT_TOPIC &&
      countMessages(messages) >= SUMMARIZE_MIN_LEN
    ) {
      const topicMessages = messages.concat(
        createMessage({
          role: "user",
          content: Locale.Store.Prompt.Topic,
        }),
      );
      api.llm.chat({
        messages: topicMessages,
        config: {
          model: getSummarizeModel(session.mask.modelConfig.model),
          stream: false,
        },
        onFinish(message) {
          get().updateCurrentSession(
            (session) =>
              (session.topic =
                message.length > 0 ? trimTopic(message) : DEFAULT_TOPIC),
          );
        },
      });
    }

    // Everything after the last summary / context clear is still pending.
    const summarizeIndex = Math.max(
      session.lastSummarizeIndex,
      session.clearContextIndex ?? 0,
    );
    // Slice first, then drop failed messages: `summarizeIndex` is a position
    // in the unfiltered list, so filtering first would shift the indices and
    // silently skip valid messages.
    let toBeSummarizedMsgs = messages
      .slice(summarizeIndex)
      .filter((msg) => !msg.isError);

    const historyMsgLength = countMessages(toBeSummarizedMsgs);

    // Parentheses are required: `a > b ?? c` parses as `(a > b) ?? c`,
    // which would make the 4000 default unreachable.
    if (historyMsgLength > (modelConfig.max_tokens ?? 4000)) {
      const n = toBeSummarizedMsgs.length;
      toBeSummarizedMsgs = toBeSummarizedMsgs.slice(
        Math.max(0, n - modelConfig.historyMessageCount),
      );
    }

    // add memory prompt
    toBeSummarizedMsgs.unshift(get().getMemoryPrompt());

    const lastSummarizeIndex = session.messages.length;

    console.log(
      "[Chat History] ",
      toBeSummarizedMsgs,
      historyMsgLength,
      modelConfig.compressMessageLengthThreshold,
    );

    if (
      historyMsgLength > modelConfig.compressMessageLengthThreshold &&
      modelConfig.sendMemory
    ) {
      // max_tokens is deliberately left out of the summarize request config.
      const { max_tokens, ...modelcfg } = modelConfig;
      api.llm.chat({
        messages: toBeSummarizedMsgs.concat(
          createMessage({
            role: "system",
            content: Locale.Store.Prompt.Summarize,
            date: "",
          }),
        ),
        config: {
          ...modelcfg,
          stream: true,
          model: getSummarizeModel(session.mask.modelConfig.model),
        },
        onUpdate(message) {
          session.memoryPrompt = message;
        },
        onFinish(message) {
          console.log("[Memory] ", message);
          get().updateCurrentSession((session) => {
            session.lastSummarizeIndex = lastSummarizeIndex;
            // Written through the store so the summary is persisted.
            session.memoryPrompt = message;
          });
        },
        onError(err) {
          console.error("[Summarize] ", err);
        },
      });
    }
  },
  /**
   * Adds the text length of `message` to the current session's character
   * count.
   */
  updateStat(message: ChatMessage) {
    get().updateCurrentSession((session) => {
      // Content may be an array of multimodal parts, whose `.length` is the
      // number of parts rather than characters; measure the text instead.
      session.stat.charCount += getMessageTextContent(message).length;
      // TODO: should update chat count and word count
    });
  },
  /**
   * Lets `updater` mutate the currently selected session in place, then
   * writes the session list back to the store.
   */
  updateCurrentSession(updater: (session: ChatSession) => void) {
    const { sessions, currentSessionIndex } = get();
    updater(sessions[currentSessionIndex]);
    set(() => ({ sessions }));
  },
  /** Clears everything in `localStorage` and reloads the page. */
  clearAllData() {
    // Clear first: the reload then starts from empty storage.
    localStorage.clear();
    location.reload();
  },
  582. };
  583. return methods;
  584. },
  585. {
  586. name: StoreKey.Chat,
  587. version: 3.1,
  /**
   * Upgrades persisted state written by an older store version.
   *
   * - before 2: sessions are rebuilt from their topic and messages, with
   *   memory settings filled in;
   * - before 3: sessions and messages receive new nanoid identifiers;
   * - before 3.1: sessions without `enableInjectSystemPrompts` inherit the
   *   user's current global setting.
   *
   * @param persistedState State as read from storage.
   * @param version Version the state was written with.
   * @returns The upgraded state; the input object is not modified.
   */
  migrate(persistedState, version) {
    const state = persistedState as any;
    // Deep copy so the persisted object itself stays untouched.
    const newState = JSON.parse(
      JSON.stringify(state),
    ) as typeof DEFAULT_CHAT_STATE;

    if (version < 2) {
      const rebuilt: ChatSession[] = [];
      for (const legacy of state.sessions) {
        const upgraded = createEmptySession();
        upgraded.topic = legacy.topic;
        upgraded.messages = [...legacy.messages];

        const upgradedConfig = upgraded.mask.modelConfig;
        upgradedConfig.sendMemory = true;
        upgradedConfig.historyMessageCount = 4;
        upgradedConfig.compressMessageLengthThreshold = 1000;

        rebuilt.push(upgraded);
      }
      newState.sessions = rebuilt;
    }

    if (version < 3) {
      // migrate id to nanoid
      for (const s of newState.sessions) {
        s.id = nanoid();
        for (const m of s.messages) {
          m.id = nanoid();
        }
      }
    }

    // Enable `enableInjectSystemPrompts` attribute for old sessions.
    // Resolve issue of old sessions not automatically enabling.
    if (version < 3.1) {
      for (const s of newState.sessions) {
        // Exclude those already set by user
        const alreadySet = Object.prototype.hasOwnProperty.call(
          s.mask.modelConfig,
          "enableInjectSystemPrompts",
        );
        if (alreadySet) continue;

        // Because users may have changed this configuration,
        // the user's current configuration is used instead of the default
        const config = useAppConfig.getState();
        s.mask.modelConfig.enableInjectSystemPrompts =
          config.modelConfig.enableInjectSystemPrompts;
      }
    }

    return newState as any;
  },
  631. },
  632. );