Spaces:
Running
Running
import { getStringHash, debounce, waitUntilCondition, extractAllWords, isTrueBoolean } from '../../utils.js'; | |
import { getContext, getApiUrl, extension_settings, doExtrasFetch, modules, renderExtensionTemplateAsync } from '../../extensions.js'; | |
import { | |
activateSendButtons, | |
deactivateSendButtons, | |
animation_duration, | |
eventSource, | |
event_types, | |
extension_prompt_roles, | |
extension_prompt_types, | |
generateQuietPrompt, | |
is_send_press, | |
saveSettingsDebounced, | |
substituteParamsExtended, | |
generateRaw, | |
getMaxContextSize, | |
setExtensionPrompt, | |
} from '../../../script.js'; | |
import { is_group_generating, selected_group } from '../../group-chats.js'; | |
import { loadMovingUIState } from '../../power-user.js'; | |
import { dragElement } from '../../RossAscends-mods.js'; | |
import { getTextTokens, getTokenCountAsync, tokenizers } from '../../tokenizers.js'; | |
import { debounce_timeout } from '../../constants.js'; | |
import { SlashCommandParser } from '../../slash-commands/SlashCommandParser.js'; | |
import { SlashCommand } from '../../slash-commands/SlashCommand.js'; | |
import { ARGUMENT_TYPE, SlashCommandArgument, SlashCommandNamedArgument } from '../../slash-commands/SlashCommandArgument.js'; | |
import { MacrosParser } from '../../macros.js'; | |
import { countWebLlmTokens, generateWebLlmChatPrompt, getWebLlmContextSize, isWebLlmSupported } from '../shared.js'; | |
import { commonEnumProviders } from '../../slash-commands/SlashCommandCommonEnumsProvider.js'; | |
export { MODULE_NAME }; | |
const MODULE_NAME = '1_memory'; | |
let lastCharacterId = null; | |
let lastGroupId = null; | |
let lastChatId = null; | |
let lastMessageHash = null; | |
let lastMessageId = null; | |
let inApiCall = false; | |
/** | |
* Count the number of tokens in the provided text. | |
* @param {string} text Text to count tokens for | |
* @param {number} padding Number of additional tokens to add to the count | |
* @returns {Promise<number>} Number of tokens in the text | |
*/ | |
async function countSourceTokens(text, padding = 0) { | |
if (extension_settings.memory.source === summary_sources.webllm) { | |
const count = await countWebLlmTokens(text); | |
return count + padding; | |
} | |
if (extension_settings.memory.source === summary_sources.extras) { | |
const count = getTextTokens(tokenizers.GPT2, text).length; | |
return count + padding; | |
} | |
return await getTokenCountAsync(text, padding); | |
} | |
async function getSourceContextSize() { | |
const overrideLength = extension_settings.memory.overrideResponseLength; | |
if (extension_settings.memory.source === summary_sources.webllm) { | |
const maxContext = await getWebLlmContextSize(); | |
return overrideLength > 0 ? (maxContext - overrideLength) : Math.round(maxContext * 0.75); | |
} | |
if (extension_settings.source === summary_sources.extras) { | |
return 1024 - 64; | |
} | |
return getMaxContextSize(overrideLength); | |
} | |
const formatMemoryValue = function (value) { | |
if (!value) { | |
return ''; | |
} | |
value = value.trim(); | |
if (extension_settings.memory.template) { | |
return substituteParamsExtended(extension_settings.memory.template, { summary: value }); | |
} else { | |
return `Summary: ${value}`; | |
} | |
}; | |
const saveChatDebounced = debounce(() => getContext().saveChat(), debounce_timeout.relaxed); | |
const summary_sources = { | |
'extras': 'extras', | |
'main': 'main', | |
'webllm': 'webllm', | |
}; | |
const prompt_builders = { | |
DEFAULT: 0, | |
RAW_BLOCKING: 1, | |
RAW_NON_BLOCKING: 2, | |
}; | |
const defaultPrompt = '[Pause your roleplay. Summarize the most important facts and events in the story so far. If a summary already exists in your memory, use that as a base and expand with new facts. Limit the summary to {{words}} words or less. Your response should include nothing but the summary.]'; | |
const defaultTemplate = '[Summary: {{summary}}]'; | |
const defaultSettings = { | |
memoryFrozen: false, | |
SkipWIAN: false, | |
source: summary_sources.extras, | |
prompt: defaultPrompt, | |
template: defaultTemplate, | |
position: extension_prompt_types.IN_PROMPT, | |
role: extension_prompt_roles.SYSTEM, | |
scan: false, | |
depth: 2, | |
promptWords: 200, | |
promptMinWords: 25, | |
promptMaxWords: 1000, | |
promptWordsStep: 25, | |
promptInterval: 10, | |
promptMinInterval: 0, | |
promptMaxInterval: 250, | |
promptIntervalStep: 1, | |
promptForceWords: 0, | |
promptForceWordsStep: 100, | |
promptMinForceWords: 0, | |
promptMaxForceWords: 10000, | |
overrideResponseLength: 0, | |
overrideResponseLengthMin: 0, | |
overrideResponseLengthMax: 4096, | |
overrideResponseLengthStep: 16, | |
maxMessagesPerRequest: 0, | |
maxMessagesPerRequestMin: 0, | |
maxMessagesPerRequestMax: 250, | |
maxMessagesPerRequestStep: 1, | |
prompt_builder: prompt_builders.DEFAULT, | |
}; | |
function loadSettings() { | |
if (Object.keys(extension_settings.memory).length === 0) { | |
Object.assign(extension_settings.memory, defaultSettings); | |
} | |
for (const key of Object.keys(defaultSettings)) { | |
if (extension_settings.memory[key] === undefined) { | |
extension_settings.memory[key] = defaultSettings[key]; | |
} | |
} | |
$('#summary_source').val(extension_settings.memory.source).trigger('change'); | |
$('#memory_frozen').prop('checked', extension_settings.memory.memoryFrozen).trigger('input'); | |
$('#memory_skipWIAN').prop('checked', extension_settings.memory.SkipWIAN).trigger('input'); | |
$('#memory_prompt').val(extension_settings.memory.prompt).trigger('input'); | |
$('#memory_prompt_words').val(extension_settings.memory.promptWords).trigger('input'); | |
$('#memory_prompt_interval').val(extension_settings.memory.promptInterval).trigger('input'); | |
$('#memory_template').val(extension_settings.memory.template).trigger('input'); | |
$('#memory_depth').val(extension_settings.memory.depth).trigger('input'); | |
$('#memory_role').val(extension_settings.memory.role).trigger('input'); | |
$(`input[name="memory_position"][value="${extension_settings.memory.position}"]`).prop('checked', true).trigger('input'); | |
$('#memory_prompt_words_force').val(extension_settings.memory.promptForceWords).trigger('input'); | |
$(`input[name="memory_prompt_builder"][value="${extension_settings.memory.prompt_builder}"]`).prop('checked', true).trigger('input'); | |
$('#memory_override_response_length').val(extension_settings.memory.overrideResponseLength).trigger('input'); | |
$('#memory_max_messages_per_request').val(extension_settings.memory.maxMessagesPerRequest).trigger('input'); | |
$('#memory_include_wi_scan').prop('checked', extension_settings.memory.scan).trigger('input'); | |
switchSourceControls(extension_settings.memory.source); | |
} | |
async function onPromptForceWordsAutoClick() { | |
const context = getContext(); | |
const maxPromptLength = await getSourceContextSize(); | |
const chat = context.chat; | |
const allMessages = chat.filter(m => !m.is_system && m.mes).map(m => m.mes); | |
const messagesWordCount = allMessages.map(m => extractAllWords(m)).flat().length; | |
const averageMessageWordCount = messagesWordCount / allMessages.length; | |
const tokensPerWord = await countSourceTokens(allMessages.join('\n')) / messagesWordCount; | |
const wordsPerToken = 1 / tokensPerWord; | |
const maxPromptLengthWords = Math.round(maxPromptLength * wordsPerToken); | |
// How many words should pass so that messages will start be dropped out of context; | |
const wordsPerPrompt = Math.floor(maxPromptLength / tokensPerWord); | |
// How many words will be needed to fit the allowance buffer | |
const summaryPromptWords = extractAllWords(extension_settings.memory.prompt).length; | |
const promptAllowanceWords = maxPromptLengthWords - extension_settings.memory.promptWords - summaryPromptWords; | |
const averageMessagesPerPrompt = Math.floor(promptAllowanceWords / averageMessageWordCount); | |
const maxMessagesPerSummary = extension_settings.memory.maxMessagesPerRequest || 0; | |
const targetMessagesInPrompt = maxMessagesPerSummary > 0 ? maxMessagesPerSummary : Math.max(0, averageMessagesPerPrompt); | |
const targetSummaryWords = (targetMessagesInPrompt * averageMessageWordCount) + (promptAllowanceWords / 4); | |
console.table({ | |
maxPromptLength, | |
maxPromptLengthWords, | |
promptAllowanceWords, | |
averageMessagesPerPrompt, | |
targetMessagesInPrompt, | |
targetSummaryWords, | |
wordsPerPrompt, | |
wordsPerToken, | |
tokensPerWord, | |
messagesWordCount, | |
}); | |
const ROUNDING = 100; | |
extension_settings.memory.promptForceWords = Math.max(1, Math.floor(targetSummaryWords / ROUNDING) * ROUNDING); | |
$('#memory_prompt_words_force').val(extension_settings.memory.promptForceWords).trigger('input'); | |
} | |
async function onPromptIntervalAutoClick() { | |
const context = getContext(); | |
const maxPromptLength = await getSourceContextSize(); | |
const chat = context.chat; | |
const allMessages = chat.filter(m => !m.is_system && m.mes).map(m => m.mes); | |
const messagesWordCount = allMessages.map(m => extractAllWords(m)).flat().length; | |
const messagesTokenCount = await countSourceTokens(allMessages.join('\n')); | |
const tokensPerWord = messagesTokenCount / messagesWordCount; | |
const averageMessageTokenCount = messagesTokenCount / allMessages.length; | |
const targetSummaryTokens = Math.round(extension_settings.memory.promptWords * tokensPerWord); | |
const promptTokens = await countSourceTokens(extension_settings.memory.prompt); | |
const promptAllowance = maxPromptLength - promptTokens - targetSummaryTokens; | |
const maxMessagesPerSummary = extension_settings.memory.maxMessagesPerRequest || 0; | |
const averageMessagesPerPrompt = Math.floor(promptAllowance / averageMessageTokenCount); | |
const targetMessagesInPrompt = maxMessagesPerSummary > 0 ? maxMessagesPerSummary : Math.max(0, averageMessagesPerPrompt); | |
const adjustedAverageMessagesPerPrompt = targetMessagesInPrompt + (averageMessagesPerPrompt - targetMessagesInPrompt) / 4; | |
console.table({ | |
maxPromptLength, | |
promptAllowance, | |
targetSummaryTokens, | |
promptTokens, | |
messagesWordCount, | |
messagesTokenCount, | |
tokensPerWord, | |
averageMessageTokenCount, | |
averageMessagesPerPrompt, | |
targetMessagesInPrompt, | |
adjustedAverageMessagesPerPrompt, | |
maxMessagesPerSummary, | |
}); | |
const ROUNDING = 5; | |
extension_settings.memory.promptInterval = Math.max(1, Math.floor(adjustedAverageMessagesPerPrompt / ROUNDING) * ROUNDING); | |
$('#memory_prompt_interval').val(extension_settings.memory.promptInterval).trigger('input'); | |
} | |
function onSummarySourceChange(event) { | |
const value = event.target.value; | |
extension_settings.memory.source = value; | |
switchSourceControls(value); | |
saveSettingsDebounced(); | |
} | |
function switchSourceControls(value) { | |
$('#memory_settings [data-summary-source]').each((_, element) => { | |
const source = element.dataset.summarySource.split(',').map(s => s.trim()); | |
$(element).toggle(source.includes(value)); | |
}); | |
} | |
function onMemoryFrozenInput() { | |
const value = Boolean($(this).prop('checked')); | |
extension_settings.memory.memoryFrozen = value; | |
saveSettingsDebounced(); | |
} | |
function onMemorySkipWIANInput() { | |
const value = Boolean($(this).prop('checked')); | |
extension_settings.memory.SkipWIAN = value; | |
saveSettingsDebounced(); | |
} | |
function onMemoryPromptWordsInput() { | |
const value = $(this).val(); | |
extension_settings.memory.promptWords = Number(value); | |
$('#memory_prompt_words_value').text(extension_settings.memory.promptWords); | |
saveSettingsDebounced(); | |
} | |
function onMemoryPromptIntervalInput() { | |
const value = $(this).val(); | |
extension_settings.memory.promptInterval = Number(value); | |
$('#memory_prompt_interval_value').text(extension_settings.memory.promptInterval); | |
saveSettingsDebounced(); | |
} | |
function onMemoryPromptRestoreClick() { | |
$('#memory_prompt').val(defaultPrompt).trigger('input'); | |
} | |
function onMemoryPromptInput() { | |
const value = $(this).val(); | |
extension_settings.memory.prompt = value; | |
saveSettingsDebounced(); | |
} | |
function onMemoryTemplateInput() { | |
const value = $(this).val(); | |
extension_settings.memory.template = value; | |
reinsertMemory(); | |
saveSettingsDebounced(); | |
} | |
function onMemoryDepthInput() { | |
const value = $(this).val(); | |
extension_settings.memory.depth = Number(value); | |
reinsertMemory(); | |
saveSettingsDebounced(); | |
} | |
function onMemoryRoleInput() { | |
const value = $(this).val(); | |
extension_settings.memory.role = Number(value); | |
reinsertMemory(); | |
saveSettingsDebounced(); | |
} | |
function onMemoryPositionChange(e) { | |
const value = e.target.value; | |
extension_settings.memory.position = value; | |
reinsertMemory(); | |
saveSettingsDebounced(); | |
} | |
function onMemoryIncludeWIScanInput() { | |
const value = !!$(this).prop('checked'); | |
extension_settings.memory.scan = value; | |
reinsertMemory(); | |
saveSettingsDebounced(); | |
} | |
function onMemoryPromptWordsForceInput() { | |
const value = $(this).val(); | |
extension_settings.memory.promptForceWords = Number(value); | |
$('#memory_prompt_words_force_value').text(extension_settings.memory.promptForceWords); | |
saveSettingsDebounced(); | |
} | |
function onOverrideResponseLengthInput() { | |
const value = $(this).val(); | |
extension_settings.memory.overrideResponseLength = Number(value); | |
$('#memory_override_response_length_value').text(extension_settings.memory.overrideResponseLength); | |
saveSettingsDebounced(); | |
} | |
function onMaxMessagesPerRequestInput() { | |
const value = $(this).val(); | |
extension_settings.memory.maxMessagesPerRequest = Number(value); | |
$('#memory_max_messages_per_request_value').text(extension_settings.memory.maxMessagesPerRequest); | |
saveSettingsDebounced(); | |
} | |
function saveLastValues() { | |
const context = getContext(); | |
lastGroupId = context.groupId; | |
lastCharacterId = context.characterId; | |
lastChatId = context.chatId; | |
lastMessageId = context.chat?.length ?? null; | |
lastMessageHash = getStringHash((context.chat.length && context.chat[context.chat.length - 1]['mes']) ?? ''); | |
} | |
function getLatestMemoryFromChat(chat) { | |
if (!Array.isArray(chat) || !chat.length) { | |
return ''; | |
} | |
const reversedChat = chat.slice().reverse(); | |
reversedChat.shift(); | |
for (let mes of reversedChat) { | |
if (mes.extra && mes.extra.memory) { | |
return mes.extra.memory; | |
} | |
} | |
return ''; | |
} | |
function getIndexOfLatestChatSummary(chat) { | |
if (!Array.isArray(chat) || !chat.length) { | |
return -1; | |
} | |
const reversedChat = chat.slice().reverse(); | |
reversedChat.shift(); | |
for (let mes of reversedChat) { | |
if (mes.extra && mes.extra.memory) { | |
return chat.indexOf(mes); | |
} | |
} | |
return -1; | |
} | |
async function onChatEvent() { | |
// Module not enabled | |
if (extension_settings.memory.source === summary_sources.extras && !modules.includes('summarize')) { | |
return; | |
} | |
// WebLLM is not supported | |
if (extension_settings.memory.source === summary_sources.webllm && !isWebLlmSupported()) { | |
return; | |
} | |
const context = getContext(); | |
const chat = context.chat; | |
// no characters or group selected | |
if (!context.groupId && context.characterId === undefined) { | |
return; | |
} | |
// Generation is in progress, summary prevented | |
if (is_send_press) { | |
return; | |
} | |
// Chat/character/group changed | |
if ((context.groupId && lastGroupId !== context.groupId) || (context.characterId !== lastCharacterId) || (context.chatId !== lastChatId)) { | |
const latestMemory = getLatestMemoryFromChat(chat); | |
setMemoryContext(latestMemory, false); | |
saveLastValues(); | |
return; | |
} | |
// Currently summarizing or frozen state - skip | |
if (inApiCall || extension_settings.memory.memoryFrozen) { | |
return; | |
} | |
// No new messages - do nothing | |
if (chat.length === 0 || (lastMessageId === chat.length && getStringHash(chat[chat.length - 1].mes) === lastMessageHash)) { | |
return; | |
} | |
// Messages has been deleted - rewrite the context with the latest available memory | |
if (chat.length < lastMessageId) { | |
const latestMemory = getLatestMemoryFromChat(chat); | |
setMemoryContext(latestMemory, false); | |
} | |
// Message has been edited / regenerated - delete the saved memory | |
if (chat.length | |
&& chat[chat.length - 1].extra | |
&& chat[chat.length - 1].extra.memory | |
&& lastMessageId === chat.length | |
&& getStringHash(chat[chat.length - 1].mes) !== lastMessageHash) { | |
delete chat[chat.length - 1].extra.memory; | |
} | |
try { | |
await summarizeChat(context); | |
} | |
catch (error) { | |
console.log(error); | |
} | |
finally { | |
saveLastValues(); | |
} | |
} | |
/** | |
* Forces a summary generation for the current chat. | |
* @param {boolean} quiet If an informational toast should be displayed | |
* @returns {Promise<string>} Summarized text | |
*/ | |
async function forceSummarizeChat(quiet) { | |
if (extension_settings.memory.source === summary_sources.extras) { | |
toastr.warning('Force summarization is not supported for Extras API'); | |
return; | |
} | |
const context = getContext(); | |
const skipWIAN = extension_settings.memory.SkipWIAN; | |
console.log(`Skipping WIAN? ${skipWIAN}`); | |
if (!context.chatId) { | |
toastr.warning('No chat selected'); | |
return ''; | |
} | |
const toast = quiet ? jQuery() : toastr.info('Summarizing chat...', 'Please wait', { timeOut: 0, extendedTimeOut: 0 }); | |
const value = extension_settings.memory.source === summary_sources.main | |
? await summarizeChatMain(context, true, skipWIAN) | |
: await summarizeChatWebLLM(context, true); | |
toastr.clear(toast); | |
if (!value) { | |
toastr.warning('Failed to summarize chat'); | |
return ''; | |
} | |
return value; | |
} | |
/** | |
* Callback for the summarize command. | |
* @param {object} args Command arguments | |
* @param {string} text Text to summarize | |
*/ | |
async function summarizeCallback(args, text) { | |
text = text.trim(); | |
// Summarize the current chat if no text provided | |
if (!text) { | |
const quiet = isTrueBoolean(args.quiet); | |
return await forceSummarizeChat(quiet); | |
} | |
const source = args.source || extension_settings.memory.source; | |
const prompt = substituteParamsExtended((args.prompt || extension_settings.memory.prompt), { words: extension_settings.memory.promptWords }); | |
try { | |
switch (source) { | |
case summary_sources.extras: | |
return await callExtrasSummarizeAPI(text); | |
case summary_sources.main: | |
return await generateRaw(text, '', false, false, prompt, extension_settings.memory.overrideResponseLength); | |
case summary_sources.webllm: { | |
const messages = [{ role: 'system', content: prompt }, { role: 'user', content: text }].filter(m => m.content); | |
const params = extension_settings.memory.overrideResponseLength > 0 ? { max_tokens: extension_settings.memory.overrideResponseLength } : {}; | |
return await generateWebLlmChatPrompt(messages, params); | |
} | |
default: | |
toastr.warning('Invalid summarization source specified'); | |
return ''; | |
} | |
} catch (error) { | |
toastr.error(String(error), 'Failed to summarize text'); | |
console.log(error); | |
return ''; | |
} | |
} | |
async function summarizeChat(context) { | |
const skipWIAN = extension_settings.memory.SkipWIAN; | |
switch (extension_settings.memory.source) { | |
case summary_sources.extras: | |
await summarizeChatExtras(context); | |
break; | |
case summary_sources.main: | |
await summarizeChatMain(context, false, skipWIAN); | |
break; | |
case summary_sources.webllm: | |
await summarizeChatWebLLM(context, false); | |
break; | |
default: | |
break; | |
} | |
} | |
/** | |
* Check if the chat should be summarized based on the current conditions. | |
* Return summary prompt if it should be summarized. | |
* @param {any} context ST context | |
* @param {boolean} force Summarize the chat regardless of the conditions | |
* @returns {Promise<string>} Summary prompt or empty string | |
*/ | |
async function getSummaryPromptForNow(context, force) { | |
if (extension_settings.memory.promptInterval === 0 && !force) { | |
console.debug('Prompt interval is set to 0, skipping summarization'); | |
return ''; | |
} | |
try { | |
// Wait for group to finish generating | |
if (selected_group) { | |
await waitUntilCondition(() => is_group_generating === false, 1000, 10); | |
} | |
// Wait for the send button to be released | |
waitUntilCondition(() => is_send_press === false, 30000, 100); | |
} catch { | |
console.debug('Timeout waiting for is_send_press'); | |
return ''; | |
} | |
if (!context.chat.length) { | |
console.debug('No messages in chat to summarize'); | |
return ''; | |
} | |
if (context.chat.length < extension_settings.memory.promptInterval && !force) { | |
console.debug(`Not enough messages in chat to summarize (chat: ${context.chat.length}, interval: ${extension_settings.memory.promptInterval})`); | |
return ''; | |
} | |
let messagesSinceLastSummary = 0; | |
let wordsSinceLastSummary = 0; | |
let conditionSatisfied = false; | |
for (let i = context.chat.length - 1; i >= 0; i--) { | |
if (context.chat[i].extra && context.chat[i].extra.memory) { | |
break; | |
} | |
messagesSinceLastSummary++; | |
wordsSinceLastSummary += extractAllWords(context.chat[i].mes).length; | |
} | |
if (messagesSinceLastSummary >= extension_settings.memory.promptInterval) { | |
conditionSatisfied = true; | |
} | |
if (extension_settings.memory.promptForceWords && wordsSinceLastSummary >= extension_settings.memory.promptForceWords) { | |
conditionSatisfied = true; | |
} | |
if (!conditionSatisfied && !force) { | |
console.debug(`Summary conditions not satisfied (messages: ${messagesSinceLastSummary}, interval: ${extension_settings.memory.promptInterval}, words: ${wordsSinceLastSummary}, force words: ${extension_settings.memory.promptForceWords})`); | |
return ''; | |
} | |
console.log('Summarizing chat, messages since last summary: ' + messagesSinceLastSummary, 'words since last summary: ' + wordsSinceLastSummary); | |
const prompt = substituteParamsExtended(extension_settings.memory.prompt, { words: extension_settings.memory.promptWords }); | |
if (!prompt) { | |
console.debug('Summarization prompt is empty. Skipping summarization.'); | |
return ''; | |
} | |
return prompt; | |
} | |
async function summarizeChatWebLLM(context, force) { | |
if (!isWebLlmSupported()) { | |
return; | |
} | |
const prompt = await getSummaryPromptForNow(context, force); | |
if (!prompt) { | |
return; | |
} | |
const { rawPrompt, lastUsedIndex } = await getRawSummaryPrompt(context, prompt); | |
if (lastUsedIndex === null || lastUsedIndex === -1) { | |
if (force) { | |
toastr.info('To try again, remove the latest summary.', 'No messages found to summarize'); | |
} | |
return null; | |
} | |
const messages = [ | |
{ role: 'system', content: prompt }, | |
{ role: 'user', content: rawPrompt }, | |
]; | |
const params = {}; | |
if (extension_settings.memory.overrideResponseLength > 0) { | |
params.max_tokens = extension_settings.memory.overrideResponseLength; | |
} | |
const summary = await generateWebLlmChatPrompt(messages, params); | |
const newContext = getContext(); | |
// something changed during summarization request | |
if (newContext.groupId !== context.groupId || | |
newContext.chatId !== context.chatId || | |
(!newContext.groupId && (newContext.characterId !== context.characterId))) { | |
console.log('Context changed, summary discarded'); | |
return; | |
} | |
setMemoryContext(summary, true, lastUsedIndex); | |
return summary; | |
} | |
async function summarizeChatMain(context, force, skipWIAN) { | |
const prompt = await getSummaryPromptForNow(context, force); | |
if (!prompt) { | |
return; | |
} | |
console.log('sending summary prompt'); | |
let summary = ''; | |
let index = null; | |
if (prompt_builders.DEFAULT === extension_settings.memory.prompt_builder) { | |
summary = await generateQuietPrompt(prompt, false, skipWIAN, '', '', extension_settings.memory.overrideResponseLength); | |
} | |
if ([prompt_builders.RAW_BLOCKING, prompt_builders.RAW_NON_BLOCKING].includes(extension_settings.memory.prompt_builder)) { | |
const lock = extension_settings.memory.prompt_builder === prompt_builders.RAW_BLOCKING; | |
try { | |
if (lock) { | |
deactivateSendButtons(); | |
} | |
const { rawPrompt, lastUsedIndex } = await getRawSummaryPrompt(context, prompt); | |
if (lastUsedIndex === null || lastUsedIndex === -1) { | |
if (force) { | |
toastr.info('To try again, remove the latest summary.', 'No messages found to summarize'); | |
} | |
return null; | |
} | |
summary = await generateRaw(rawPrompt, '', false, false, prompt, extension_settings.memory.overrideResponseLength); | |
index = lastUsedIndex; | |
} finally { | |
if (lock) { | |
activateSendButtons(); | |
} | |
} | |
} | |
const newContext = getContext(); | |
// something changed during summarization request | |
if (newContext.groupId !== context.groupId | |
|| newContext.chatId !== context.chatId | |
|| (!newContext.groupId && (newContext.characterId !== context.characterId))) { | |
console.log('Context changed, summary discarded'); | |
return; | |
} | |
setMemoryContext(summary, true, index); | |
return summary; | |
} | |
/** | |
* Get the raw summarization prompt from the chat context. | |
* @param {object} context ST context | |
* @param {string} prompt Summarization system prompt | |
* @returns {Promise<{rawPrompt: string, lastUsedIndex: number}>} Raw summarization prompt | |
*/ | |
async function getRawSummaryPrompt(context, prompt) { | |
/** | |
* Get the memory string from the chat buffer. | |
* @param {boolean} includeSystem Include prompt into the memory string | |
* @returns {string} Memory string | |
*/ | |
function getMemoryString(includeSystem) { | |
const delimiter = '\n\n'; | |
const stringBuilder = []; | |
const bufferString = chatBuffer.slice().join(delimiter); | |
if (includeSystem) { | |
stringBuilder.push(prompt); | |
} | |
if (latestSummary) { | |
stringBuilder.push(latestSummary); | |
} | |
stringBuilder.push(bufferString); | |
return stringBuilder.join(delimiter).trim(); | |
} | |
const chat = context.chat.slice(); | |
const latestSummary = getLatestMemoryFromChat(chat); | |
const latestSummaryIndex = getIndexOfLatestChatSummary(chat); | |
chat.pop(); // We always exclude the last message from the buffer | |
const chatBuffer = []; | |
const PADDING = 64; | |
const PROMPT_SIZE = await getSourceContextSize(); | |
let latestUsedMessage = null; | |
for (let index = latestSummaryIndex + 1; index < chat.length; index++) { | |
const message = chat[index]; | |
if (!message) { | |
break; | |
} | |
if (message.is_system || !message.mes) { | |
continue; | |
} | |
const entry = `${message.name}:\n${message.mes}`; | |
chatBuffer.push(entry); | |
const tokens = await countSourceTokens(getMemoryString(true), PADDING); | |
if (tokens > PROMPT_SIZE) { | |
chatBuffer.pop(); | |
break; | |
} | |
latestUsedMessage = message; | |
if (extension_settings.memory.maxMessagesPerRequest > 0 && chatBuffer.length >= extension_settings.memory.maxMessagesPerRequest) { | |
break; | |
} | |
} | |
const lastUsedIndex = context.chat.indexOf(latestUsedMessage); | |
const rawPrompt = getMemoryString(false); | |
return { rawPrompt, lastUsedIndex }; | |
} | |
async function summarizeChatExtras(context) { | |
function getMemoryString() { | |
return (longMemory + '\n\n' + memoryBuffer.slice().reverse().join('\n\n')).trim(); | |
} | |
const chat = context.chat; | |
const longMemory = getLatestMemoryFromChat(chat); | |
const reversedChat = chat.slice().reverse(); | |
reversedChat.shift(); | |
const memoryBuffer = []; | |
const CONTEXT_SIZE = await getSourceContextSize(); | |
for (const message of reversedChat) { | |
// we reached the point of latest memory | |
if (longMemory && message.extra && message.extra.memory == longMemory) { | |
break; | |
} | |
// don't care about system | |
if (message.is_system) { | |
continue; | |
} | |
// determine the sender's name | |
const entry = `${message.name}:\n${message.mes}`; | |
memoryBuffer.push(entry); | |
// check if token limit was reached | |
const tokens = await countSourceTokens(getMemoryString()); | |
if (tokens >= CONTEXT_SIZE) { | |
break; | |
} | |
} | |
const resultingString = getMemoryString(); | |
const resultingTokens = await countSourceTokens(resultingString); | |
if (!resultingString || resultingTokens < CONTEXT_SIZE) { | |
console.debug('Not enough context to summarize'); | |
return; | |
} | |
// perform the summarization API call | |
try { | |
inApiCall = true; | |
const summary = await callExtrasSummarizeAPI(resultingString); | |
const newContext = getContext(); | |
// something changed during summarization request | |
if (newContext.groupId !== context.groupId | |
|| newContext.chatId !== context.chatId | |
|| (!newContext.groupId && (newContext.characterId !== context.characterId))) { | |
console.log('Context changed, summary discarded'); | |
return; | |
} | |
setMemoryContext(summary, true); | |
} | |
catch (error) { | |
console.log(error); | |
} | |
finally { | |
inApiCall = false; | |
} | |
} | |
/** | |
* Call the Extras API to summarize the provided text. | |
* @param {string} text Text to summarize | |
* @returns {Promise<string>} Summarized text | |
*/ | |
async function callExtrasSummarizeAPI(text) { | |
if (!modules.includes('summarize')) { | |
throw new Error('Summarize module is not enabled in Extras API'); | |
} | |
const url = new URL(getApiUrl()); | |
url.pathname = '/api/summarize'; | |
const apiResult = await doExtrasFetch(url, { | |
method: 'POST', | |
headers: { | |
'Content-Type': 'application/json', | |
'Bypass-Tunnel-Reminder': 'bypass', | |
}, | |
body: JSON.stringify({ | |
text: text, | |
params: {}, | |
}), | |
}); | |
if (apiResult.ok) { | |
const data = await apiResult.json(); | |
const summary = data.summary; | |
return summary; | |
} | |
throw new Error('Extras API call failed'); | |
} | |
function onMemoryRestoreClick() { | |
const context = getContext(); | |
const content = $('#memory_contents').val(); | |
const reversedChat = context.chat.slice().reverse(); | |
reversedChat.shift(); | |
for (let mes of reversedChat) { | |
if (mes.extra && mes.extra.memory == content) { | |
delete mes.extra.memory; | |
break; | |
} | |
} | |
const newContent = getLatestMemoryFromChat(context.chat); | |
setMemoryContext(newContent, false); | |
} | |
function onMemoryContentInput() { | |
const value = $(this).val(); | |
setMemoryContext(value, true); | |
} | |
function onMemoryPromptBuilderInput(e) { | |
const value = Number(e.target.value); | |
extension_settings.memory.prompt_builder = value; | |
saveSettingsDebounced(); | |
} | |
function reinsertMemory() { | |
const existingValue = String($('#memory_contents').val()); | |
setMemoryContext(existingValue, false); | |
} | |
/** | |
* Set the summary value to the context and save it to the chat message extra. | |
* @param {string} value Value of a summary | |
* @param {boolean} saveToMessage Should the summary be saved to the chat message extra | |
* @param {number|null} index Index of the chat message to save the summary to. If null, the pre-last message is used. | |
*/ | |
function setMemoryContext(value, saveToMessage, index = null) { | |
setExtensionPrompt(MODULE_NAME, formatMemoryValue(value), extension_settings.memory.position, extension_settings.memory.depth, extension_settings.memory.scan, extension_settings.memory.role); | |
$('#memory_contents').val(value); | |
const summaryLog = value | |
? `Summary set to: ${value}. Position: ${extension_settings.memory.position}. Depth: ${extension_settings.memory.depth}. Role: ${extension_settings.memory.role}` | |
: 'Summary has no content'; | |
console.debug(summaryLog); | |
const context = getContext(); | |
if (saveToMessage && context.chat.length) { | |
const idx = index ?? context.chat.length - 2; | |
const mes = context.chat[idx < 0 ? 0 : idx]; | |
if (!mes.extra) { | |
mes.extra = {}; | |
} | |
mes.extra.memory = value; | |
saveChatDebounced(); | |
} | |
} | |
function doPopout(e) { | |
const target = e.target; | |
//repurposes the zoomed avatar template to server as a floating div | |
if ($('#summaryExtensionPopout').length === 0) { | |
console.debug('did not see popout yet, creating'); | |
const originalHTMLClone = $(target).parent().parent().parent().find('.inline-drawer-content').html(); | |
const originalElement = $(target).parent().parent().parent().find('.inline-drawer-content'); | |
const template = $('#zoomed_avatar_template').html(); | |
const controlBarHtml = `<div class="panelControlBar flex-container"> | |
<div id="summaryExtensionPopoutheader" class="fa-solid fa-grip drag-grabber hoverglow"></div> | |
<div id="summaryExtensionPopoutClose" class="fa-solid fa-circle-xmark hoverglow dragClose"></div> | |
</div>`; | |
const newElement = $(template); | |
newElement.attr('id', 'summaryExtensionPopout') | |
.removeClass('zoomed_avatar') | |
.addClass('draggable') | |
.empty(); | |
const prevSummaryBoxContents = $('#memory_contents').val(); //copy summary box before emptying | |
originalElement.empty(); | |
originalElement.html('<div class="flex-container alignitemscenter justifyCenter wide100p"><small>Currently popped out</small></div>'); | |
newElement.append(controlBarHtml).append(originalHTMLClone); | |
$('body').append(newElement); | |
$('#summaryExtensionDrawerContents').addClass('scrollableInnerFull'); | |
setMemoryContext(prevSummaryBoxContents, false); //paste prev summary box contents into popout box | |
setupListeners(); | |
loadSettings(); | |
loadMovingUIState(); | |
$('#summaryExtensionPopout').fadeIn(animation_duration); | |
dragElement(newElement); | |
//setup listener for close button to restore extensions menu | |
$('#summaryExtensionPopoutClose').off('click').on('click', function () { | |
$('#summaryExtensionDrawerContents').removeClass('scrollableInnerFull'); | |
const summaryPopoutHTML = $('#summaryExtensionDrawerContents'); | |
$('#summaryExtensionPopout').fadeOut(animation_duration, () => { | |
originalElement.empty(); | |
originalElement.html(summaryPopoutHTML); | |
$('#summaryExtensionPopout').remove(); | |
}); | |
loadSettings(); | |
}); | |
} else { | |
console.debug('saw existing popout, removing'); | |
$('#summaryExtensionPopout').fadeOut(animation_duration, () => { $('#summaryExtensionPopoutClose').trigger('click'); }); | |
} | |
} | |
function setupListeners() { | |
//setup shared listeners for popout and regular ext menu | |
$('#memory_restore').off('click').on('click', onMemoryRestoreClick); | |
$('#memory_contents').off('click').on('input', onMemoryContentInput); | |
$('#memory_frozen').off('click').on('input', onMemoryFrozenInput); | |
$('#memory_skipWIAN').off('click').on('input', onMemorySkipWIANInput); | |
$('#summary_source').off('click').on('change', onSummarySourceChange); | |
$('#memory_prompt_words').off('click').on('input', onMemoryPromptWordsInput); | |
$('#memory_prompt_interval').off('click').on('input', onMemoryPromptIntervalInput); | |
$('#memory_prompt').off('click').on('input', onMemoryPromptInput); | |
$('#memory_force_summarize').off('click').on('click', () => forceSummarizeChat(false)); | |
$('#memory_template').off('click').on('input', onMemoryTemplateInput); | |
$('#memory_depth').off('click').on('input', onMemoryDepthInput); | |
$('#memory_role').off('click').on('input', onMemoryRoleInput); | |
$('input[name="memory_position"]').off('click').on('change', onMemoryPositionChange); | |
$('#memory_prompt_words_force').off('click').on('input', onMemoryPromptWordsForceInput); | |
$('#memory_prompt_builder_default').off('click').on('input', onMemoryPromptBuilderInput); | |
$('#memory_prompt_builder_raw_blocking').off('click').on('input', onMemoryPromptBuilderInput); | |
$('#memory_prompt_builder_raw_non_blocking').off('click').on('input', onMemoryPromptBuilderInput); | |
$('#memory_prompt_restore').off('click').on('click', onMemoryPromptRestoreClick); | |
$('#memory_prompt_interval_auto').off('click').on('click', onPromptIntervalAutoClick); | |
$('#memory_prompt_words_auto').off('click').on('click', onPromptForceWordsAutoClick); | |
$('#memory_override_response_length').off('click').on('input', onOverrideResponseLengthInput); | |
$('#memory_max_messages_per_request').off('click').on('input', onMaxMessagesPerRequestInput); | |
$('#memory_include_wi_scan').off('input').on('input', onMemoryIncludeWIScanInput); | |
$('#summarySettingsBlockToggle').off('click').on('click', function () { | |
console.log('saw settings button click'); | |
$('#summarySettingsBlock').slideToggle(200, 'swing'); //toggleClass("hidden"); | |
}); | |
} | |
jQuery(async function () { | |
async function addExtensionControls() { | |
const settingsHtml = await renderExtensionTemplateAsync('memory', 'settings', { defaultSettings }); | |
$('#summarize_container').append(settingsHtml); | |
setupListeners(); | |
$('#summaryExtensionPopoutButton').off('click').on('click', function (e) { | |
doPopout(e); | |
e.stopPropagation(); | |
}); | |
} | |
await addExtensionControls(); | |
loadSettings(); | |
eventSource.makeLast(event_types.CHARACTER_MESSAGE_RENDERED, onChatEvent); | |
eventSource.on(event_types.MESSAGE_DELETED, onChatEvent); | |
eventSource.on(event_types.MESSAGE_EDITED, onChatEvent); | |
eventSource.on(event_types.MESSAGE_SWIPED, onChatEvent); | |
eventSource.on(event_types.CHAT_CHANGED, onChatEvent); | |
SlashCommandParser.addCommandObject(SlashCommand.fromProps({ | |
name: 'summarize', | |
callback: summarizeCallback, | |
namedArgumentList: [ | |
new SlashCommandNamedArgument('source', 'API to use for summarization', [ARGUMENT_TYPE.STRING], false, false, '', Object.values(summary_sources)), | |
SlashCommandNamedArgument.fromProps({ | |
name: 'prompt', | |
description: 'prompt to use for summarization', | |
typeList: [ARGUMENT_TYPE.STRING], | |
defaultValue: '', | |
}), | |
SlashCommandNamedArgument.fromProps({ | |
name: 'quiet', | |
description: 'suppress the toast message when summarizing the chat', | |
typeList: [ARGUMENT_TYPE.BOOLEAN], | |
defaultValue: 'false', | |
enumList: commonEnumProviders.boolean('trueFalse')(), | |
}), | |
], | |
unnamedArgumentList: [ | |
new SlashCommandArgument('text to summarize', [ARGUMENT_TYPE.STRING], false, false, ''), | |
], | |
helpString: 'Summarizes the given text. If no text is provided, the current chat will be summarized. Can specify the source and the prompt to use.', | |
returns: ARGUMENT_TYPE.STRING, | |
})); | |
MacrosParser.registerMacro('summary', () => getLatestMemoryFromChat(getContext().chat)); | |
}); | |