1
0
Fork 0

Compare commits

..

3 Commits

Author SHA1 Message Date
Pabloader f228f78915 New unslop logic 2026-03-11 15:11:44 +00:00
Pabloader 98302de620 Disable thinking in the chat template. 2026-03-11 15:11:22 +00:00
Pabloader b4db7fd2a7 Nested message formatting 2026-03-11 15:11:07 +00:00
3 changed files with 62 additions and 35 deletions

View File

@ -161,6 +161,12 @@ export namespace Connection {
if (extraSettings.max_length && extraSettings.max_length < maxLength) {
maxLength = extraSettings.max_length;
}
const baseTemperature = extraSettings.temperature ?? DEFAULT_GENERATION_SETTINGS.temperature;
let currentTemperature = baseTemperature;
const MAX_TEMPERATURE = 2.0;
const TEMP_INCREMENT = 0.15;
const RECOVERY_LENGTH = 16;
const requestData = {
prompt,
params: {
@ -170,11 +176,13 @@ export namespace Connection {
max_context_length: model.maxContext,
max_length: maxLength,
rep_pen_range: Math.min(model.maxContext, 4096),
temperature: currentTemperature,
},
models: model.hordeNames,
workers: model.workers,
};
const bannedTokens = requestData.params.banned_tokens ?? [];
let recoveryMode = false;
const { signal } = abortController;
@ -221,34 +229,54 @@ export namespace Connection {
if (response?.text) {
text = response.text;
let minStopIdx = text.length;
for (const sequence of requestData.params.stop_sequence) {
const stopIdx = text.indexOf(sequence);
if (stopIdx >= 0) {
text = text.slice(0, stopIdx);
if (stopIdx >= 0 && stopIdx < minStopIdx) {
minStopIdx = stopIdx;
}
}
if (minStopIdx < text.length) {
text = text.slice(0, minStopIdx);
}
const locaseText = text.toLowerCase();
let unsloppedText = text;
let slopDetected = false;
let minSlopIdx = text.length;
let detectedBan = '';
for (const ban of bannedTokens) {
const slopIdx = locaseText.indexOf(ban.toLowerCase());
if (slopIdx >= 0) {
console.log(`[horde] slop '${ban}' detected at ${slopIdx}`);
unsloppedText = unsloppedText.slice(0, slopIdx).trimEnd();
if (slopIdx >= 0 && slopIdx < minSlopIdx) {
minSlopIdx = slopIdx;
detectedBan = ban;
slopDetected = true;
}
}
if (slopDetected) {
console.log(`[horde] slop '${detectedBan}' detected at ${minSlopIdx}`);
unsloppedText = unsloppedText.slice(0, minSlopIdx).trimEnd();
}
yield { text: unsloppedText, cost: response.cost };
requestData.prompt += unsloppedText;
if (unsloppedText === text) {
if (slopDetected) {
recoveryMode = true;
requestData.params.max_length = RECOVERY_LENGTH;
currentTemperature = Math.min(MAX_TEMPERATURE, currentTemperature + TEMP_INCREMENT);
requestData.params.temperature = currentTemperature;
requestData.params.top_p = Math.min(0.98, 0.92 + (currentTemperature - baseTemperature) * 0.02);
} else if (recoveryMode) {
recoveryMode = false;
requestData.params.max_length = maxLength;
requestData.params.temperature = baseTemperature;
requestData.params.top_p = 0.92;
currentTemperature = baseTemperature;
} else {
return; // we are finished
}
if (unsloppedText.length === 0) {
requestData.params.temperature += 0.05;
}
}
} catch (e) {
if (!signal.aborted) {

View File

@ -423,6 +423,7 @@ export namespace Huggingface {
applyTemplate(templateString, {
messages,
add_generation_prompt: true,
enable_thinking: false,
tools: functions?.map(convertFunctionToTool),
})
);

View File

@ -25,50 +25,48 @@ export namespace MessageTools {
}
export const format = (message: string): string => {
const replaceRegex = /([*"]\*?)/ig;
const replaceRegex = /(\*\*?|")/ig;
const splitToken = '___SPLIT_AWOORWA___';
const preparedMessage = message.replace(replaceRegex, `${splitToken}$1${splitToken}`);
const parts = preparedMessage.split(splitToken);
let isText = true;
let keepPart = true;
const stack: string[] = [];
let resultHTML = '';
for (const part of parts) {
if (isText) {
const isClose = stack.at(-1) === part;
if (isClose) {
stack.pop();
if (part === '*' || part === '**') {
resultHTML += `</span>`;
} else if (part === '"') {
resultHTML += `"</span>`;
}
} else {
if (part === '*') {
isText = false;
keepPart = false;
stack.push(part);
resultHTML += `<span class="italic">`;
} else if (part === '**') {
isText = false;
keepPart = false;
stack.push(part);
resultHTML += `<span class="bold">`;
} else if (part === '"') {
isText = false;
keepPart = true;
stack.push(part);
resultHTML += `<span class="quote">"`;
} else {
resultHTML += part;
}
} else {
if (part === '*' || part === '**') {
resultHTML += `</span>`;
isText = true;
} else if (part === '"') {
resultHTML += `"</span>`;
isText = true;
} else {
resultHTML += part;
}
}
}
if (!isText) {
while (stack.length) {
const part = stack.pop();
if (part === '*' || part === '**') {
resultHTML += `</span>`;
} else if (part === '"') {
resultHTML += `"</span>`;
}
}
return resultHTML;