New unslop logic
This commit is contained in:
parent
98302de620
commit
f228f78915
|
|
@ -161,6 +161,12 @@ export namespace Connection {
|
||||||
if (extraSettings.max_length && extraSettings.max_length < maxLength) {
|
if (extraSettings.max_length && extraSettings.max_length < maxLength) {
|
||||||
maxLength = extraSettings.max_length;
|
maxLength = extraSettings.max_length;
|
||||||
}
|
}
|
||||||
|
const baseTemperature = extraSettings.temperature ?? DEFAULT_GENERATION_SETTINGS.temperature;
|
||||||
|
let currentTemperature = baseTemperature;
|
||||||
|
const MAX_TEMPERATURE = 2.0;
|
||||||
|
const TEMP_INCREMENT = 0.15;
|
||||||
|
const RECOVERY_LENGTH = 16;
|
||||||
|
|
||||||
const requestData = {
|
const requestData = {
|
||||||
prompt,
|
prompt,
|
||||||
params: {
|
params: {
|
||||||
|
|
@ -170,11 +176,13 @@ export namespace Connection {
|
||||||
max_context_length: model.maxContext,
|
max_context_length: model.maxContext,
|
||||||
max_length: maxLength,
|
max_length: maxLength,
|
||||||
rep_pen_range: Math.min(model.maxContext, 4096),
|
rep_pen_range: Math.min(model.maxContext, 4096),
|
||||||
|
temperature: currentTemperature,
|
||||||
},
|
},
|
||||||
models: model.hordeNames,
|
models: model.hordeNames,
|
||||||
workers: model.workers,
|
workers: model.workers,
|
||||||
};
|
};
|
||||||
const bannedTokens = requestData.params.banned_tokens ?? [];
|
const bannedTokens = requestData.params.banned_tokens ?? [];
|
||||||
|
let recoveryMode = false;
|
||||||
|
|
||||||
const { signal } = abortController;
|
const { signal } = abortController;
|
||||||
|
|
||||||
|
|
@ -221,34 +229,54 @@ export namespace Connection {
|
||||||
|
|
||||||
if (response?.text) {
|
if (response?.text) {
|
||||||
text = response.text;
|
text = response.text;
|
||||||
|
let minStopIdx = text.length;
|
||||||
for (const sequence of requestData.params.stop_sequence) {
|
for (const sequence of requestData.params.stop_sequence) {
|
||||||
const stopIdx = text.indexOf(sequence);
|
const stopIdx = text.indexOf(sequence);
|
||||||
if (stopIdx >= 0) {
|
if (stopIdx >= 0 && stopIdx < minStopIdx) {
|
||||||
text = text.slice(0, stopIdx);
|
minStopIdx = stopIdx;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
if (minStopIdx < text.length) {
|
||||||
|
text = text.slice(0, minStopIdx);
|
||||||
|
}
|
||||||
|
|
||||||
const locaseText = text.toLowerCase();
|
const locaseText = text.toLowerCase();
|
||||||
let unsloppedText = text;
|
let unsloppedText = text;
|
||||||
|
let slopDetected = false;
|
||||||
|
let minSlopIdx = text.length;
|
||||||
|
let detectedBan = '';
|
||||||
for (const ban of bannedTokens) {
|
for (const ban of bannedTokens) {
|
||||||
const slopIdx = locaseText.indexOf(ban.toLowerCase());
|
const slopIdx = locaseText.indexOf(ban.toLowerCase());
|
||||||
if (slopIdx >= 0) {
|
if (slopIdx >= 0 && slopIdx < minSlopIdx) {
|
||||||
console.log(`[horde] slop '${ban}' detected at ${slopIdx}`);
|
minSlopIdx = slopIdx;
|
||||||
unsloppedText = unsloppedText.slice(0, slopIdx).trimEnd();
|
detectedBan = ban;
|
||||||
|
slopDetected = true;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
if (slopDetected) {
|
||||||
|
console.log(`[horde] slop '${detectedBan}' detected at ${minSlopIdx}`);
|
||||||
|
unsloppedText = unsloppedText.slice(0, minSlopIdx).trimEnd();
|
||||||
|
}
|
||||||
|
|
||||||
yield { text: unsloppedText, cost: response.cost };
|
yield { text: unsloppedText, cost: response.cost };
|
||||||
|
|
||||||
requestData.prompt += unsloppedText;
|
requestData.prompt += unsloppedText;
|
||||||
|
|
||||||
if (unsloppedText === text) {
|
if (slopDetected) {
|
||||||
|
recoveryMode = true;
|
||||||
|
requestData.params.max_length = RECOVERY_LENGTH;
|
||||||
|
currentTemperature = Math.min(MAX_TEMPERATURE, currentTemperature + TEMP_INCREMENT);
|
||||||
|
requestData.params.temperature = currentTemperature;
|
||||||
|
requestData.params.top_p = Math.min(0.98, 0.92 + (currentTemperature - baseTemperature) * 0.02);
|
||||||
|
} else if (recoveryMode) {
|
||||||
|
recoveryMode = false;
|
||||||
|
requestData.params.max_length = maxLength;
|
||||||
|
requestData.params.temperature = baseTemperature;
|
||||||
|
requestData.params.top_p = 0.92;
|
||||||
|
currentTemperature = baseTemperature;
|
||||||
|
} else {
|
||||||
return; // we are finished
|
return; // we are finished
|
||||||
}
|
}
|
||||||
|
|
||||||
if (unsloppedText.length === 0) {
|
|
||||||
requestData.params.temperature += 0.05;
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
} catch (e) {
|
} catch (e) {
|
||||||
if (!signal.aborted) {
|
if (!signal.aborted) {
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue