nsarrazin committed on
Commit
6cd421f
·
unverified ·
1 Parent(s): 7e91987

feat(reasoning): support end token search across multiple chunks (#1838)

Browse files

* feat(huggingchat): model update 27-05-25

* feat: update prompt examples in config

* feat: revert model config changes

src/lib/server/textGeneration/generate.ts CHANGED
@@ -154,6 +154,40 @@ Do not use prefixes such as Response: or Answer: when answering to the user.`,
154
  if (reasoning) {
155
  reasoningBuffer += output.token.text;
156
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
157
  // yield status update if it has changed
158
  if (status !== "") {
159
  yield {
 
154
  if (reasoning) {
155
  reasoningBuffer += output.token.text;
156
 
157
+ if (model.reasoning && model.reasoning.type === "tokens") {
158
+ // split reasoning buffer so that anything that comes after the end token is separated
159
+ // add it to the normal buffer, and yield two updates, one for the reasoning and one for the normal content
160
+ // also set reasoning to false
161
+
162
+ if (reasoningBuffer.lastIndexOf(model.reasoning.endToken) !== -1) {
163
+ const endTokenIndex = reasoningBuffer.lastIndexOf(model.reasoning.endToken);
164
+ const textBuffer = reasoningBuffer.slice(endTokenIndex + model.reasoning.endToken.length);
165
+ reasoningBuffer = reasoningBuffer.slice(
166
+ 0,
167
+ endTokenIndex + model.reasoning.endToken.length + 1
168
+ );
169
+
170
+ yield {
171
+ type: MessageUpdateType.Reasoning,
172
+ subtype: MessageReasoningUpdateType.Stream,
173
+ token: output.token.text,
174
+ };
175
+
176
+ yield {
177
+ type: MessageUpdateType.Stream,
178
+ token: textBuffer,
179
+ };
180
+
181
+ yield {
182
+ type: MessageUpdateType.Reasoning,
183
+ subtype: MessageReasoningUpdateType.Status,
184
+ status: `Done in ${Math.round((new Date().getTime() - startTime.getTime()) / 1000)}s.`,
185
+ };
186
+
187
+ reasoning = false;
188
+ continue;
189
+ }
190
+ }
191
  // yield status update if it has changed
192
  if (status !== "") {
193
  yield {