Skip to content

fix(trimmer): trim last message when allowPartial: true and strategy: first #8287

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Open
wants to merge 7 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
93 changes: 64 additions & 29 deletions langchain-core/src/messages/tests/message_utils.test.ts
Original file line number Diff line number Diff line change
@@ -1,16 +1,16 @@
import { it, describe, test, expect } from "@jest/globals";
import { describe, expect, it, test } from "@jest/globals";
import { v4 } from "uuid";
import {
filterMessages,
mergeMessageRuns,
trimMessages,
} from "../transformers.js";
import { AIMessage, AIMessageChunk } from "../ai.js";
import { BaseMessage, MessageContent } from "../base.js";
import { ChatMessage } from "../chat.js";
import { HumanMessage } from "../human.js";
import { SystemMessage } from "../system.js";
import { ToolMessage } from "../tool.js";
import { BaseMessage } from "../base.js";
import {
filterMessages,
mergeMessageRuns,
trimMessages,
} from "../transformers.js";
import {
getBufferString,
mapChatMessagesToStoredMessages,
Expand Down Expand Up @@ -141,7 +141,26 @@ describe("mergeMessageRuns", () => {
});

describe("trimMessages can trim", () => {
const messagesAndTokenCounterFactory = () => {
/**
 * Default token estimate for a single message's content.
 *
 * Every message is charged a fixed 3-token prefix and 3-token suffix.
 * String content costs 4 tokens; array content costs 4 tokens per element.
 * A plain-string message therefore totals 3 + 4 + 3 = 10 tokens.
 *
 * @param content - The message content (a string or an array of blocks).
 * @returns The estimated token count for that one message.
 */
const defaultCountTokensByMessageContent = (
  content: MessageContent
): number => {
  const tokensPerContentUnit = 4;
  // Prefix (3) and suffix (3) are charged once per message.
  const wrapperTokens = 3 + 3;

  // String content is a single unit; array content is one unit per element.
  let contentUnits = 1;
  if (Array.isArray(content)) {
    contentUnits = content.length;
  }

  return wrapperTokens + contentUnits * tokensPerContentUnit;
};

const messagesAndTokenCounterFactory = ({
countTokensByMessageContent = defaultCountTokensByMessageContent,
} = {}) => {
const messages = [
new SystemMessage(
"This is a 4 token text. The full message is 10 tokens."
Expand All @@ -168,27 +187,10 @@ describe("trimMessages can trim", () => {
];

// Token counter handed to trimMessages in these tests: returns a summed
// per-message token estimate for the given messages.
//
// NOTE(review): this span comes from a rendered diff and appears to contain
// BOTH the removed loop-based body and the added reduce-based body (`count`
// is declared twice below). Confirm which lines are live before editing.
const dummyTokenCounter = (messages: BaseMessage[]): number => {
// treat each message like it adds 3 default tokens at the beginning
// of the message and at the end of the message. 3 + 4 + 3 = 10 tokens
// per message.

const defaultContentLen = 4;
const defaultMsgPrefixLen = 3;
const defaultMsgSuffixLen = 3;

// Loop-based variant: string content is charged prefix + 4 + suffix;
// array content is charged prefix + 4 per element + suffix.
let count = 0;
for (const msg of messages) {
if (typeof msg.content === "string") {
count +=
defaultMsgPrefixLen + defaultContentLen + defaultMsgSuffixLen;
}
if (Array.isArray(msg.content)) {
count +=
defaultMsgPrefixLen +
msg.content.length * defaultContentLen +
defaultMsgSuffixLen;
}
}
// Reduce-based variant: delegates the per-message cost to
// countTokensByMessageContent, which comes from the enclosing scope.
const count = messages.reduce(
(count, msg) => count + countTokensByMessageContent(msg.content),
0
);
// NOTE(review): looks like leftover debug output that prints on every
// token count — confirm whether it should be removed.
console.log(count);
return count;
};
Expand Down Expand Up @@ -376,6 +378,39 @@ describe("trimMessages can trim", () => {
]);
});

it("First tokens, allowing partial messages, have to trim the last 10 characters of the last message", async () => {
  // Replace the default per-message estimate with `content.length`:
  // characters for string content, number of blocks for array content.
  const countByLength = (content: MessageContent): number => content.length;
  const { messages, dummyTokenCounter } = messagesAndTokenCounterFactory({
    countTokensByMessageContent: countByLength,
  });

  // Measure the whole conversation with the same metric the counter uses.
  let fullLength = 0;
  for (const msg of messages) {
    fullLength += msg.content.length;
  }

  // A budget 10 units short of the full conversation means every message
  // but the last fits whole, so the last one has to be partially trimmed.
  const result = await trimMessages(messages, {
    strategy: "first",
    allowPartial: true,
    maxTokens: fullLength - 10,
    tokenCounter: dummyTokenCounter,
    // Split into single characters so trimming happens per character.
    textSplitter: (text: string) => text.split(""),
  });

  const expectedContents = [
    "This is a 4 token text. The full message is 10 tokens.",
    "This is a 4 token text. The full message is 10 tokens.",
    [
      { type: "text", text: "This is the FIRST 4 token block." },
      { type: "text", text: "This is the SECOND 4 token block." },
    ],
    "This is a 4 token text. The full message is 10 tokens.",
    // The last message loses its final 10 characters ("10 tokens.").
    "This is a 4 token text. The full message is ",
  ];

  const contents = result.map((msg) => msg.content);
  expect(contents).toEqual(expectedContents);
});

it("Last 30 tokens, including system message, not allowing partial messages", async () => {
const { messages, dummyTokenCounter } = messagesAndTokenCounterFactory();
const trimmedMessages = await trimMessages(messages, {
Expand Down
2 changes: 1 addition & 1 deletion langchain-core/src/messages/transformers.ts
Original file line number Diff line number Diff line change
Expand Up @@ -745,7 +745,7 @@ async function _firstMaxTokens(
break;
}
}
if (idx < messagesCopy.length - 1 && partialStrategy) {
if (idx < messagesCopy.length && partialStrategy) {
let includedPartial = false;
if (Array.isArray(messagesCopy[idx].content)) {
const excluded = messagesCopy[idx];
Expand Down