eval-protocol · benjibc · Mar 7, 2026 · Mar 7, 2026 · chatgpt-codex-connector · Mar 7, 2026
diff --git a/vite-app/dist/assets/index-10cZ11iB.js b/vite-app/dist/assets/index-10cZ11iB.js
diff --git a/vite-app/dist/assets/index-10cZ11iB.js.map b/vite-app/dist/assets/index-10cZ11iB.js.map
diff --git a/vite-app/dist/assets/index-DFeF7AG_.js b/vite-app/dist/assets/index-DFeF7AG_.js
diff --git a/vite-app/dist/assets/index-DFeF7AG_.js.map b/vite-app/dist/assets/index-DFeF7AG_.js.map
diff --git a/vite-app/dist/assets/index-DOD73Wyg.css b/vite-app/dist/assets/index-DOD73Wyg.css
diff --git a/vite-app/dist/assets/index-DvKW7FQL.css b/vite-app/dist/assets/index-DvKW7FQL.css
diff --git a/vite-app/dist/index.html b/vite-app/dist/index.html
@@ -5,8 +5,8 @@
     <meta name="viewport" content="width=device-width, initial-scale=1.0" />
     <title>EP | Log Viewer</title>
     <link rel="icon" href="/assets/favicon-BkAAWQga.png" />
-    <script type="module" crossorigin src="/assets/index-10cZ11iB.js"></script>
-    <link rel="stylesheet" crossorigin href="/assets/index-DOD73Wyg.css">
+    <script type="module" crossorigin src="/assets/index-DFeF7AG_.js"></script>
+    <link rel="stylesheet" crossorigin href="/assets/index-DvKW7FQL.css">
   </head>
   <body>
     <div id="root"></div>

diff --git a/vite-app/src/components/EvaluationRow.tsx b/vite-app/src/components/EvaluationRow.tsx
@@ -337,9 +337,77 @@ const ToolsSection = observer(
   )
 );
 
+/**
+ * Renders the row's tool schemas as a "# Tools" declaration block.
+ *
+ * Each tool becomes a `type <name> = (_: {...}) => any;` entry inside
+ * `namespace functions`. Only the `action` parameter is declared; its enum (if
+ * any) is rendered as a union of string literals, otherwise as `string`.
+ *
+ * @param tools Tool definitions of the row; may be empty or missing.
+ * @returns The declaration text, or "" when there are no tools.
+ */
+function buildToolDeclareContent(tools: EvaluationRowType["tools"]): string {
+  if (!tools?.length) return "";
+
+  // Prefix every line so a multi-line description cannot spill out of its
+  // `//` comment and corrupt the declaration.
+  const toComment = (text: unknown, indent: string): string =>
+    String(text)
+      .split(/\r?\n/)
+      .map((line) => `${indent}// ${line}`)
+      .join("\n");
+
+  const blocks = tools
+    .map((tool) => {
+      const fn = (tool as any)?.function || {};
+      const action = fn.parameters?.properties?.action;
+      // JSON.stringify escapes quotes and backslashes inside enum values so
+      // each literal stays well-formed.
+      const actionEnum = Array.isArray(action?.enum)
+        ? action.enum
+            .map((value: unknown) => JSON.stringify(String(value)))
+            .join(" | ")
+        : "string";
+      return [
+        toComment(fn.description || "Tool declaration.", ""),
+        `type ${fn.name || "tool"} = (_: {`,
+        toComment(action?.description || "Tool argument.", "  "),
+        `  action: ${actionEnum},`,
+        "  [k: string]: never",
+        "}) => any;",
+      ].join("\n");
+    })
+    .join("\n");
+
+  return `# Tools\n\n## functions\nnamespace functions {\n${blocks}\n}`;
+}
+
+/**
+ * Returns the messages with the rendered tool declaration merged into the
+ * first system message, or prepended as a new system message when none exists.
+ * The input is returned as-is when there is no tool declaration to add.
+ */
+function buildPromptFaithfulMessages(
+  messages: EvaluationRowType["messages"],
+  tools: EvaluationRowType["tools"]
+): EvaluationRowType["messages"] {
+  const declaration = buildToolDeclareContent(tools);
+  if (!declaration) return messages;
+
+  // Work on a shallow copy so the caller's array is never mutated.
+  const copy = [...(messages || [])];
+  const systemIdx = copy.findIndex((entry) => entry?.role === "system");
+  if (systemIdx === -1) {
+    return [{ role: "system", content: declaration } as any, ...copy];
+  }
+
+  const systemMessage = copy[systemIdx] as any;
+  const rawContent = systemMessage?.content;
+
+  // Collapse whatever shape the existing content has into plain text.
+  let priorText = "";
+  if (typeof rawContent === "string") {
+    priorText = rawContent;
+  } else if (Array.isArray(rawContent)) {
+    priorText = rawContent
+      .map((part: any) => {
+        switch (part?.type) {
+          case "text":
+            return part.text || "";
+          case "image_url":
+            return "[Image]";
+          default:
+            return JSON.stringify(part);
+        }
+      })
+      .join("");
+  } else if (rawContent != null) {
+    priorText = JSON.stringify(rawContent);
+  }
+
+  // The declaration goes first, separated from any prior text by a blank line.
+  copy[systemIdx] = {
+    ...systemMessage,
+    content: priorText ? `${declaration}\n\n${priorText}` : declaration,
+  } as any;
+  return copy;
+}
+
 const ChatInterfaceSection = observer(
-  ({ messages }: { messages: EvaluationRowType["messages"] }) => (
-    <ChatInterface messages={messages} />
+  // The messages are run through buildPromptFaithfulMessages together with
+  // `tools` before being handed to ChatInterface.
+  ({
+    messages,
+    tools,
+  }: {
+    messages: EvaluationRowType["messages"];
+    tools: EvaluationRowType["tools"];
+  }) => (
+    <ChatInterface messages={buildPromptFaithfulMessages(messages, tools)} />
   )
 );
 
@@ -376,7 +444,7 @@ const ExpandedContent = observer(
       <div className="flex gap-3 w-fit">
         {/* Left Column - Chat Interface */}
         <div className="min-w-0">
-          <ChatInterfaceSection messages={messages} />
+          <ChatInterfaceSection messages={messages} tools={tools} />
         </div>
 
         {/* Token Debug Column */}

diff --git a/vite-app/src/components/MessageBubble.tsx b/vite-app/src/components/MessageBubble.tsx
@@ -14,9 +14,12 @@ export const MessageBubble = ({ message }: { message: Message }) => {
   const isTool = message.role === "tool";
   const hasToolCalls = message.tool_calls && message.tool_calls.length > 0;
   const hasFunctionCall = message.function_call;
+  const hideMessageContent = message.role === "assistant" && hasToolCalls;
 
   // Get the message content as a string
   const reasoning = (message as any).reasoning_content as string | undefined;
+  const titleLabel =
+    message.role === "system" && message.name ? message.name : message.role;
   const getMessageContent = () => {
     if (typeof message.content === "string") {
       return message.content;
@@ -33,11 +36,14 @@ export const MessageBubble = ({ message }: { message: Message }) => {
     }
   };
 
-  const messageContent = getMessageContent();
+  const messageContent = hideMessageContent ? "" : getMessageContent();
   const hasMessageContent = messageContent.trim().length > 0;
   const isLongMessage = messageContent.length > 200; // Threshold for considering a message "long"
 
   const renderContent = () => {
+    if (hideMessageContent) {
+      return null;
+    }
     if (typeof message.content === "string") {
       return isLongMessage && !isExpanded
         ? message.content.substring(0, 200) + "..."
@@ -161,7 +167,7 @@ export const MessageBubble = ({ message }: { message: Message }) => {
             hasMessageContent ? "pr-8" : ""
           }`}
         >
-          {message.role}
+          {titleLabel}
         </div>
         <div className="whitespace-pre-wrap break-words overflow-hidden text-xs">
           {renderContent()}