campfirein · cuongdo-byterover · May 27, 2026 · May 27, 2026 · May 27, 2026 · May 27, 2026
@@ -1,23 +1,54 @@
 /* eslint-disable camelcase */
 import {readFile as readFileAsync} from 'node:fs/promises'
+import {relative as relativePath} from 'node:path'
 
 import type {AnalyticsEventName} from '../../../shared/analytics/event-names.js'
 import type {CurateRunCompletedProps} from '../../../shared/analytics/events/curate-run-completed.js'
 import type {PropsArg} from '../../../shared/analytics/events/index.js'
 import type {QueryCompletedProps} from '../../../shared/analytics/events/query-completed.js'
+import type {TaskType} from '../../../shared/analytics/task-types.js'
 import type {LlmToolResultEvent} from '../../core/domain/transport/schemas.js'
 import type {TaskInfo} from '../../core/domain/transport/task-info.js'
 import type {IAnalyticsClient} from '../../core/interfaces/analytics/i-analytics-client.js'
 import type {ITaskLifecycleHook} from '../../core/interfaces/process/i-task-lifecycle-hook.js'
 import type {QueryResultMetadata} from './query-log-handler.js'
 
 import {AnalyticsEventNames} from '../../../shared/analytics/event-names.js'
+import {TaskTypes} from '../../../shared/analytics/task-types.js'
 import {parseFrontmatter} from '../../core/domain/knowledge/markdown-writer.js'
 import {extractCurateOperations} from '../../utils/curate-result-parser.js'
 import {processLog} from '../../utils/process-logger.js'
 import {CURATE_TASK_TYPES} from './curate-log-handler.js'
 import {QUERY_TASK_TYPES} from './query-log-handler.js'
 
+/**
+ * Translate the daemon's runtime task type string to the canonical
+ * analytics wire value. The daemon still dispatches the pre-ENG-2925
+ * name `'curate-html-direct'`; analytics emits the post-rename
+ * `'curate-tool-mode'`. Once the rename PR lands, this becomes a
+ * no-op identity and can be inlined.
+ *
+ * @param daemonType - Task type string as dispatched by the daemon
+ *   (callers in this file pass `task.type` or the stored `state.taskType`).
+ * @returns `TaskTypes.CURATE_TOOL_MODE` when the input is exactly
+ *   `'curate-html-direct'`; any other input is returned unchanged through
+ *   an unchecked `as TaskType` cast, so no runtime validation happens here.
+ */
+function toAnalyticsTaskType(daemonType: string): TaskType {
+  if (daemonType === 'curate-html-direct') return TaskTypes.CURATE_TOOL_MODE
+  return daemonType as TaskType
+}
+
+/**
+ * Convert an absolute filesystem path to a project-relative path for the
+ * analytics wire. Falls back to the input unchanged when projectPath is
+ * unset (e.g., search tasks scoped to the daemon root). Keeps emits free
+ * of `/Users/{name}` PII while still letting PMs reason about which file
+ * inside a project an operation touched.
+ *
+ * @param filePath - Path to convert.
+ * @param projectPath - Project root to relativize against. Any falsy value
+ *   (undefined or empty string) triggers the unchanged-input fallback.
+ * @returns `filePath` as given when `projectPath` is falsy, `'.'` when
+ *   `path.relative` yields an empty string, otherwise the `path.relative`
+ *   result.
+ *
+ * NOTE(review): the fallback branch returns `filePath` untouched, so an
+ * absolute input is emitted as-is there. A `filePath` outside `projectPath`
+ * presumably yields a `..`-prefixed result — confirm both cases still meet
+ * the PII goal above.
+ */
+function toRelativePath(filePath: string, projectPath?: string): string {
+  if (!projectPath) return filePath
+  const rel = relativePath(projectPath, filePath)
+  // `path.relative` returns '' when paths are identical — defensively
+  // surface a leaf token rather than emit a zero-length wire string that
+  // would fail `z.string().min(1)`.
+  return rel === '' ? '.' : rel
+}
+
 // `CURATE_TASK_TYPES` is exported as a readonly tuple; wrap in a Set<string>
 // for cast-free `.has()` lookups against TaskInfo.type (string).
 const CURATE_TASK_TYPE_SET: ReadonlySet<string> = new Set(CURATE_TASK_TYPES)
@@ -67,6 +98,8 @@ type CurateCounters = {
 type CurateTaskAnalyticsState = {
   counters: CurateCounters
   flavor: 'curate'
+  /** Captured at onTaskCreate so onToolResult emits can relativize op.filePath. */
+  projectPath?: string
   taskType: CurateTaskTypeLiteral
 }
 
@@ -142,36 +175,57 @@ export class AnalyticsHook implements ITaskLifecycleHook {
 
   async onTaskCancelled(taskId: string, task: TaskInfo): Promise<void> {
     await this.dispatchTerminal(taskId, task, 'cancelled')
+    this.emitTaskFailed(taskId, task) // cancellation is reported as TASK_FAILED, sent after the awaited terminal dispatch
   }
 
   async onTaskCompleted(taskId: string, _result: string, task: TaskInfo): Promise<void> {
     const state = this.tasks.get(taskId)
-    if (!state) return
+    if (state) {
+      // Drain any in-flight per-op processing so CURATE_OPERATION_APPLIED emits
+      // land BEFORE the run-completion emit on the wire. The chain never
+      // rejects (see `onToolResult`), so this await is safe.
+      await this.pendingByTask.get(taskId)
+
+      if (state.flavor === 'curate') {
+        const outcome = state.counters.failed > 0 ? 'partial' : 'completed'
+        this.emit(
+          AnalyticsEventNames.CURATE_RUN_COMPLETED,
+          this.buildCurateRunPayload({outcome, state, task, taskId}),
+        )
+      } else {
+        this.emit(
+          AnalyticsEventNames.QUERY_COMPLETED,
+          await this.buildQueryCompletedPayload({outcome: 'completed', state, task, taskId}),
+        )
+      }
+    }
 
-    // Drain any in-flight per-op processing so CURATE_OPERATION_APPLIED emits
-    // land BEFORE the run-completion emit on the wire. The chain never
-    // rejects (see `onToolResult`), so this await is safe.
-    await this.pendingByTask.get(taskId)
 
-    if (state.flavor === 'curate') {
-      const outcome = state.counters.failed > 0 ? 'partial' : 'completed'
-      this.emit(
-        AnalyticsEventNames.CURATE_RUN_COMPLETED,
-        this.buildCurateRunPayload({outcome, state, task, taskId}),
-      )
-    } else {
-      this.emit(
-        AnalyticsEventNames.QUERY_COMPLETED,
-        await this.buildQueryCompletedPayload({outcome: 'completed', state, task, taskId}),
-      )
-    }
+    // M14.3 generic funnel emit. Fires for EVERY task type AFTER any
+    // per-flavor M12 emit (terminal-event-last convention).
+    this.emit(AnalyticsEventNames.TASK_COMPLETED, {
+      duration_ms: this.durationMs(task),
+      task_id: taskId,
+      task_type: toAnalyticsTaskType(task.type),
+    })
   }
 
   async onTaskCreate(task: TaskInfo): Promise<void> {
+    // M14.3 generic funnel-entry emit. Fires for EVERY task type BEFORE
+    // the M12 per-flavor state init so the entry event lands even if
+    // state setup throws downstream.
+    this.emit(AnalyticsEventNames.TASK_CREATED, {
+      has_files: (task.files?.length ?? 0) > 0,
+      has_folder: typeof task.folderPath === 'string' && task.folderPath.length > 0,
+      task_id: task.taskId,
+      task_type: toAnalyticsTaskType(task.type),
+    })
+
     if (isCurateLiteral(task.type)) {
       this.tasks.set(task.taskId, {
         counters: {added: 0, deleted: 0, failed: 0, merged: 0, pendingReview: 0, updated: 0},
         flavor: 'curate',
+        projectPath: task.projectPath,
         taskType: task.type,
       })
       return
@@ -184,6 +238,7 @@ export class AnalyticsHook implements ITaskLifecycleHook {
 
   async onTaskError(taskId: string, _errorMessage: string, task: TaskInfo): Promise<void> {
     await this.dispatchTerminal(taskId, task, 'error')
+    this.emitTaskFailed(taskId, task) // generic TASK_FAILED emit, sent after the awaited terminal dispatch
   }
 
   async onToolResult(taskId: string, payload: LlmToolResultEvent): Promise<void> {
@@ -246,7 +301,7 @@ export class AnalyticsHook implements ITaskLifecycleHook {
       outcome,
       pending_review_count: state.counters.pendingReview,
       task_id: taskId,
-      task_type: state.taskType,
+      task_type: toAnalyticsTaskType(state.taskType),
     }
   }
 
@@ -303,17 +358,24 @@ export class AnalyticsHook implements ITaskLifecycleHook {
 
     // M12.3: harvest per-path frontmatter on the same async read path used
     // for curate emits. Entries whose file is unreadable / has no frontmatter
-    // carry `absolute_path` alone (the three array fields stay absent).
-    // `Promise.all` preserves input-array order in the result regardless of
-    // which read settles first.
+    // carry empty keywords / tags / related_paths arrays — the wire shape
+    // is uniform regardless of read success. `Promise.all` preserves
+    // input-array order in the result regardless of which read settles first.
     const readPathsWithMetadata = await Promise.all(
       cappedPaths.map(async (p) => {
         const fm = await this.readFrontmatterFields(p)
         return {
-          absolute_path: p,
-          ...(fm.keywords ? {keywords: fm.keywords} : {}),
-          ...(fm.related ? {related: fm.related} : {}),
-          ...(fm.tags ? {tags: fm.tags} : {}),
+          keywords: fm.keywords ?? [],
+          // M14 review tightening: each related entry is structured so a
+          // later FU can populate the linked file's own keywords/tags
+          // without changing the wire shape.
+          related_paths: (fm.related ?? []).map((r) => ({
+            keywords: [],
+            relative_path: r,
+            tags: [],
+          })),
+          relative_path: toRelativePath(p, task.projectPath),
+          tags: fm.tags ?? [],
         }
       }),
     )
@@ -331,7 +393,7 @@ export class AnalyticsHook implements ITaskLifecycleHook {
       read_tool_call_count: readToolCallCount,
       search_call_count: searchCallCount,
       task_id: taskId,
-      task_type: 'query',
+      task_type: toAnalyticsTaskType(task.type),
       ...(tier === undefined ? {} : {tier}),
     }
   }
@@ -371,6 +433,20 @@ export class AnalyticsHook implements ITaskLifecycleHook {
     }
   }
 
+  /**
+   * M14.3 generic terminal-failure emit. Fired by both onTaskError and
+   * onTaskCancelled AFTER dispatchTerminal so M12 per-flavor failure
+   * emits land first on the wire. Cancellation maps to task_failed
+   * (not a distinct event) per the schema's docblock.
+   *
+   * @param taskId - Emitted verbatim as `task_id`.
+   * @param task - Supplies `task.type`, which is canonicalized through
+   *   `toAnalyticsTaskType` for `task_type`, and is the input to
+   *   `this.durationMs` for `duration_ms`.
+   */
+  private emitTaskFailed(taskId: string, task: TaskInfo): void {
+    this.emit(AnalyticsEventNames.TASK_FAILED, {
+      duration_ms: this.durationMs(task),
+      task_id: taskId,
+      task_type: toAnalyticsTaskType(task.type),
+    })
+  }
+
   private async processToolResult(taskId: string, payload: LlmToolResultEvent): Promise<void> {
     const state = this.tasks.get(taskId)
     if (!state || state.flavor !== 'curate') return
@@ -423,20 +499,21 @@ export class AnalyticsHook implements ITaskLifecycleHook {
 
       // M12.3: read post-op frontmatter for ADD / UPDATE / MERGE-target /
       // UPSERT. DELETE skips the read (file is gone). Frontmatter fields
-      // stay absent when the read fails (ENOENT, EACCES, malformed YAML).
+      // default to empty arrays when the read fails (ENOENT, EACCES,
+      // malformed YAML) so the wire shape stays uniform.
       // eslint-disable-next-line no-await-in-loop -- emit order MUST match op order
       const frontmatter = op.type === 'DELETE' ? {} : await this.readFrontmatterFields(op.filePath)
 
       this.emit(AnalyticsEventNames.CURATE_OPERATION_APPLIED, {
-        absolute_path: op.filePath,
         ...(op.confidence ? {confidence: op.confidence} : {}),
         ...(op.impact ? {impact: op.impact} : {}),
-        ...(frontmatter.keywords ? {keywords: frontmatter.keywords} : {}),
+        keywords: frontmatter.keywords ?? [],
         knowledge_path: op.path,
         needs_review: op.needsReview ?? false,
         operation_type: op.type,
         ...(frontmatter.related ? {related: frontmatter.related} : {}),
-        ...(frontmatter.tags ? {tags: frontmatter.tags} : {}),
+        relative_path: toRelativePath(op.filePath, state.projectPath),
+        tags: frontmatter.tags ?? [],
         task_id: taskId,
       })
     }

@@ -50,7 +50,12 @@ function telemetryFields(record: CurateUsageRecord | undefined): {
   }
 }
 
-export const CURATE_TASK_TYPES = ['curate', 'curate-folder'] as const
+// `curate-html-direct` is the pre-ENG-2925 name still dispatched by the
+// daemon; `curate-tool-mode` is the post-rename name. Both are listed
+// so M12 state init in AnalyticsHook kicks in for tool-mode curates.
+// The analytics wire canonicalizes both to `curate-tool-mode` via
+// `toAnalyticsTaskType` in `analytics-hook.ts`.
+export const CURATE_TASK_TYPES = ['curate', 'curate-folder', 'curate-html-direct', 'curate-tool-mode'] as const
 
 // ── Summary computation ───────────────────────────────────────────────────────
 

@@ -44,7 +44,10 @@ type TaskState = {
   queryResult?: QueryResultMetadata
 }
 
-export const QUERY_TASK_TYPES: ReadonlySet<string> = new Set(['query'])
+// `query-tool-mode` is the v4.0 daemon dispatch name; legacy `query` is
+// kept for back-compat. Both names enable M12 state init in AnalyticsHook
+// (and matching query-log persistence here).
+export const QUERY_TASK_TYPES: ReadonlySet<string> = new Set(['query', 'query-tool-mode'])
 
 // ── QueryLogHandler ──────────────────────────────────────────────────────────
 

@@ -5,24 +5,28 @@ import {z} from 'zod'
  * Per-event schema for `curate_operation_applied`.
  *
  * Emitted by the daemon's `AnalyticsHook` (M12.2) once per successful curate
- * operation. Each operation carries the affected file's absolute path, its
- * knowledge-tree address, review/impact metadata, and (M12.3) the file's
- * current-state frontmatter values for tags / keywords / related.
+ * operation. Each operation carries the affected file's project-relative
+ * path, its knowledge-tree address, review/impact metadata, and (M12.3) the
+ * file's current-state frontmatter values for tags / keywords / related.
  *
- * All three frontmatter arrays are optional and absent on DELETE operations
- * (the file is gone post-op) and on read failures (defensive).
+ * Review tightening (M14 follow-up):
+ * - `absolute_path` → `relative_path` for privacy + portability across hosts
+ * - `keywords` / `tags` are now required arrays (default empty) so consumers
+ *   don't have to special-case the "field absent" shape
+ * - `related` stays optional and absent on DELETE / read-failure (file is
+ *   gone or unreadable, no related-link source to harvest from)
  */
 export const CurateOperationAppliedSchema = z
   .object({
-    absolute_path: z.string().min(1),
     confidence: z.enum(['high', 'low']).optional(),
     impact: z.enum(['high', 'low']).optional(),
-    keywords: z.array(z.string().max(256)).max(50).optional(),
+    keywords: z.array(z.string().max(256)).max(50),
     knowledge_path: z.string().min(1),
     needs_review: z.boolean(),
     operation_type: z.enum(['ADD', 'UPDATE', 'DELETE', 'MERGE', 'UPSERT']),
     related: z.array(z.string().max(256)).max(50).optional(),
-    tags: z.array(z.string().max(256)).max(50).optional(),
+    relative_path: z.string().min(1),
+    tags: z.array(z.string().max(256)).max(50),
     task_id: z.string().min(1),
   })
   .strict()

@@ -1,12 +1,20 @@
 /* eslint-disable camelcase */
 import {z} from 'zod'
 
+import {TASK_TYPE_VALUES} from '../task-types.js'
+
 /**
  * Per-event schema for `curate_run_completed`.
  *
  * Emitted by the daemon's `AnalyticsHook` (M12.2) at curate task terminal
  * states (completed / partial / cancelled / error). Carries per-task
  * operation counters so PMs can aggregate curate volume + outcome over time.
+ *
+ * M14.2 migrated `task_type` from a literal ['curate', 'curate-folder']
+ * enum to the canonical `TASK_TYPE_VALUES` tuple so v4.0 tool-mode types
+ * (curate-tool-mode) round-trip the wire boundary. The hook is expected
+ * to only emit this event for curate flavors; the schema no longer
+ * structurally enforces that and trusts the caller.
  */
 export const CurateRunCompletedSchema = z
   .object({
@@ -19,7 +27,7 @@ export const CurateRunCompletedSchema = z
     outcome: z.enum(['completed', 'partial', 'cancelled', 'error']),
     pending_review_count: z.number().int().nonnegative(),
     task_id: z.string().min(1),
-    task_type: z.enum(['curate', 'curate-folder']),
+    task_type: z.enum(TASK_TYPE_VALUES),
   })
   .strict()