chore: initialize recovered claude workspace
This commit is contained in:
88
src/utils/dxt/helpers.ts
Normal file
88
src/utils/dxt/helpers.ts
Normal file
@@ -0,0 +1,88 @@
|
||||
import type { McpbManifest } from '@anthropic-ai/mcpb'
|
||||
import { errorMessage } from '../errors.js'
|
||||
import { jsonParse } from '../slowOperations.js'
|
||||
|
||||
/**
|
||||
* Parses and validates a DXT manifest from a JSON object.
|
||||
*
|
||||
* Lazy-imports @anthropic-ai/mcpb: that package uses zod v3 which eagerly
|
||||
* creates 24 .bind(this) closures per schema instance (~300 instances between
|
||||
* schemas.js and schemas-loose.js). Deferring the import keeps ~700KB of bound
|
||||
* closures out of the startup heap for sessions that never touch .dxt/.mcpb.
|
||||
*/
|
||||
export async function validateManifest(
|
||||
manifestJson: unknown,
|
||||
): Promise<McpbManifest> {
|
||||
const { McpbManifestSchema } = await import('@anthropic-ai/mcpb')
|
||||
const parseResult = McpbManifestSchema.safeParse(manifestJson)
|
||||
|
||||
if (!parseResult.success) {
|
||||
const errors = parseResult.error.flatten()
|
||||
const errorMessages = [
|
||||
...Object.entries(errors.fieldErrors).map(
|
||||
([field, errs]) => `${field}: ${errs?.join(', ')}`,
|
||||
),
|
||||
...(errors.formErrors || []),
|
||||
]
|
||||
.filter(Boolean)
|
||||
.join('; ')
|
||||
|
||||
throw new Error(`Invalid manifest: ${errorMessages}`)
|
||||
}
|
||||
|
||||
return parseResult.data
|
||||
}
|
||||
|
||||
/**
|
||||
* Parses and validates a DXT manifest from raw text data.
|
||||
*/
|
||||
export async function parseAndValidateManifestFromText(
|
||||
manifestText: string,
|
||||
): Promise<McpbManifest> {
|
||||
let manifestJson: unknown
|
||||
|
||||
try {
|
||||
manifestJson = jsonParse(manifestText)
|
||||
} catch (error) {
|
||||
throw new Error(`Invalid JSON in manifest.json: ${errorMessage(error)}`)
|
||||
}
|
||||
|
||||
return validateManifest(manifestJson)
|
||||
}
|
||||
|
||||
/**
|
||||
* Parses and validates a DXT manifest from raw binary data.
|
||||
*/
|
||||
export async function parseAndValidateManifestFromBytes(
|
||||
manifestData: Uint8Array,
|
||||
): Promise<McpbManifest> {
|
||||
const manifestText = new TextDecoder().decode(manifestData)
|
||||
return parseAndValidateManifestFromText(manifestText)
|
||||
}
|
||||
|
||||
/**
|
||||
* Generates an extension ID from author name and extension name.
|
||||
* Uses the same algorithm as the directory backend for consistency.
|
||||
*/
|
||||
export function generateExtensionId(
|
||||
manifest: McpbManifest,
|
||||
prefix?: 'local.unpacked' | 'local.dxt',
|
||||
): string {
|
||||
const sanitize = (str: string) =>
|
||||
str
|
||||
.toLowerCase()
|
||||
.replace(/\s+/g, '-')
|
||||
.replace(/[^a-z0-9-_.]/g, '')
|
||||
.replace(/-+/g, '-')
|
||||
.replace(/^-+|-+$/g, '')
|
||||
|
||||
const authorName = manifest.author.name
|
||||
const extensionName = manifest.name
|
||||
|
||||
const sanitizedAuthor = sanitize(authorName)
|
||||
const sanitizedName = sanitize(extensionName)
|
||||
|
||||
return prefix
|
||||
? `${prefix}.${sanitizedAuthor}.${sanitizedName}`
|
||||
: `${sanitizedAuthor}.${sanitizedName}`
|
||||
}
|
||||
226
src/utils/dxt/zip.ts
Normal file
226
src/utils/dxt/zip.ts
Normal file
@@ -0,0 +1,226 @@
|
||||
import { isAbsolute, normalize } from 'path'
|
||||
import { logForDebugging } from '../debug.js'
|
||||
import { isENOENT } from '../errors.js'
|
||||
import { getFsImplementation } from '../fsOperations.js'
|
||||
import { containsPathTraversal } from '../path.js'
|
||||
|
||||
/**
 * Hard limits enforced while extracting zip archives, to guard against
 * zip bombs and resource exhaustion. Sizes are uncompressed bytes unless
 * noted otherwise.
 */
const LIMITS = {
  MAX_FILE_SIZE: 512 * 1024 * 1024, // 512MB per file
  MAX_TOTAL_SIZE: 1024 * 1024 * 1024, // 1024MB total uncompressed
  MAX_FILE_COUNT: 100000, // Maximum number of files
  MAX_COMPRESSION_RATIO: 50, // Anything above 50:1 is suspicious
  // NOTE(review): MIN_COMPRESSION_RATIO is not referenced anywhere in this
  // file — confirm whether a minimum-ratio check was intended but never wired.
  MIN_COMPRESSION_RATIO: 0.5, // Below 0.5:1 might indicate already compressed malicious content
}
|
||||
|
||||
/**
 * State tracker for zip file validation during extraction.
 * Mutated in place by validateZipFile as each archive entry is visited.
 */
type ZipValidationState = {
  fileCount: number // entries seen so far; incremented per validateZipFile call
  totalUncompressedSize: number // running sum of declared uncompressed sizes, bytes
  compressedSize: number // size of the whole zip on disk, bytes (ratio denominator)
  errors: string[] // NOTE(review): never appended to in this file — possibly vestigial
}

/**
 * File metadata from fflate filter
 * (only the fields this module actually reads).
 */
type ZipFileMetadata = {
  name: string // entry path inside the archive
  originalSize?: number // declared uncompressed size; may be absent
}

/**
 * Result of validating a single file in a zip archive.
 * `error` is only meaningful when `isValid` is false.
 */
type FileValidationResult = {
  isValid: boolean
  error?: string
}
|
||||
|
||||
/**
|
||||
* Validates a file path to prevent path traversal attacks
|
||||
*/
|
||||
export function isPathSafe(filePath: string): boolean {
|
||||
if (containsPathTraversal(filePath)) {
|
||||
return false
|
||||
}
|
||||
|
||||
// Normalize the path to resolve any '.' segments
|
||||
const normalized = normalize(filePath)
|
||||
|
||||
// Check for absolute paths (we only want relative paths in archives)
|
||||
if (isAbsolute(normalized)) {
|
||||
return false
|
||||
}
|
||||
|
||||
return true
|
||||
}
|
||||
|
||||
/**
|
||||
* Validates a single file during zip extraction
|
||||
*/
|
||||
export function validateZipFile(
|
||||
file: ZipFileMetadata,
|
||||
state: ZipValidationState,
|
||||
): FileValidationResult {
|
||||
state.fileCount++
|
||||
|
||||
let error: string | undefined
|
||||
|
||||
// Check file count
|
||||
if (state.fileCount > LIMITS.MAX_FILE_COUNT) {
|
||||
error = `Archive contains too many files: ${state.fileCount} (max: ${LIMITS.MAX_FILE_COUNT})`
|
||||
}
|
||||
|
||||
// Validate path safety
|
||||
if (!isPathSafe(file.name)) {
|
||||
error = `Unsafe file path detected: "${file.name}". Path traversal or absolute paths are not allowed.`
|
||||
}
|
||||
|
||||
// Check individual file size
|
||||
const fileSize = file.originalSize || 0
|
||||
if (fileSize > LIMITS.MAX_FILE_SIZE) {
|
||||
error = `File "${file.name}" is too large: ${Math.round(fileSize / 1024 / 1024)}MB (max: ${Math.round(LIMITS.MAX_FILE_SIZE / 1024 / 1024)}MB)`
|
||||
}
|
||||
|
||||
// Track total uncompressed size
|
||||
state.totalUncompressedSize += fileSize
|
||||
|
||||
// Check total size
|
||||
if (state.totalUncompressedSize > LIMITS.MAX_TOTAL_SIZE) {
|
||||
error = `Archive total size is too large: ${Math.round(state.totalUncompressedSize / 1024 / 1024)}MB (max: ${Math.round(LIMITS.MAX_TOTAL_SIZE / 1024 / 1024)}MB)`
|
||||
}
|
||||
|
||||
// Check compression ratio for zip bomb detection
|
||||
const currentRatio = state.totalUncompressedSize / state.compressedSize
|
||||
if (currentRatio > LIMITS.MAX_COMPRESSION_RATIO) {
|
||||
error = `Suspicious compression ratio detected: ${currentRatio.toFixed(1)}:1 (max: ${LIMITS.MAX_COMPRESSION_RATIO}:1). This may be a zip bomb.`
|
||||
}
|
||||
|
||||
return error ? { isValid: false, error } : { isValid: true }
|
||||
}
|
||||
|
||||
/**
|
||||
* Unzips data from a Buffer and returns its contents as a record of file paths to Uint8Array data.
|
||||
* Uses unzipSync to avoid fflate worker termination crashes in bun.
|
||||
* Accepts raw zip bytes so that the caller can read the file asynchronously.
|
||||
*
|
||||
* fflate is lazy-imported to avoid its ~196KB of top-level lookup tables (revfd
|
||||
* Int32Array(32769), rev Uint16Array(32768), etc.) being allocated at startup
|
||||
* when this module is reached via the plugin loader chain.
|
||||
*/
|
||||
export async function unzipFile(
|
||||
zipData: Buffer,
|
||||
): Promise<Record<string, Uint8Array>> {
|
||||
const { unzipSync } = await import('fflate')
|
||||
const compressedSize = zipData.length
|
||||
|
||||
const state: ZipValidationState = {
|
||||
fileCount: 0,
|
||||
totalUncompressedSize: 0,
|
||||
compressedSize: compressedSize,
|
||||
errors: [],
|
||||
}
|
||||
|
||||
const result = unzipSync(new Uint8Array(zipData), {
|
||||
filter: file => {
|
||||
const validationResult = validateZipFile(file, state)
|
||||
if (!validationResult.isValid) {
|
||||
throw new Error(validationResult.error!)
|
||||
}
|
||||
return true
|
||||
},
|
||||
})
|
||||
|
||||
logForDebugging(
|
||||
`Zip extraction completed: ${state.fileCount} files, ${Math.round(state.totalUncompressedSize / 1024)}KB uncompressed`,
|
||||
)
|
||||
|
||||
return result
|
||||
}
|
||||
|
||||
/**
|
||||
* Parse Unix file modes from a zip's central directory.
|
||||
*
|
||||
* fflate's `unzipSync` returns only `Record<string, Uint8Array>` — it does not
|
||||
* surface the external file attributes stored in the central directory. This
|
||||
* means executable bits are lost during extraction (everything becomes 0644).
|
||||
* The git-clone path preserves +x natively, but the GCS/zip path needs this
|
||||
* helper to keep parity.
|
||||
*
|
||||
* Returns `name → mode` for entries created on a Unix host (`versionMadeBy`
|
||||
* high byte === 3). Entries from other hosts, or with no mode bits set, are
|
||||
* omitted. Callers should treat a missing key as "use default mode".
|
||||
*
|
||||
* Format per PKZIP APPNOTE.TXT §4.3.12 (central directory) and §4.3.16 (EOCD).
|
||||
* ZIP64 is not handled — returns `{}` on archives >4GB or >65535 entries,
|
||||
* which is fine for marketplace zips (~3.5MB) and MCPB bundles.
|
||||
*/
|
||||
export function parseZipModes(data: Uint8Array): Record<string, number> {
|
||||
// Buffer view for readUInt* methods — shares memory, no copy.
|
||||
const buf = Buffer.from(data.buffer, data.byteOffset, data.byteLength)
|
||||
const modes: Record<string, number> = {}
|
||||
|
||||
// 1. Find the End of Central Directory record (sig 0x06054b50). It lives in
|
||||
// the trailing 22 + 65535 bytes (fixed EOCD size + max comment length).
|
||||
// Scan backwards — the EOCD is typically the last 22 bytes.
|
||||
const minEocd = Math.max(0, buf.length - 22 - 0xffff)
|
||||
let eocd = -1
|
||||
for (let i = buf.length - 22; i >= minEocd; i--) {
|
||||
if (buf.readUInt32LE(i) === 0x06054b50) {
|
||||
eocd = i
|
||||
break
|
||||
}
|
||||
}
|
||||
if (eocd < 0) return modes // malformed — let fflate's error surface elsewhere
|
||||
|
||||
const entryCount = buf.readUInt16LE(eocd + 10)
|
||||
let off = buf.readUInt32LE(eocd + 16) // central directory start offset
|
||||
|
||||
// 2. Walk central directory entries (sig 0x02014b50). Each entry has a
|
||||
// 46-byte fixed header followed by variable-length name/extra/comment.
|
||||
for (let i = 0; i < entryCount; i++) {
|
||||
if (off + 46 > buf.length || buf.readUInt32LE(off) !== 0x02014b50) break
|
||||
const versionMadeBy = buf.readUInt16LE(off + 4)
|
||||
const nameLen = buf.readUInt16LE(off + 28)
|
||||
const extraLen = buf.readUInt16LE(off + 30)
|
||||
const commentLen = buf.readUInt16LE(off + 32)
|
||||
const externalAttr = buf.readUInt32LE(off + 38)
|
||||
const name = buf.toString('utf8', off + 46, off + 46 + nameLen)
|
||||
|
||||
// versionMadeBy high byte = host OS. 3 = Unix. For Unix zips, the high
|
||||
// 16 bits of externalAttr hold st_mode (file type + permission bits).
|
||||
if (versionMadeBy >> 8 === 3) {
|
||||
const mode = (externalAttr >>> 16) & 0xffff
|
||||
if (mode) modes[name] = mode
|
||||
}
|
||||
|
||||
off += 46 + nameLen + extraLen + commentLen
|
||||
}
|
||||
|
||||
return modes
|
||||
}
|
||||
|
||||
/**
|
||||
* Reads a zip file from disk asynchronously and unzips it.
|
||||
* Returns its contents as a record of file paths to Uint8Array data.
|
||||
*/
|
||||
export async function readAndUnzipFile(
|
||||
filePath: string,
|
||||
): Promise<Record<string, Uint8Array>> {
|
||||
const fs = getFsImplementation()
|
||||
|
||||
try {
|
||||
const zipData = await fs.readFileBytes(filePath)
|
||||
// await is required here: without it, rejections from the now-async
|
||||
// unzipFile() escape the try/catch and bypass the error wrapping below.
|
||||
return await unzipFile(zipData)
|
||||
} catch (error) {
|
||||
if (isENOENT(error)) {
|
||||
throw error
|
||||
}
|
||||
const errorMessage = error instanceof Error ? error.message : String(error)
|
||||
throw new Error(`Failed to read or unzip file: ${errorMessage}`)
|
||||
}
|
||||
}
|
||||
Reference in New Issue
Block a user