feat(llm): extract Claude SYSTEM_PROMPT + generateSpec into shared @bmm/llm package

2026-05-19 18:05:31 +02:00 · 2026-05-19 18:05:31 +02:00 · bb0d9c2cda
commit bb0d9c2cda
parent ab67203921
7 changed files with 203 additions and 120 deletions
--- a/apps/api/package.json
+++ b/apps/api/package.json
@ -12,6 +12,7 @@
  "dependencies": {
    "@bmm/auth": "workspace:*",
    "@bmm/db": "workspace:*",
    "@bmm/llm": "workspace:*",
    "@bmm/types": "workspace:*",
    "@fastify/cookie": "11.0.1",
    "@fastify/cors": "10.0.1",
--- a/apps/generator/package.json
+++ b/apps/generator/package.json
@ -12,6 +12,7 @@
  "dependencies": {
    "@anthropic-ai/sdk": "0.32.1",
    "@bmm/db": "workspace:*",
    "@bmm/llm": "workspace:*",
    "@bmm/types": "workspace:*",
    "bullmq": "5.34.5",
    "drizzle-orm": "0.36.4",
--- a/apps/generator/src/lib/claude.ts
+++ b/apps/generator/src/lib/claude.ts
@ -1,127 +1,12 @@
-import Anthropic from '@anthropic-ai/sdk';
+import { generateSpec as sharedGenerate, type GenerationResult } from '@bmm/llm';
 import { GeneratorSpec, type GeneratorSpec as GeneratorSpecT } from '@bmm/types';
 import { config } from '../config.js';
-const SYSTEM_PROMPT = `You generate production-grade MCP server specifications as STRICT JSON.
+export type { GenerationResult };
 Output ONE JSON object (no markdown, no prose, no code fences) with this exact shape:
 {
  "name": "human-readable server name (max 128 chars)",
  "description": "1-2 sentence purpose",
  "tools": [
    {
      "name": "snake_case_tool_name",
      "description": "what the AI client sees — single sentence, clear",
      "inputSchema": {
        "param_name": { "type": "string|number|boolean|array|object", "description": "...", "required": true }
      },
      "implementation": "ASYNC TypeScript body. Receives {args} pre-validated. Must return MCP content blocks: { content: [{ type: 'text', text: '...' }] }. Use process.env.SECRET_NAME for secrets. NEVER use eval/Function/child_process. Use globalThis.fetch for HTTP. Wrap external calls in try/catch and return { content: [{ type: 'text', text: 'Error: ...' }], isError: true } on failure."
    }
  ],
  "resources": [],
  "prompts": [],
  "requiredSecrets": ["UPPER_SNAKE_CASE"],
  "scopes": ["mcp:read"],
  "dependencies": {}
 }
 Rules:
 - Tools are idempotent unless the description explicitly says destructive.
 - Validate all string inputs before use.
 - For databases: parameterized queries only (use the 'pg' library with $1 placeholders).
 - For HTTP APIs: globalThis.fetch with explicit timeout via AbortSignal.timeout(10000).
 - Never hardcode credentials; declare them under requiredSecrets and read via process.env.
 - Keep tool implementations under 5000 characters.
 - Do not include "import" statements in implementations — the runtime injects fetch, pg, etc.
 Return JSON only. No explanation.`;
 export interface GenerationResult {
  spec: GeneratorSpecT;
  source: 'claude' | 'mock';
 }
 export async function generateSpec(prompt: string): Promise<GenerationResult> {
-  if (!config.ANTHROPIC_API_KEY) {
+  return sharedGenerate(prompt, {
-    return { spec: mockSpec(prompt), source: 'mock' };
+    apiKey: config.ANTHROPIC_API_KEY,
  }
  const client = new Anthropic({ apiKey: config.ANTHROPIC_API_KEY });
  const response = await client.messages.create({
    model: config.MODEL_GENERATE,
-    max_tokens: 8192,
+    maxTokens: 8192,
    system: SYSTEM_PROMPT,
    messages: [{ role: 'user', content: prompt }],
  });
  const text = response.content
    .filter((b): b is { type: 'text'; text: string } => b.type === 'text')
    .map((b) => b.text)
    .join('');
  const json = extractJson(text);
  const parsed = GeneratorSpec.safeParse(json);
  if (!parsed.success) {
    throw new Error(`spec_validation_failed: ${parsed.error.message}`);
  }
  scanForInjection(parsed.data);
  return { spec: parsed.data, source: 'claude' };
 }
 function extractJson(text: string): unknown {
  const trimmed = text.trim();
  // strip ```json fences if present
  const fenced = trimmed.match(/```(?:json)?\s*([\s\S]*?)```/);
  const body = fenced ? fenced[1] : trimmed;
  if (!body) throw new Error('empty_generation_output');
  try {
    return JSON.parse(body);
  } catch (e) {
    throw new Error(`generation_not_json: ${(e as Error).message}`);
  }
 }
 const BANNED_PATTERNS = [
  /\beval\s*\(/,
  /\bnew\s+Function\s*\(/,
  /\brequire\s*\(\s*['"]child_process['"]/,
  /\bchild_process\b/,
  /ignore\s+previous\s+instructions/i,
  /disregard\s+(the\s+)?(above|previous)/i,
 ];
 function scanForInjection(spec: GeneratorSpecT): void {
  for (const tool of spec.tools) {
    for (const pattern of BANNED_PATTERNS) {
      if (pattern.test(tool.implementation) || pattern.test(tool.description)) {
        throw new Error(`banned_pattern_detected: ${pattern.source}`);
      }
    }
  }
 }
 function mockSpec(prompt: string): GeneratorSpecT {
  return {
    name: 'Echo MCP',
    description: `Mock server (no ANTHROPIC_API_KEY). Prompt was: ${prompt.slice(0, 200)}`,
    tools: [
      {
        name: 'echo',
        description: 'Echoes the input string back to the caller.',
        inputSchema: {
          message: { type: 'string', description: 'Message to echo back', required: true },
        },
        implementation: `const msg = String(args.message ?? '');\nreturn { content: [{ type: 'text', text: \`echo: \${msg}\` }] };`,
      },
      {
        name: 'now',
        description: 'Returns the current server UTC timestamp.',
        inputSchema: {},
        implementation: `return { content: [{ type: 'text', text: new Date().toISOString() }] };`,
      },
    ],
    resources: [],
    prompts: [],
    requiredSecrets: [],
    scopes: ['mcp:read'],
    dependencies: {},
  };
 }
--- a/packages/llm/package.json
+++ b/packages/llm/package.json
@ -0,0 +1,23 @@
 {
  "name": "@bmm/llm",
  "version": "0.1.0",
  "type": "module",
  "private": true,
  "main": "./src/index.ts",
  "types": "./src/index.ts",
  "exports": {
    ".": "./src/index.ts"
  },
  "scripts": {
    "typecheck": "tsc --noEmit"
  },
  "dependencies": {
    "@anthropic-ai/sdk": "0.32.1",
    "@bmm/types": "workspace:*",
    "zod": "3.25.76"
  },
  "devDependencies": {
    "@types/node": "22.10.2",
    "typescript": "5.7.2"
  }
 }
--- a/packages/llm/src/index.ts
+++ b/packages/llm/src/index.ts
@ -0,0 +1,139 @@
 import Anthropic from '@anthropic-ai/sdk';
 import { GeneratorSpec, type GeneratorSpec as GeneratorSpecT } from '@bmm/types';
 export const SYSTEM_PROMPT = `You generate production-grade MCP server specifications as STRICT JSON.
 Output ONE JSON object (no markdown, no prose, no code fences) with this exact shape:
 {
  "name": "human-readable server name (max 128 chars)",
  "description": "1-2 sentence purpose",
  "tools": [
    {
      "name": "snake_case_tool_name",
      "description": "what the AI client sees — single sentence, clear",
      "inputSchema": {
        "param_name": { "type": "string|number|boolean|array|object", "description": "...", "required": true }
      },
      "implementation": "ASYNC TypeScript body. Receives {args} pre-validated. Must return MCP content blocks: { content: [{ type: 'text', text: '...' }] }. Use process.env.SECRET_NAME for secrets. NEVER use eval/Function/child_process. Use globalThis.fetch for HTTP. Wrap external calls in try/catch and return { content: [{ type: 'text', text: 'Error: ...' }], isError: true } on failure."
    }
  ],
  "resources": [],
  "prompts": [],
  "requiredSecrets": ["UPPER_SNAKE_CASE"],
  "scopes": ["mcp:read"],
  "dependencies": {}
 }
 Rules:
 - Tools are idempotent unless the description explicitly says destructive.
 - Validate all string inputs before use.
 - For databases: parameterized queries only (use the 'pg' library with $1 placeholders).
 - For HTTP APIs: globalThis.fetch with explicit timeout via AbortSignal.timeout(10000).
 - Never hardcode credentials; declare them under requiredSecrets and read via process.env.
 - Keep tool implementations under 5000 characters.
 - Do not include "import" statements in implementations — the runtime injects fetch, pg, etc.
 Return JSON only. No explanation.`;
 const BANNED_PATTERNS = [
  /\beval\s*\(/,
  /\bnew\s+Function\s*\(/,
  /\brequire\s*\(\s*['"]child_process['"]/,
  /\bchild_process\b/,
  /ignore\s+previous\s+instructions/i,
  /disregard\s+(the\s+)?(above|previous)/i,
 ];
 export interface GenerationResult {
  spec: GeneratorSpecT;
  source: 'claude' | 'mock';
 }
 export interface GenerateOptions {
  apiKey?: string;
  model?: string;
  maxTokens?: number;
 }
 export async function generateSpec(prompt: string, opts: GenerateOptions = {}): Promise<GenerationResult> {
  if (!opts.apiKey) {
    return { spec: mockSpec(prompt), source: 'mock' };
  }
  const client = new Anthropic({ apiKey: opts.apiKey });
  const response = await client.messages.create({
    model: opts.model ?? 'claude-opus-4-7',
    max_tokens: opts.maxTokens ?? 8192,
    system: SYSTEM_PROMPT,
    messages: [{ role: 'user', content: prompt }],
  });
  const text = response.content
    .filter((b): b is { type: 'text'; text: string } => b.type === 'text')
    .map((b) => b.text)
    .join('');
  const json = extractJson(text);
  const parsed = GeneratorSpec.safeParse(json);
  if (!parsed.success) {
    throw new SpecValidationError(parsed.error.message);
  }
  scanForInjection(parsed.data);
  return { spec: parsed.data, source: 'claude' };
 }
 export class SpecValidationError extends Error {
  override readonly name = 'SpecValidationError';
 }
 export class BannedPatternError extends Error {
  override readonly name = 'BannedPatternError';
 }
 function extractJson(text: string): unknown {
  const trimmed = text.trim();
  const fenced = trimmed.match(/```(?:json)?\s*([\s\S]*?)```/);
  const body = fenced ? fenced[1] : trimmed;
  if (!body) throw new SpecValidationError('empty_generation_output');
  try {
    return JSON.parse(body);
  } catch (e) {
    throw new SpecValidationError(`generation_not_json: ${(e as Error).message}`);
  }
 }
 function scanForInjection(spec: GeneratorSpecT): void {
  for (const tool of spec.tools) {
    for (const pattern of BANNED_PATTERNS) {
      if (pattern.test(tool.implementation) || pattern.test(tool.description)) {
        throw new BannedPatternError(`banned_pattern_detected: ${pattern.source}`);
      }
    }
  }
 }
 export function mockSpec(prompt: string): GeneratorSpecT {
  return {
    name: 'Echo MCP',
    description: `Mock server (no ANTHROPIC_API_KEY). Prompt was: ${prompt.slice(0, 200)}`,
    tools: [
      {
        name: 'echo',
        description: 'Echoes the input string back to the caller.',
        inputSchema: {
          message: { type: 'string', description: 'Message to echo back', required: true },
        },
        implementation: `const msg = String(args.message ?? '');\nreturn { content: [{ type: 'text', text: \`echo: \${msg}\` }] };`,
      },
      {
        name: 'now',
        description: 'Returns the current server UTC timestamp.',
        inputSchema: {},
        implementation: `return { content: [{ type: 'text', text: new Date().toISOString() }] };`,
      },
    ],
    resources: [],
    prompts: [],
    requiredSecrets: [],
    scopes: ['mcp:read'],
    dependencies: {},
  };
 }
--- a/packages/llm/tsconfig.json
+++ b/packages/llm/tsconfig.json
@ -0,0 +1,9 @@
 {
  "extends": "../../tsconfig.base.json",
  "compilerOptions": {
    "outDir": "./dist",
    "rootDir": "./src",
    "types": ["node"]
  },
  "include": ["src/**/*"]
 }
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@ -26,6 +26,9 @@ importers:
      '@bmm/db':
        specifier: workspace:*
        version: link:../../packages/db
      '@bmm/llm':
        specifier: workspace:*
        version: link:../../packages/llm
      '@bmm/types':
        specifier: workspace:*
        version: link:../../packages/types
@ -75,6 +78,9 @@ importers:
      '@bmm/db':
        specifier: workspace:*
        version: link:../../packages/db
      '@bmm/llm':
        specifier: workspace:*
        version: link:../../packages/llm
      '@bmm/types':
        specifier: workspace:*
        version: link:../../packages/types
@ -213,6 +219,25 @@ importers:
        specifier: 5.7.2
        version: 5.7.2
  packages/llm:
    dependencies:
      '@anthropic-ai/sdk':
        specifier: 0.32.1
        version: 0.32.1
      '@bmm/types':
        specifier: workspace:*
        version: link:../types
      zod:
        specifier: 3.25.76
        version: 3.25.76
    devDependencies:
      '@types/node':
        specifier: 22.10.2
        version: 22.10.2
      typescript:
        specifier: 5.7.2
        version: 5.7.2
  packages/types:
    dependencies:
      zod: