Name: AI Engineer Skill
Author: cffrank

Buscar habilidades.../

AI Engineer Skill | Skills Pool

// Text generation
// Runs the `@cf/meta/llama-3.1-8b-instruct` model through the `env.AI` binding,
// sending a fixed system prompt followed by the caller-supplied `userMessage`.
const response = await env.AI.run('@cf/meta/llama-3.1-8b-instruct', {
  messages: [
    { role: 'system', content: 'You are a helpful assistant.' },
    { role: 'user', content: userMessage },
  ],
  // Generation options passed alongside the messages.
  max_tokens: 500,
  temperature: 0.7,
});
// The generated text is read from the `response` field of the result object.
const text = response.response;

// Embeddings
// Sends an array of strings to the `@cf/baai/bge-base-en-v1.5` model in a
// single `env.AI.run` call.
const embeddings = await env.AI.run('@cf/baai/bge-base-en-v1.5', {
  text: ['Document chunk 1', 'Document chunk 2'],
});
// One vector per input string, in `embeddings.data`:
// embeddings.data = [[0.1, 0.2, ...], [0.3, 0.4, ...]]

// Text classification
// Passes a single string to the `@cf/huggingface/distilbert-sst-2-int8` model.
const result = await env.AI.run('@cf/huggingface/distilbert-sst-2-int8', {
  text: 'This product is amazing!',
});
// Example result shape (an array of label/score objects):
// result = [{ label: 'POSITIVE', score: 0.98 }]

// Route through AI Gateway for caching, logging, rate limiting
// Replace ACCOUNT_ID and GATEWAY_NAME with the values for your own gateway.
const GATEWAY_URL = 'https://gateway.ai.cloudflare.com/v1/ACCOUNT_ID/GATEWAY_NAME';

// Anthropic via Gateway
// The request is forwarded to Anthropic's Messages API, which authenticates
// with an `x-api-key` header (not `Authorization: Bearer`) and requires an
// `anthropic-version` header on every request.
// The result is bound to `anthropicResponse` so it does not redeclare the
// `response` binding used by the other snippets.
const anthropicResponse = await fetch(`${GATEWAY_URL}/anthropic/v1/messages`, {
  method: 'POST',
  headers: {
    'x-api-key': env.ANTHROPIC_API_KEY,
    'anthropic-version': '2023-06-01',
    'Content-Type': 'application/json',
  },
  body: JSON.stringify({
    model: 'claude-sonnet-4-20250514',
    max_tokens: 1000,
    messages: [{ role: 'user', content: prompt }],
  }),
});

// OpenAI via Gateway
// POSTs a chat-completions request to the gateway's `/openai` route using the
// OpenAI API key as a bearer token.
// The result is bound to `openaiResponse` so it does not redeclare the
// `response` binding used by the other snippets.
const openaiResponse = await fetch(`${GATEWAY_URL}/openai/chat/completions`, {
  method: 'POST',
  headers: {
    'Authorization': `Bearer ${env.OPENAI_API_KEY}`,
    'Content-Type': 'application/json',
  },
  body: JSON.stringify({
    model: 'gpt-4o-mini',
    messages: [{ role: 'user', content: prompt }],
  }),
});

// 1. Chunk document
/**
 * Splits `text` into windows of at most `chunkSize` characters, where each
 * window starts `chunkSize - overlap` characters after the previous one so
 * that consecutive chunks share `overlap` characters.
 *
 * @param text - The text to split. An empty string yields an empty array.
 * @param chunkSize - Maximum number of characters per chunk; must be positive.
 * @param overlap - Number of characters shared between consecutive chunks;
 *   must be smaller than `chunkSize`.
 * @returns The chunks in document order. The final chunk may be shorter than
 *   `chunkSize`.
 * @throws RangeError if `chunkSize` is not positive, or if `overlap` is not
 *   smaller than `chunkSize` (the window would never advance).
 */
function chunkText(text: string, chunkSize = 500, overlap = 50): string[] {
  // `!(x > 0)` also rejects NaN.
  if (!(chunkSize > 0)) {
    throw new RangeError(`chunkSize must be a positive number, got ${chunkSize}`);
  }
  const step = chunkSize - overlap;
  // A zero or negative step would keep the loop index from ever reaching the
  // end of the text, so fail fast instead of looping forever.
  if (!(step > 0)) {
    throw new RangeError(
      `overlap (${overlap}) must be smaller than chunkSize (${chunkSize})`,
    );
  }

  const chunks: string[] = [];
  for (let start = 0; start < text.length; start += step) {
    chunks.push(text.slice(start, start + chunkSize));
  }
  return chunks;
}

// 2. Generate embeddings and store
/**
 * Chunks a document, embeds every chunk, and persists both the chunk text
 * (D1) and the chunk vectors (Vectorize).
 *
 * Vector ids are `${doc.id}-${chunkIndex}`, and each vector carries
 * `{ docId, chunkIndex }` metadata so a query can map a match back to its
 * row in the `chunks` table.
 *
 * @param doc - The document to ingest; `doc.text` is split with `chunkText`.
 * @param env - Worker bindings; uses `env.AI`, `env.DB` and `env.VECTORIZE`.
 * @returns A promise that resolves once both stores have been written.
 *   Resolves without writing anything when the document has no text.
 */
async function ingestDocument(doc: { id: string; text: string }, env: Env) {
  const chunks = chunkText(doc.text);

  // An empty document produces no chunks; skip the embedding request and the
  // empty D1/Vectorize writes instead of sending empty payloads.
  if (chunks.length === 0) {
    return;
  }

  // Embed in bounded batches so long documents do not exceed the model's
  // per-request input limit.
  // NOTE(review): 100 texts per request is the documented cap for the bge
  // embedding models at the time of writing; confirm against the model page.
  const EMBEDDING_BATCH_SIZE = 100;
  const embeddingValues: number[][] = [];
  for (let start = 0; start < chunks.length; start += EMBEDDING_BATCH_SIZE) {
    const embeddings = await env.AI.run('@cf/baai/bge-base-en-v1.5', {
      text: chunks.slice(start, start + EMBEDDING_BATCH_SIZE),
    });
    // Batches are processed in order, so embeddingValues[i] stays aligned
    // with chunks[i].
    embeddingValues.push(...embeddings.data);
  }

  // Store chunks in D1
  const batch = chunks.map((chunk, i) =>
    env.DB.prepare('INSERT INTO chunks (doc_id, chunk_index, text) VALUES (?, ?, ?)')
      .bind(doc.id, i, chunk)
  );
  await env.DB.batch(batch);

  // Store vectors in Vectorize
  const vectors = embeddingValues.map((values, i) => ({
    id: `${doc.id}-${i}`,
    values,
    metadata: { docId: doc.id, chunkIndex: i },
  }));
  await env.VECTORIZE.upsert(vectors);
}

// 3. Query
/**
 * Answers `query` with retrieval-augmented generation: embeds the query,
 * finds the nearest chunk vectors in Vectorize, loads the matching chunk
 * text from D1, and asks the text model to answer using that text as
 * context.
 *
 * @param query - The user's question.
 * @param env - Worker bindings; uses `env.AI`, `env.VECTORIZE` and `env.DB`.
 * @returns The model's answer text.
 */
async function ragQuery(query: string, env: Env): Promise<string> {
  // Embed the query
  const queryEmb = await env.AI.run('@cf/baai/bge-base-en-v1.5', {
    text: [query],
  });

  // Find similar chunks
  const matches = await env.VECTORIZE.query(queryEmb.data[0], {
    topK: 5,
    returnMetadata: true,
  });

  // Each match identifies its chunk by (docId, chunkIndex). Keep the pair
  // together per match: the top matches may belong to different documents,
  // so a single docId cannot be assumed for all of them.
  const chunkKeys = matches.matches.flatMap(m => {
    const docId = m.metadata?.docId;
    const chunkIndex = m.metadata?.chunkIndex;
    return docId == null || chunkIndex == null ? [] : [{ docId, chunkIndex }];
  });

  // Retrieve chunk text from D1
  let context = '';
  if (chunkKeys.length > 0) {
    // One bound placeholder pair per chunk. Binding a comma-joined string to
    // a single `IN (?)` placeholder compares chunk_index against one string
    // value and never matches the integer indexes. The SQL text is built
    // only from fixed placeholder fragments; all values are still bound.
    const where = chunkKeys
      .map(() => '(doc_id = ? AND chunk_index = ?)')
      .join(' OR ');
    const params = chunkKeys.flatMap(key => [key.docId, key.chunkIndex]);
    const chunks = await env.DB
      .prepare(`SELECT text FROM chunks WHERE ${where}`)
      .bind(...params)
      .all();

    context = chunks.results.map(c => c.text).join('\n\n');
  }

  // Generate answer with context
  const answer = await env.AI.run('@cf/meta/llama-3.1-8b-instruct', {
    messages: [
      { role: 'system', content: `Answer based on this context:\n${context}` },
      { role: 'user', content: query },
    ],
  });

  return answer.response;
}

Use case	Model	Binding
General text generation	`@cf/meta/llama-3.1-8b-instruct`	`env.AI`
Embeddings	`@cf/baai/bge-base-en-v1.5`	`env.AI`
Summarization	`@cf/meta/llama-3.1-8b-instruct`	`env.AI`
Classification	`@cf/huggingface/distilbert-sst-2-int8`	`env.AI`
Code generation	Route to Claude via AI Gateway	Gateway
Complex reasoning	Route to Claude Opus via AI Gateway	Gateway
High-volume, low-cost	Workers AI (free tier: 10,000 Neurons/day)	`env.AI`

-- Versioned prompt templates. Each row is one version of a named prompt
-- together with the model and generation settings to use with it.
CREATE TABLE prompts (
  id TEXT PRIMARY KEY,
  name TEXT NOT NULL,
  -- Version number of this prompt; starts at 1 when not specified.
  version INTEGER NOT NULL DEFAULT 1,
  system_prompt TEXT NOT NULL,
  model TEXT NOT NULL,
  temperature REAL DEFAULT 0.7,
  max_tokens INTEGER DEFAULT 500,
  -- Rows are active by default; lookups can filter on this flag.
  is_active BOOLEAN DEFAULT TRUE,
  -- Creation timestamp stored as text, defaulting to datetime('now').
  created_at TEXT DEFAULT (datetime('now'))
);

-- A given (name, version) pair may appear only once.
CREATE UNIQUE INDEX idx_prompt_name_version ON prompts(name, version);

/**
 * Fetches the active row with the highest `version` for the given prompt
 * name from the `prompts` table.
 *
 * @param name - Value matched against the `name` column.
 * @param env - Worker bindings; uses `env.DB`.
 * @returns Whatever `first()` yields for the query: the single selected row.
 */
async function getPrompt(name: string, env: Env) {
  const sql =
    'SELECT * FROM prompts WHERE name = ? AND is_active = TRUE ORDER BY version DESC LIMIT 1';
  const statement = env.DB.prepare(sql).bind(name);
  return statement.first();
}

Component	Purpose	Binding
Workers AI	Run models at the edge (text, embeddings, image)	`env.AI`
AI Gateway	Proxy, cache, rate limit, log AI requests	Gateway URL
Vectorize	Vector database for embeddings	`env.VECTORIZE`
D1	Store prompts, results, metadata	`env.DB`
R2	Store documents for RAG ingestion	`env.ASSETS`

Component	Purpose	Binding
Workers AI	Run models at the edge (text, embeddings, image)	`env.AI`
AI Gateway	Proxy, cache, rate limit, log AI requests	Gateway URL
Vectorize	Vector database for embeddings	`env.VECTORIZE`
D1	Store prompts, results, metadata	`env.DB`
R2	Store documents for RAG ingestion	`env.ASSETS`

AI Engineer Skill

Platform Components

Workers AI Inference

AI Engineer Skill

Platform Components

Workers AI Inference

AI Gateway (Provider Routing)

Gateway Benefits

RAG Pipeline on D1 + Vectorize

Document Ingestion

Model Selection Guide

Prompt Management

Cost Optimization

Relationship to Other Skills

Openai Whisper

Voice Call

Prose

Clawhub

Sherpa Onnx Tts

Openai Whisper Api