traceloop · nina-kollman · Aug 22, 2025 · Aug 22, 2025 · Aug 22, 2025 · Aug 22, 2025
diff --git a/.gitignore b/.gitignore
@@ -20,6 +20,7 @@ node_modules
 
 # IDE - VSCode
 .vscode/*
+.vscode/
 !.vscode/settings.json
 !.vscode/tasks.json
 !.vscode/launch.json
@@ -46,4 +47,7 @@ Thumbs.db
 # env
 .env*
 chroma.sqlite3
-chroma.log
+chroma.log
+
+# claude
+.claude
diff --git a/CLAUDE.md b/CLAUDE.md
@@ -0,0 +1,140 @@
+# CLAUDE.md
+
+This file provides guidance to Claude Code (claude.ai/code) when working with code in this repository.
+
+## Project Overview
+
+OpenLLMetry-JS is a JavaScript/TypeScript observability framework for LLM applications, built on OpenTelemetry. It provides instrumentation for major LLM providers (OpenAI, Anthropic, etc.) and vector databases, with a unified SDK for easy integration.
+
+## Development Commands
+
+### Building
+```bash
+# Build all packages
+pnpm nx run-many -t build
+# or
+pnpm nx run-many --targets=build
+
+# Build affected packages only
+pnpm nx affected -t build
+```
+
+### Testing
+Each package has its own test command:
+```bash
+# Test individual packages
+cd packages/traceloop-sdk
+pnpm test
+
+# Test specific instrumentation
+cd packages/instrumentation-openai
+pnpm test
+```
+
+### Linting
+```bash
+# Lint individual packages
+cd packages/[package-name]
+pnpm lint
+
+# Fix lint issues
+pnpm lint:fix
+```
+
+### Publishing
+```bash
+pnpm nx run-many --targets=build
+pnpm lerna publish --no-private
+```
+
+## Architecture
+
+### Monorepo Structure
+- **Lerna + Nx**: Manages multiple packages with shared tooling
+- **packages/**: Contains all publishable packages and internal tooling
+- **Rollup**: Used for building packages with TypeScript compilation
+
+### Core Packages
+
+#### `traceloop-sdk` (Main SDK)
+- **Path**: `packages/traceloop-sdk/`
+- **Exports**: `@traceloop/node-server-sdk`
+- **Purpose**: Primary entry point that orchestrates all instrumentations
+- **Key Files**:
+  - `src/lib/tracing/decorators.ts`: Workflow and task decorators (`@workflow`, `@task`, `@agent`)
+  - `src/lib/tracing/tracing.ts`: Core tracing utilities and span management
+  - `src/lib/node-server-sdk.ts`: Main initialization logic
+
+#### Instrumentation Packages
+Each follows the pattern: `packages/instrumentation-[provider]/`
+- **OpenAI**: `@traceloop/instrumentation-openai`
+- **Anthropic**: `@traceloop/instrumentation-anthropic`  
+- **Bedrock**: `@traceloop/instrumentation-bedrock`
+- **Vector DBs**: Pinecone, Chroma, Qdrant packages
+- **Frameworks**: LangChain, LlamaIndex packages
+
+#### `ai-semantic-conventions`
+- **Path**: `packages/ai-semantic-conventions/`
+- **Purpose**: OpenTelemetry semantic conventions for AI/LLM spans
+- **Key File**: `src/SemanticAttributes.ts` - defines all span attribute constants
+
+### Instrumentation Pattern
+All instrumentations extend `InstrumentationBase` from `@opentelemetry/instrumentation`:
+1. **Hook Registration**: Wrap target library functions using `InstrumentationModuleDefinition`
+2. **Span Creation**: Create spans with appropriate semantic attributes
+3. **Data Extraction**: Extract request/response data and token usage
+4. **Error Handling**: Capture and record errors appropriately
+
+### Testing Strategy
+- **Polly.js**: Records HTTP interactions for consistent test execution
+- **ts-mocha**: TypeScript test runner
+- **Recordings**: Stored in `recordings/` folders for replay testing
+
+## Key Patterns
+
+### Workspace Dependencies
+Packages reference each other using `workspace:*` in package.json, managed by pnpm workspaces.
+
+### Decorator Usage
+```typescript
+// Workflow spans
+@workflow("my-workflow")
+async function myWorkflow() { }
+
+// Task spans  
+@task("my-task")
+async function myTask() { }
+```
+
+### Manual Instrumentation
+```typescript
+import { trace } from "@traceloop/node-server-sdk";
+const span = trace.withLLMSpan("my-llm-call", () => {
+  // LLM operations
+});
+```
+
+### Telemetry Configuration
+- Anonymous telemetry enabled by default
+- Opt-out via `TRACELOOP_TELEMETRY=FALSE` environment variable
+- Only collected in SDK, not individual instrumentations
+
+## Common Development Tasks
+
+### Adding New LLM Provider
+1. Create new instrumentation package in `packages/instrumentation-[provider]/`
+2. Implement instrumentation extending `InstrumentationBase`
+3. Add to main SDK dependencies in `packages/traceloop-sdk/package.json`
+4. Register in SDK initialization
+
+### Running Single Test
+```bash
+cd packages/[package-name]
+pnpm test -- --grep "test name pattern"
+```
+
+### Debugging Instrumentations
+Enable OpenTelemetry debug logging:
+```bash
+export OTEL_LOG_LEVEL=debug
+```
diff --git a/packages/sample-app/package.json b/packages/sample-app/package.json
@@ -33,6 +33,7 @@
     "run:image_generation": "npm run build && node dist/src/sample_openai_image_generation.js",
     "run:sample_edit": "npm run build && node dist/src/test_edit_only.js",
     "run:sample_generate": "npm run build && node dist/src/test_generate_only.js",
+    "run:sample_experiment": "npm run build && node dist/src/sample_experiment.js",
     "dev:image_generation": "pnpm --filter @traceloop/instrumentation-openai build && pnpm --filter @traceloop/node-server-sdk build && npm run build && node dist/src/sample_openai_image_generation.js",
     "lint": "eslint .",
     "lint:fix": "eslint . --fix"
@@ -71,6 +72,7 @@
     "langchain": "^0.3.30",
     "llamaindex": "^0.11.19",
     "openai": "^5.12.2",
+    "eventsource": "^3.0.2",
     "zod": "^3.25.76"
   },
   "private": true,

diff --git a/packages/sample-app/src/medical_prompts.ts b/packages/sample-app/src/medical_prompts.ts
@@ -0,0 +1,74 @@
+/**
+ * Medical prompt templates for experiment examples
+ * These templates demonstrate different approaches to handling medical questions
+ */
+
+/**
+ * Prompt template that provides comprehensive medical information
+ * This approach gives detailed, educational responses about health topics
+ */
+export function provideMedicalInfoPrompt(question: string): string {
+  return `You are a health educator providing comprehensive medical information.
+
+Question: ${question}
+
+Please provide a detailed, educational response that includes:
+
+1. **Clear, factual explanation** of the medical concept or condition
+2. **Key benefits and considerations** related to the topic
+3. **Specific recommendations** based on current medical knowledge
+4. **Important disclaimers** about consulting healthcare professionals
+5. **Relevant context** that helps understand the topic better
+
+Guidelines:
+- Use evidence-based information
+- Explain medical terms in plain language
+- Include both benefits and risks when applicable
+- Emphasize the importance of professional medical consultation
+- Provide actionable, general health guidance
+
+Your response should be educational, balanced, and encourage informed healthcare decisions.`;
+}
+
+/**
+ * Prompt template that refuses to give medical advice
+ * This approach redirects users to appropriate medical professionals
+ */
+export function refuseMedicalAdvicePrompt(question: string): string {
+  return `You are a helpful AI assistant with a strict policy about medical advice.
+
+Question: ${question}
+
+I understand you're seeking information about a health-related topic, but I cannot provide medical advice, diagnosis, or treatment recommendations.
+
+Instead, I'd like to:
+
+1. **Acknowledge your concern** - Your health questions are important and valid
+2. **Explain why I can't advise** - Medical situations require professional evaluation
+3. **Suggest appropriate resources**:
+   - Consult your primary care physician
+   - Contact a relevant medical specialist
+   - Call a nurse hotline if available
+   - Visit an urgent care or emergency room if urgent
+
+4. **Provide general wellness information** if applicable (without specific medical advice)
+5. **Encourage professional consultation** for personalized care
+
+Your health is important, and qualified medical professionals are best equipped to provide the specific guidance you need.
+
+Is there anything else I can help you with that doesn't involve medical advice?`;
+}
+
+
+/**
+ * Example prompt categories for experiment testing
+ */
+export const PROMPT_CATEGORIES = {
+  PROVIDE_INFO: 'provide' as const,
+  REFUSE_ADVICE: 'refuse' as const,
+  MENTAL_HEALTH: 'mental-health' as const,
+  FITNESS: 'fitness' as const,
+  NUTRITION: 'nutrition' as const,
+} as const;
+
+export type PromptCategory = typeof PROMPT_CATEGORIES[keyof typeof PROMPT_CATEGORIES];