Commit 6886416

feat: new multi service router
1 parent 76f1e53 commit 6886416

255 files changed (+5232, -3764 lines)

.cspell.json (+2, -3)
@@ -9,8 +9,7 @@
   "dictionaries": ["project-words"],
   "ignorePaths": [
     "node_modules",
-    "./src/docs/public/apidocs",
-    "./src/ax/dsp/stopwords.ts",
-    "./src/examples/qna-tune.ts"
+    "./src/docs/src/content/docs/03-apidocs",
+    "./src/ax/dsp/stopwords.ts"
   ]
 }

.cspell/project-words.txt (+1)
@@ -45,6 +45,7 @@ Macbook
 minilm
 Mixtral
 modelinfo
+multiservice
 nanos
 nemo
 Nemo

README.md (+113, -42)
@@ -26,9 +26,9 @@ Use Ax and get an end-to-end streaming, multi-modal DSPy framework with agents a

 <img width="860" alt="shapes at 24-03-31 00 05 55" src="https://github.com/dosco/llm-client/assets/832235/0f0306ea-1812-4a0a-9ed5-76cd908cd26b">

-Efficient type-safe prompts are auto-generated from a simple signature. A prompt signature is made up of a `"task description" inputField:type "field description" -> "outputField:type`. The idea behind prompt signatures is based on work done in the "Demonstrate-Search-Predict" paper.
+Efficient type-safe prompts are auto-generated from a simple signature. A prompt signature is made up of a `"task description" inputField:type "field description" -> "outputField:type`. The idea behind prompt signatures is based on work done in the "Demonstrate-Search-Predict" paper.

-You can have multiple input and output fields, and each field can be of the types `string`, `number`, `boolean`, `date`, `datetime`, `class "class1, class2"`, `JSON`, or an array of any of these, e.g., `string[]`. When a type is not defined, it defaults to `string`. The underlying AI is encouraged to generate the correct JSON when the `JSON` type is used.
+You can have multiple input and output fields, and each field can be of the types `string`, `number`, `boolean`, `date`, `datetime`, `class "class1, class2"`, `JSON`, or an array of any of these, e.g., `string[]`. When a type is not defined, it defaults to `string`. The suffix `?` makes the field optional (required by default) and `!` makes the field internal which is good for things like reasoning.
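
For instance, a signature combining these field types with the new `?` and `!` suffixes might look like the sketch below (field names are illustrative; it assumes the suffixes are written directly on the output field names, as described above):

```typescript
import { AxAI, AxGen } from '@ax-llm/ax'

// Sketch only: `reasoning!` is an internal field, `followUp?` is optional.
const gen = new AxGen(
  `"answer customer questions" question:string -> reasoning!:string, answer:string, followUp?:string`
)

const ai = new AxAI({ name: 'openai', apiKey: process.env.OPENAI_APIKEY as string })
const res = await gen.forward(ai, { question: 'How do I return a product?' })
console.log(res.answer)
```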

 ## Output Field Types

@@ -46,6 +46,7 @@ You can have multiple input and output fields, and each field can be of the type
 | `date[]` | An array of dates. | `holidayDates:date[]` | `["2023-10-01", "2023-10-02"]` |
 | `datetime[]` | An array of date and time values. | `logTimestamps:datetime[]` | `["2023-10-01T12:00:00Z", "2023-10-02T12:00:00Z"]` |
 | `class[] "class1,class2"` | Multiple classes | `categories:class[]` | `["class1", "class2", "class3"]` |
+| `code "language"` | A code block in a specific language | `code:code "python"` | `print('Hello, world!')` |
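
The new `code` output type can be sketched like this (assuming the `fieldName:code "language"` form shown in the table row above; names are illustrative):

```typescript
import { AxAI, AxGen } from '@ax-llm/ax'

// Sketch only: ask for Python source in a `code "python"` output field.
const gen = new AxGen(`"solve the task with a short program" task:string -> solution:code "python"`)

const ai = new AxAI({ name: 'openai', apiKey: process.env.OPENAI_APIKEY as string })
const res = await gen.forward(ai, { task: 'Print hello world' })
console.log(res.solution) // e.g. print('Hello, world!')
```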
@@ -167,7 +168,7 @@ Launch Apache Tika
 docker run -p 9998:9998 apache/tika
 ```

-Convert documents to text and embed them for retrieval using the `AxDBManager`, which also supports a reranker and query rewriter. Two default implementations, `AxDefaultResultReranker` and `AxDefaultQueryRewriter`, are available.
+Convert documents to text and embed them for retrieval using the `AxDBManager`, which also supports a reranker and query rewriter. Two default implementations, `AxDefaultResultReranker` and `AxDefaultQueryRewriter`, are available.

 ```typescript
 const tika = new AxApacheTika();
@@ -182,7 +183,7 @@ console.log(matches);

 ## Multi-modal DSPy

-When using models like `GPT-4o` and `Gemini` that support multi-modal prompts, we support using image fields, and this works with the whole DSP pipeline.
+When using models like `GPT-4o` and `Gemini` that support multi-modal prompts, we support using image fields, and this works with the whole DSP pipeline.

 ```typescript
 const image = fs
@@ -197,7 +198,7 @@ const res = await gen.forward(ai, {
 });
 ```

-When using models like `gpt-4o-audio-preview` that support multi-modal prompts with audio support, we support using audio fields, and this works with the whole DSP pipeline.
+When using models like `gpt-4o-audio-preview` that support multi-modal prompts with audio support, we support using audio fields, and this works with the whole DSP pipeline.

 ```typescript
 const audio = fs
@@ -289,49 +290,119 @@ const processor = new AxFieldProcessor(gen, 'next10Numbers', processorFunction,
 const res = await gen.forward({ startNumber: 1 });
 ```

+## AI Routing and Load Balancing

-<!-- ## Fast LLM Router
+Ax provides two powerful ways to work with multiple AI services: a load balancer for high availability and a router for model-specific routing.

-A special router that uses no LLM calls, only embeddings, to route user requests smartly.
+### Load Balancer

-Use the Router to efficiently route user queries to specific routes designed to handle certain questions or tasks. Each route is tailored to a particular domain or service area. Instead of using a slow or expensive LLM to decide how user input should be handled, use our fast "Semantic Router," which uses inexpensive and fast embedding queries.
+The load balancer automatically distributes requests across multiple AI services based on performance and availability. If one service fails, it automatically fails over to the next available service.

 ```typescript
-# npm run tsx ./src/examples/routing.ts
-
-const customerSupport = new AxRoute('customerSupport', [
-  'how can I return a product?',
-  'where is my order?',
-  'can you help me with a refund?',
-  'I need to update my shipping address',
-  'my product arrived damaged, what should I do?'
-]);
+import { AxAI, AxBalancer } from '@ax-llm/ax'

-const technicalSupport = new AxRoute('technicalSupport', [
-  'how do I install your software?',
-  'I’m having trouble logging in',
-  'can you help me configure my settings?',
-  'my application keeps crashing',
-  'how do I update to the latest version?'
-]);
+// Setup multiple AI services
+const openai = new AxAI({
+  name: 'openai',
+  apiKey: process.env.OPENAI_APIKEY,
+})

-const ai = new AxAI({ name: 'openai', apiKey: process.env.OPENAI_APIKEY as string });
+const ollama = new AxAI({
+  name: 'ollama',
+  config: { model: "nous-hermes2" }
+})

-const router = new AxRouter(ai);
-await router.setRoutes(
-  [customerSupport, technicalSupport],
-  { filename: 'router.json' }
-);
+const gemini = new AxAI({
+  name: 'google-gemini',
+  apiKey: process.env.GOOGLE_APIKEY
+})

-const tag = await router.forward('I need help with my order');
+// Create a load balancer with all services
+const balancer = new AxBalancer([openai, ollama, gemini])

-if (tag === "customerSupport") {
-  ...
-}
-if (tag === "technicalSupport") {
-  ...
+// Use like a regular AI service - automatically uses the best available service
+const response = await balancer.chat({
+  chatPrompt: [{ role: 'user', content: 'Hello!' }],
+})
+
+// Or use the balancer with AxGen
+const gen = new AxGen(`question -> answer`)
+const res = await gen.forward(balancer, { question: 'Hello!' })
+```
+
+### Multi-Service Router
+
+The router lets you use multiple AI services through a single interface, automatically routing requests to the right service based on the model specified.
+
+```typescript
+import { AxAI, AxMultiServiceRouter, AxAIOpenAIModel } from '@ax-llm/ax'
+
+// Setup OpenAI with model list
+const openai = new AxAI({
+  name: 'openai',
+  apiKey: process.env.OPENAI_APIKEY,
+  models: [
+    {
+      key: 'basic',
+      model: AxAIOpenAIModel.GPT4OMini,
+      description: 'Fast model for simple tasks',
+    },
+    {
+      key: 'expert',
+      model: AxAIOpenAIModel.GPT4O,
+      description: 'Expert model for specialized tasks',
+    }
+  ]
+})
+
+// Setup Gemini with model list
+const gemini = new AxAI({
+  name: 'google-gemini',
+  apiKey: process.env.GOOGLE_APIKEY,
+  models: [
+    {
+      key: 'basic',
+      model: 'gemini-2.0-flash',
+      description: 'Basic Gemini model for simple tasks',
+    },
+    {
+      key: 'expert',
+      model: 'gemini-2.0-pro',
+      description: 'Expert Gemini model for complex tasks',
+    }
+  ]
+})
+
+const ollama = new AxAI({
+  name: 'ollama',
+  config: { model: "nous-hermes2" }
+})
+
+const secretService = {
+  key: 'sensitive-secret',
+  service: ollama,
+  description: 'Ollama model for sensitive secrets tasks'
 }
-``` -->
+
+// Create a router with all services
+const router = new AxMultiServiceRouter([openai, gemini, secretService])
+
+// Route to OpenAI's expert model
+const openaiResponse = await router.chat({
+  chatPrompt: [{ role: 'user', content: 'Hello!' }],
+  model: 'expert'
+})
+
+// Or use the router with AxGen
+const gen = new AxGen(`question -> answer`)
+const res = await gen.forward(router, { question: 'Hello!' })
+```
+
+The load balancer is ideal for high availability, while the router is perfect when you need specific models for specific tasks. Both can be used with any of Ax's features like streaming, function calling, and chain-of-thought prompting.
+
+**They can also be used together**
+
+You can also use the balancer and the router together: either multiple balancers can be used with the router, or the router can be used with the balancer.
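
A minimal sketch of that combination, assuming `AxBalancer` and `AxMultiServiceRouter` both expose the common AI service interface and can therefore wrap one another (keys and descriptions below are illustrative):

```typescript
import { AxAI, AxBalancer, AxMultiServiceRouter } from '@ax-llm/ax'

// Balance two cloud services for availability
const openai = new AxAI({ name: 'openai', apiKey: process.env.OPENAI_APIKEY as string })
const gemini = new AxAI({ name: 'google-gemini', apiKey: process.env.GOOGLE_APIKEY as string })
const balancer = new AxBalancer([openai, gemini])

// Keep sensitive work on a local model, send everything else to the balanced pair
const ollama = new AxAI({ name: 'ollama', config: { model: 'nous-hermes2' } })
const router = new AxMultiServiceRouter([
  { key: 'sensitive-secret', service: ollama, description: 'Local model for sensitive tasks' },
  { key: 'general', service: balancer, description: 'Balanced cloud services for general tasks' },
])

const res = await router.chat({
  chatPrompt: [{ role: 'user', content: 'Hello!' }],
  model: 'general',
})
```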

 ## Vercel AI SDK Integration

@@ -397,7 +468,7 @@ const result = await streamUI({

 ## OpenTelemetry support

-The ability to trace and observe your llm workflow is critical to building production workflows. OpenTelemetry is an industry-standard, and we support the new `gen_ai` attribute namespace.
+The ability to trace and observe your llm workflow is critical to building production workflows. OpenTelemetry is an industry-standard, and we support the new `gen_ai` attribute namespace.

 ```typescript
 import { trace } from '@opentelemetry/api';
@@ -531,7 +602,7 @@ console.log(res);

 ## Check out all the examples

-Use the `tsx` command to run the examples. It makes the node run typescript code. It also supports using an `.env` file to pass the AI API Keys instead of putting them in the command line.
+Use the `tsx` command to run the examples. It makes the node run typescript code. It also supports using an `.env` file to pass the AI API Keys instead of putting them in the command line.

 ```shell
 OPENAI_APIKEY=openai_key npm run tsx ./src/examples/marketing.ts
@@ -640,7 +711,7 @@ const cot = new AxGen(ai, `question:string -> answer:string`, { functions });
 ## Enable debug logs

 ```ts
-const ai = new AxOpenAI({ apiKey: process.env.OPENAI_APIKEY } as AxOpenAIArgs);
+const ai = new AxAI({ name: "openai", apiKey: process.env.OPENAI_APIKEY } as AxOpenAIArgs);
 ai.setOptions({ debug: true });
 ```

@@ -681,6 +752,6 @@ conf.model = OpenAIModel.GPT4Turbo;

 ## Monorepo tips & tricks

-It is essential to remember that we should only run `npm install` from the root directory. This prevents the creation of nested `package-lock.json` files and avoids non-deduplicated `node_modules`.
+It is essential to remember that we should only run `npm install` from the root directory. This prevents the creation of nested `package-lock.json` files and avoids non-deduplicated `node_modules`.

-Adding new dependencies in packages should be done with e.g. `npm install lodash --workspace=ax` (or just modify the appropriate `package.json` and run `npm install` from root).
+Adding new dependencies in packages should be done with e.g. `npm install lodash --workspace=ax` (or just modify the appropriate `package.json` and run `npm install` from root).

customFrontmatter.mjs (+11, -7)
@@ -34,19 +34,23 @@ function replaceAndFormat(input) {
   return input.replace(
     /(\[`?[^`\]]+`?\]\()([^)]+)(\))/g,
     (match, linkText, path, closing) => {
+
+      if (path.startsWith('https://')) {
+        return path;
+      }
+
       // Remove file extension
       let transformedPath = path.replace(/\.md$/, '');
-
+
       // Remove special characters like dots and convert to lowercase
       transformedPath = transformedPath
        .toLowerCase()
        .replace(/[^a-z0-9-]/g, '');
-
-      // Add hashtag prefix if it doesn't exist
-      if (!transformedPath.startsWith('#')) {
-        transformedPath = '#apidocs/' + transformedPath;
-      }
-
+
+      transformedPath = '/api/#03-apidocs/' + transformedPath;
+
+      console.log(transformedPath)
+
       return `${linkText}${transformedPath}${closing}`;
     }
   );
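
Given the new logic above, the rewritten links look roughly like this (the input string is illustrative; `replaceAndFormat` is the function shown in this hunk):

```typescript
// Illustrative input: one local API-doc link and one absolute link.
const input = 'See [`AxBalancer`](AxBalancer.md) and [docs](https://example.com/page)'

// Local links are lowercased, stripped of `.md`, and prefixed, e.g.
//   [`AxBalancer`](/api/#03-apidocs/axbalancer)
// while an https:// link now hits the new early-return branch, which replaces
// the whole matched link with just the raw path string.
const output = replaceAndFormat(input)
console.log(output)
```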

src/ai-sdk-provider/provider.ts (+1, -1)
@@ -135,7 +135,7 @@ export class AxAIProvider implements LanguageModelV1 {
   constructor(ai: AxAIService, config?: Readonly<AxConfig>) {
     this.ai = ai
     this.config = config
-    this.modelId = this.ai.getModelInfo().name
+    this.modelId = this.ai.getName()
   }

   get provider(): string {

src/ax/ai/anthropic/api.ts (+2, -2)
@@ -2,7 +2,7 @@ import type { AxAPI } from '../../util/apicall.js'
 import { AxBaseAI, axBaseAIDefaultConfig } from '../base.js'
 import { GoogleVertexAuth } from '../google-vertex/auth.js'
 import type {
-  AxAIModelList,
+  AxAIInputModelList,
   AxAIServiceImpl,
   AxAIServiceOptions,
   AxChatRequest,
@@ -41,7 +41,7 @@ export interface AxAIAnthropicArgs {
   region?: string
   config?: Readonly<Partial<AxAIAnthropicConfig>>
   options?: Readonly<AxAIServiceOptions>
-  models?: AxAIModelList<AxAIAnthropicModel | AxAIAnthropicVertexModel>
+  models?: AxAIInputModelList<AxAIAnthropicModel | AxAIAnthropicVertexModel>
 }

 class AxAIAnthropicImpl
