Commit 09ba5aa

Add OVHcloud AI Endpoints provider (#2238)
Co-authored-by: Marcus Schiesser <mail@marcusschiesser.de>
1 parent 5583d92 commit 09ba5aa

15 files changed: +776 -0 lines

.changeset/famous-ducks-bathe.md

Lines changed: 6 additions & 0 deletions

---
"@llamaindex/ovhcloud": major
"@llamaindex/examples": minor
---

Add OVHcloud AI Endpoints provider
Lines changed: 123 additions & 0 deletions

---
title: OVHcloud AI Endpoints
---

OVHcloud AI Endpoints provide OpenAI-compatible embedding models. The service can be used for free with rate limits, or with an API key for higher limits.

OVHcloud is a global player and the leading European cloud provider, operating over 450,000 servers in 40 data centers across 4 continents and serving 1.6 million customers in over 140 countries. Our AI Endpoints product offers access to various models with sovereignty, data privacy, and GDPR compliance.

You can find the full list of models in the [OVHcloud AI Endpoints catalog](https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog/).
## Installation

```package-install
npm i llamaindex @llamaindex/ovhcloud
```

## Authentication

OVHcloud AI Endpoints can be used in two ways:

1. **Free tier (with rate limits)**: No API key required. You can omit the `apiKey` parameter or set it to an empty string.
2. **With API key**: For higher rate limits, generate an API key from the [OVHcloud Manager](https://ovh.com/manager) → Public Cloud → AI & Machine Learning → AI Endpoints → API keys.
## Basic Usage

```ts
import { config } from "dotenv";
import { Document, Settings, VectorStoreIndex } from "llamaindex";
import { OVHcloudEmbedding } from "@llamaindex/ovhcloud";

// Update the embed model (using the free tier)
Settings.embedModel = new OVHcloudEmbedding();

// Or with an API key from the environment (e.g. loaded from a .env file)
config();
Settings.embedModel = new OVHcloudEmbedding({
  apiKey: process.env.OVHCLOUD_API_KEY || "",
});

// `essay` is the text of the document you want to index
const document = new Document({ text: essay, id_: "essay" });

const index = await VectorStoreIndex.fromDocuments([document]);

const queryEngine = index.asQueryEngine();

const query = "What is the meaning of life?";

const results = await queryEngine.query({
  query,
});
```
By default, `OVHcloudEmbedding` uses the `BGE-M3` model. You can change the model by passing the `model` parameter to the constructor:

```ts
import { Settings } from "llamaindex";
import { OVHcloudEmbedding } from "@llamaindex/ovhcloud";

const model = "text-embedding-3-small";
Settings.embedModel = new OVHcloudEmbedding({
  model,
});
```

You can also set the `maxRetries` and `timeout` parameters when initializing `OVHcloudEmbedding` for finer control over request behavior:

```ts
import { Settings } from "llamaindex";
import { OVHcloudEmbedding } from "@llamaindex/ovhcloud";

const model = "text-embedding-3-small";
const maxRetries = 5;
const timeout = 5000; // 5 seconds

Settings.embedModel = new OVHcloudEmbedding({
  model,
  maxRetries,
  timeout,
});
```
## Standalone Usage

```ts
import { OVHcloudEmbedding } from "@llamaindex/ovhcloud";
import { config } from "dotenv";

// For standalone usage, you can optionally configure OVHCLOUD_API_KEY in a .env file
config();

const main = async () => {
  const model = "BGE-M3";
  // Using without an API key (free tier)
  const embeddings = new OVHcloudEmbedding({ model });
  const text = "What is the meaning of life?";
  const response = await embeddings.getTextEmbedding(text);
  console.log(response);
};

main();
```
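Embeddings returned by `getTextEmbedding` are plain `number[]` arrays, so you can do similarity math on them directly, for example to compare two texts embedded as above. A minimal sketch (the `cosineSimilarity` helper is our own, not a package export):

```typescript
// Cosine similarity between two equal-length embedding vectors,
// e.g. the results of two getTextEmbedding(...) calls
function cosineSimilarity(a: number[], b: number[]): number {
  let dot = 0;
  let normA = 0;
  let normB = 0;
  for (let i = 0; i < a.length; i++) {
    dot += a[i] * b[i];
    normA += a[i] * a[i];
    normB += b[i] * b[i];
  }
  return dot / (Math.sqrt(normA) * Math.sqrt(normB));
}

// Identical vectors score 1, orthogonal vectors score 0
console.log(cosineSimilarity([1, 0], [1, 0])); // 1
console.log(cosineSimilarity([1, 0], [0, 1])); // 0
```

Higher scores mean the embedded texts are semantically closer, which is the same measure a vector store uses during retrieval.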
## Base URL

The default base URL is `https://oai.endpoints.kepler.ai.cloud.ovh.net/v1`. You can override it if needed:

```ts
import { OVHcloudEmbedding } from "@llamaindex/ovhcloud";

const embedding = new OVHcloudEmbedding({
  model: "BGE-M3",
  additionalSessionOptions: {
    baseURL: "https://custom.endpoint.com/v1",
  },
});
```

## Resources

- [OVHcloud AI Endpoints Catalog](https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog/)
- [OVHcloud Manager](https://ovh.com/manager)
- [OVHcloud AI Endpoints Documentation](https://www.ovhcloud.com/en/public-cloud/ai-endpoints/)

## API Reference

- [OVHcloudEmbedding](/typescript/framework-api-reference/classes/ovhcloudembedding/)
Lines changed: 164 additions & 0 deletions

---
title: OVHcloud AI Endpoints
---

OVHcloud AI Endpoints provide serverless access to a variety of pre-trained AI models. The service is OpenAI-compatible and can be used for free with rate limits, or with an API key for higher limits.

OVHcloud is a global player and the leading European cloud provider, operating over 450,000 servers in 40 data centers across 4 continents and serving 1.6 million customers in over 140 countries. Our AI Endpoints product offers access to various models with sovereignty, data privacy, and GDPR compliance.

You can find the full list of models in the [OVHcloud AI Endpoints catalog](https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog/).
## Installation

```package-install
npm i llamaindex @llamaindex/ovhcloud
```

## Authentication

OVHcloud AI Endpoints can be used in two ways:

1. **Free tier (with rate limits)**: No API key required. You can omit the `apiKey` parameter or set it to an empty string.
2. **With API key**: For higher rate limits, generate an API key from the [OVHcloud Manager](https://ovh.com/manager) → Public Cloud → AI & Machine Learning → AI Endpoints → API keys.
## Basic Usage

```ts
import { config } from "dotenv";
import { Settings } from "llamaindex";
import { OVHcloudLLM } from "@llamaindex/ovhcloud";

// Using without an API key (free tier with rate limits)
Settings.llm = new OVHcloudLLM({
  model: "gpt-oss-120b",
});

// Or with an API key from the environment (e.g. loaded from a .env file)
config();
Settings.llm = new OVHcloudLLM({
  model: "gpt-oss-120b",
  apiKey: process.env.OVHCLOUD_API_KEY || "",
});

// Or with an explicit API key
Settings.llm = new OVHcloudLLM({
  model: "gpt-oss-120b",
  apiKey: "YOUR_API_KEY",
});
```

You can set the API key via an environment variable:

```bash
export OVHCLOUD_API_KEY="<YOUR_API_KEY>"
```
## Load and index documents

For this example, we will use a single document. In a real-world scenario, you would have multiple documents to index.

```ts
import { Document, VectorStoreIndex } from "llamaindex";

// `essay` is the text of the document you want to index
const document = new Document({ text: essay, id_: "essay" });

const index = await VectorStoreIndex.fromDocuments([document]);
```

## Query

```ts
const queryEngine = index.asQueryEngine();

const query = "What is the meaning of life?";

const results = await queryEngine.query({
  query,
});
```
## Full Example

```ts
import { OVHcloudLLM } from "@llamaindex/ovhcloud";
import { Document, Settings, VectorStoreIndex } from "llamaindex";

// Use a custom LLM
const model = "gpt-oss-120b";
Settings.llm = new OVHcloudLLM({ model, temperature: 0 });

async function main() {
  // `essay` is the text of the document you want to index
  const document = new Document({ text: essay, id_: "essay" });

  // Load and index documents
  const index = await VectorStoreIndex.fromDocuments([document]);

  // Get a retriever
  const retriever = index.asRetriever();

  // Create a query engine
  const queryEngine = index.asQueryEngine({
    retriever,
  });

  const query = "What is the meaning of life?";

  // Query
  const response = await queryEngine.query({
    query,
  });

  // Log the response
  console.log(response.response);
}

main().catch(console.error);
```
## Streaming

OVHcloud AI Endpoints supports streaming responses:

```ts
import { OVHcloudLLM } from "@llamaindex/ovhcloud";

const llm = new OVHcloudLLM({
  model: "gpt-oss-120b",
});

const generator = await llm.chat({
  messages: [
    {
      role: "user",
      content: "Tell me about OVHcloud AI Endpoints",
    },
  ],
  stream: true,
});

for await (const message of generator) {
  process.stdout.write(message.delta);
}
```
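If you also need the full response text after streaming it, the deltas can be accumulated while they are printed. A small sketch (`collectDeltas` is our own helper name, not a package export); it works with any async iterable of `{ delta: string }` chunks, such as the generator above. Here a synthetic stream stands in for the network call:

```typescript
// Accumulate streamed chunks into one string, optionally echoing each delta
async function collectDeltas(
  stream: AsyncIterable<{ delta: string }>,
  onDelta?: (delta: string) => void,
): Promise<string> {
  let text = "";
  for await (const chunk of stream) {
    onDelta?.(chunk.delta);
    text += chunk.delta;
  }
  return text;
}

// Synthetic stream to demonstrate the helper without a network call
async function* fakeStream() {
  yield { delta: "Hello, " };
  yield { delta: "world!" };
}

const full = await collectDeltas(fakeStream(), (d) => process.stdout.write(d));
console.log("\nfull response:", full); // full response: Hello, world!
```

With the real `llm.chat({ ..., stream: true })` generator in place of `fakeStream()`, `full` would hold the complete answer once streaming finishes.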
## Base URL

The default base URL is `https://oai.endpoints.kepler.ai.cloud.ovh.net/v1`. You can override it if needed:

```ts
import { OVHcloudLLM } from "@llamaindex/ovhcloud";

const llm = new OVHcloudLLM({
  model: "gpt-oss-120b",
  additionalSessionOptions: {
    baseURL: "https://custom.endpoint.com/v1",
  },
});
```

## Resources

- [OVHcloud AI Endpoints Catalog](https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog/)
- [OVHcloud Manager](https://ovh.com/manager)
- [OVHcloud AI Endpoints Documentation](https://www.ovhcloud.com/en/public-cloud/ai-endpoints/)

## API Reference

- [OVHcloudLLM](/typescript/framework-api-reference/classes/ovhcloudllm/)

examples/models/ovhcloud.ts

Lines changed: 50 additions & 0 deletions

```ts
import { OVHcloudEmbedding, OVHcloudLLM } from "@llamaindex/ovhcloud";

// OVHcloud AI Endpoints can be used for free with rate limits, without an API key.
// To use an API key, set the OVHCLOUD_API_KEY environment variable
// or pass it directly in the constructor.
// To generate an API key, go to https://ovh.com/manager > Public Cloud > AI & Machine Learning > AI Endpoints > API keys
// Visit our catalog for the list of all available models: https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog/

// Example 1: Using without an API key (free tier with rate limits)
const ovhcloudFree = new OVHcloudLLM({
  model: "gpt-oss-120b",
  // apiKey is optional - can be omitted or set to an empty string for the free tier
});

// Example 2: Using with an API key
const ovhcloud = new OVHcloudLLM({
  model: "gpt-oss-120b",
  apiKey: process.env.OVHCLOUD_API_KEY || "",
});

(async () => {
  console.log("Chatting with OVHcloud AI Endpoints...");
  const generator = await ovhcloud.chat({
    messages: [
      {
        role: "system",
        content: "You are a helpful AI assistant.",
      },
      {
        role: "user",
        content: "Tell me about OVHcloud AI Endpoints",
      },
    ],
    stream: true,
  });

  for await (const message of generator) {
    process.stdout.write(message.delta);
  }
  console.log("\n");

  // Example with embeddings
  console.log("Getting embeddings...");
  const embedding = new OVHcloudEmbedding({
    model: "BGE-M3",
  });
  const vector = await embedding.getTextEmbedding("Hello world!");
  console.log("Vector dimensions:", vector.length);
  console.log("First 5 values:", vector.slice(0, 5));
})();
```

examples/package.json

Lines changed: 1 addition & 0 deletions

@@ -40,6 +40,7 @@
     "@llamaindex/notion": "^0.1.21",
     "@llamaindex/ollama": "^0.1.23",
     "@llamaindex/openai": "^0.4.21",
+    "@llamaindex/ovhcloud": "^0.0.1",
     "@llamaindex/perplexity": "^0.0.34",
     "@llamaindex/pinecone": "^0.1.22",
     "@llamaindex/portkey-ai": "^0.0.64",
Lines changed: 7 additions & 0 deletions

# @llamaindex/ovhcloud

## 0.0.1

### Patch Changes

- Initial release of OVHcloud AI Endpoints provider

0 commit comments