From 6e4f4a17436d94693d7bb70e5695e66df8446dd3 Mon Sep 17 00:00:00 2001 From: Celina Hanouti Date: Wed, 15 Apr 2026 18:21:57 +0200 Subject: [PATCH 1/2] add DeepInfra docs --- docs/inference-providers/_toctree.yml | 2 + docs/inference-providers/index.md | 1 + .../providers/deepinfra.md | 47 +++++++++++++++++++ .../inference-providers/scripts/generate.ts | 1 + .../templates/providers/deepinfra.handlebars | 16 +++++++ 5 files changed, 67 insertions(+) create mode 100644 docs/inference-providers/providers/deepinfra.md create mode 100644 scripts/inference-providers/templates/providers/deepinfra.handlebars diff --git a/docs/inference-providers/_toctree.yml b/docs/inference-providers/_toctree.yml index ce55cb644f..b1919f13fa 100644 --- a/docs/inference-providers/_toctree.yml +++ b/docs/inference-providers/_toctree.yml @@ -106,6 +106,8 @@ title: Cerebras - local: providers/cohere title: Cohere + - local: providers/deepinfra + title: DeepInfra - local: providers/fal-ai title: Fal AI - local: providers/featherless-ai diff --git a/docs/inference-providers/index.md b/docs/inference-providers/index.md index 6f12bf65c2..72ebe4dd11 100644 --- a/docs/inference-providers/index.md +++ b/docs/inference-providers/index.md @@ -15,6 +15,7 @@ Our platform integrates with leading AI infrastructure providers, giving you acc | -------------------------------------------- | :-------------------: | :-------------------: | :----------------: | :-----------: | :-----------: | :------------: | | [Cerebras](./providers/cerebras) | ✅ | | | | | | | [Cohere](./providers/cohere) | ✅ | ✅ | | | | | +| [DeepInfra](./providers/deepinfra) | ✅ | ✅ | | | | | | [Fal AI](./providers/fal-ai) | | | | ✅ | ✅ | ✅ | | [Featherless AI](./providers/featherless-ai) | ✅ | ✅ | | | | | | [Fireworks](./providers/fireworks-ai) | ✅ | ✅ | | | | | diff --git a/docs/inference-providers/providers/deepinfra.md b/docs/inference-providers/providers/deepinfra.md new file mode 100644 index 0000000000..e8085ada49 --- /dev/null +++ 
b/docs/inference-providers/providers/deepinfra.md @@ -0,0 +1,47 @@ + + +# DeepInfra + +> [!TIP] +> All supported DeepInfra models can be found [here](https://huggingface.co/models?inference_provider=deepinfra&sort=trending) + +
+ + + + +
+ +
+ + + + +
+ +DeepInfra is a serverless AI inference platform that enables developers to run machine learning models through a simple API, without managing infrastructure. The platform handles GPUs, scaling, and monitoring, offering cost-efficient pay-per-token pricing with OpenAI-compatible endpoints. + +## Resources +- **Website**: https://deepinfra.com/ +- **Documentation**: https://deepinfra.com/docs + +## Supported tasks + + diff --git a/scripts/inference-providers/scripts/generate.ts b/scripts/inference-providers/scripts/generate.ts index 21607f41f4..9078a6f4ae 100644 --- a/scripts/inference-providers/scripts/generate.ts +++ b/scripts/inference-providers/scripts/generate.ts @@ -37,6 +37,7 @@ const HEADERS: Record = process.env.HF_TOKEN const PROVIDERS_URLS: Record = { cerebras: "https://www.cerebras.ai/", cohere: "https://cohere.com/", + deepinfra: "https://deepinfra.com/", "fal-ai": "https://fal.ai/", "featherless-ai": "https://featherless.ai/", "fireworks-ai": "https://fireworks.ai/", diff --git a/scripts/inference-providers/templates/providers/deepinfra.handlebars b/scripts/inference-providers/templates/providers/deepinfra.handlebars new file mode 100644 index 0000000000..cc5d142a41 --- /dev/null +++ b/scripts/inference-providers/templates/providers/deepinfra.handlebars @@ -0,0 +1,16 @@ +# DeepInfra + +> [!TIP] +> All supported DeepInfra models can be found [here](https://huggingface.co/models?inference_provider=deepinfra&sort=trending) + +{{{logoSection}}} + +{{{followUsSection}}} + +DeepInfra is a serverless AI inference platform that enables developers to run machine learning models through a simple API, without managing infrastructure. The platform handles GPUs, scaling, and monitoring, offering cost-efficient pay-per-token pricing with OpenAI-compatible endpoints. 
+ +## Resources +- **Website**: https://deepinfra.com/ +- **Documentation**: https://deepinfra.com/docs + +{{{tasksSection}}} From 8f28dd5d597c9cdb3ac9e50189bed97f8c153198 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?c=C3=A9lina?= Date: Thu, 16 Apr 2026 10:48:52 +0200 Subject: [PATCH 2/2] Apply suggestions from code review MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Co-authored-by: célina --- .../templates/providers/deepinfra.handlebars | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/scripts/inference-providers/templates/providers/deepinfra.handlebars b/scripts/inference-providers/templates/providers/deepinfra.handlebars index cc5d142a41..d9af401b23 100644 --- a/scripts/inference-providers/templates/providers/deepinfra.handlebars +++ b/scripts/inference-providers/templates/providers/deepinfra.handlebars @@ -7,10 +7,10 @@ {{{followUsSection}}} -DeepInfra is a serverless AI inference platform that enables developers to run machine learning models through a simple API, without managing infrastructure. The platform handles GPUs, scaling, and monitoring, offering cost-efficient pay-per-token pricing with OpenAI-compatible endpoints. +DeepInfra is a serverless AI inference platform offering some of the most cost-effective per-token pricing in the industry. With a catalog of over 100 models spanning LLMs, text-to-image, text-to-speech, speech-to-text, video generation, OCR, and more, DeepInfra makes it easy for developers to integrate a wide range of AI capabilities into their applications with minimal setup. ## Resources - **Website**: https://deepinfra.com/ -- **Documentation**: https://deepinfra.com/docs +- **Documentation**: https://docs.deepinfra.com {{{tasksSection}}}