diff --git a/docs/inference-providers/_toctree.yml b/docs/inference-providers/_toctree.yml index ce55cb644f..b1919f13fa 100644 --- a/docs/inference-providers/_toctree.yml +++ b/docs/inference-providers/_toctree.yml @@ -106,6 +106,8 @@ title: Cerebras - local: providers/cohere title: Cohere + - local: providers/deepinfra + title: DeepInfra - local: providers/fal-ai title: Fal AI - local: providers/featherless-ai diff --git a/docs/inference-providers/index.md b/docs/inference-providers/index.md index 6f12bf65c2..72ebe4dd11 100644 --- a/docs/inference-providers/index.md +++ b/docs/inference-providers/index.md @@ -15,6 +15,7 @@ Our platform integrates with leading AI infrastructure providers, giving you acc | -------------------------------------------- | :-------------------: | :-------------------: | :----------------: | :-----------: | :-----------: | :------------: | | [Cerebras](./providers/cerebras) | ✅ | | | | | | | [Cohere](./providers/cohere) | ✅ | ✅ | | | | | +| [DeepInfra](./providers/deepinfra) | ✅ | ✅ | | | | | | [Fal AI](./providers/fal-ai) | | | | ✅ | ✅ | ✅ | | [Featherless AI](./providers/featherless-ai) | ✅ | ✅ | | | | | | [Fireworks](./providers/fireworks-ai) | ✅ | ✅ | | | | | diff --git a/docs/inference-providers/providers/deepinfra.md b/docs/inference-providers/providers/deepinfra.md new file mode 100644 index 0000000000..e8085ada49 --- /dev/null +++ b/docs/inference-providers/providers/deepinfra.md @@ -0,0 +1,47 @@ + + +# DeepInfra + +> [!TIP] +> All supported DeepInfra models can be found [here](https://huggingface.co/models?inference_provider=deepinfra&sort=trending) + +
+ + + + +
+ +
+ + + + +
+ +DeepInfra is a serverless AI inference platform that enables developers to run machine learning models through a simple API, without managing infrastructure. The platform handles GPUs, scaling, and monitoring, offering cost-efficient pay-per-token pricing with OpenAI-compatible endpoints. + +## Resources +- **Website**: https://deepinfra.com/ +- **Documentation**: https://deepinfra.com/docs + +## Supported tasks + + diff --git a/scripts/inference-providers/scripts/generate.ts b/scripts/inference-providers/scripts/generate.ts index 21607f41f4..9078a6f4ae 100644 --- a/scripts/inference-providers/scripts/generate.ts +++ b/scripts/inference-providers/scripts/generate.ts @@ -37,6 +37,7 @@ const HEADERS: Record = process.env.HF_TOKEN const PROVIDERS_URLS: Record = { cerebras: "https://www.cerebras.ai/", cohere: "https://cohere.com/", + deepinfra: "https://deepinfra.com/", "fal-ai": "https://fal.ai/", "featherless-ai": "https://featherless.ai/", "fireworks-ai": "https://fireworks.ai/", diff --git a/scripts/inference-providers/templates/providers/deepinfra.handlebars b/scripts/inference-providers/templates/providers/deepinfra.handlebars new file mode 100644 index 0000000000..d9af401b23 --- /dev/null +++ b/scripts/inference-providers/templates/providers/deepinfra.handlebars @@ -0,0 +1,16 @@ +# DeepInfra + +> [!TIP] +> All supported DeepInfra models can be found [here](https://huggingface.co/models?inference_provider=deepinfra&sort=trending) + +{{{logoSection}}} + +{{{followUsSection}}} + +DeepInfra is a serverless AI inference platform offering some of the most cost-effective per-token pricing in the industry. With a catalog of over 100 models spanning LLMs, text-to-image, text-to-speech, speech-to-text, video generation, OCR, and more, DeepInfra makes it easy for developers to integrate a wide range of AI capabilities into their applications with minimal setup. 
+ +## Resources +- **Website**: https://deepinfra.com/ +- **Documentation**: https://docs.deepinfra.com + +{{{tasksSection}}}