Skip to content

Commit b5ce090

Browse files
Wauplin and github-actions[bot]
authored and committed
Update Inference Providers documentation (automated)
1 parent f666b4a commit b5ce090

19 files changed

+100
-52
lines changed

docs/inference-providers/providers/cerebras.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -50,7 +50,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
5050

5151
<InferenceSnippet
5252
pipeline=text-generation
53-
providersMapping={ {"cerebras":{"modelId":"meta-llama/Llama-3.3-70B-Instruct","providerModelId":"llama-3.3-70b"} } }
53+
providersMapping={ {"cerebras":{"modelId":"meta-llama/Llama-3.1-8B-Instruct","providerModelId":"llama3.1-8b"} } }
5454
conversational />
5555

5656

docs/inference-providers/providers/fal-ai.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -80,6 +80,6 @@ Find out more about Text To Video [here](../tasks/text_to_video).
8080

8181
<InferenceSnippet
8282
pipeline=text-to-video
83-
providersMapping={ {"fal-ai":{"modelId":"tencent/HunyuanVideo","providerModelId":"fal-ai/hunyuan-video"} } }
83+
providersMapping={ {"fal-ai":{"modelId":"Wan-AI/Wan2.1-T2V-14B","providerModelId":"fal-ai/wan-t2v"} } }
8484
/>
8585

docs/inference-providers/providers/featherless-ai.md

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -52,7 +52,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
5252

5353
<InferenceSnippet
5454
pipeline=text-generation
55-
providersMapping={ {"featherless-ai":{"modelId":"mistralai/Magistral-Small-2506","providerModelId":"mistralai/Magistral-Small-2506"} } }
55+
providersMapping={ {"featherless-ai":{"modelId":"meta-llama/Llama-3.1-8B-Instruct","providerModelId":"meta-llama/Meta-Llama-3.1-8B-Instruct"} } }
5656
conversational />
5757

5858

@@ -62,7 +62,7 @@ Find out more about Chat Completion (VLM) [here](../tasks/chat-completion).
6262

6363
<InferenceSnippet
6464
pipeline=image-text-to-text
65-
providersMapping={ {"featherless-ai":{"modelId":"CEIA-UFG/Gemma-3-Gaia-PT-BR-4b-it","providerModelId":"CEIA-UFG/Gemma-3-Gaia-PT-BR-4b-it"} } }
65+
providersMapping={ {"featherless-ai":{"modelId":"google/gemma-3-27b-it","providerModelId":"google/gemma-3-27b-it"} } }
6666
conversational />
6767

6868

@@ -72,6 +72,6 @@ Find out more about Text Generation [here](../tasks/text_generation).
7272

7373
<InferenceSnippet
7474
pipeline=text-generation
75-
providersMapping={ {"featherless-ai":{"modelId":"mistralai/Magistral-Small-2506","providerModelId":"mistralai/Magistral-Small-2506"} } }
75+
providersMapping={ {"featherless-ai":{"modelId":"meta-llama/Llama-3.1-8B-Instruct","providerModelId":"meta-llama/Meta-Llama-3.1-8B-Instruct"} } }
7676
/>
7777

docs/inference-providers/providers/fireworks-ai.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -49,7 +49,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
4949

5050
<InferenceSnippet
5151
pipeline=text-generation
52-
providersMapping={ {"fireworks-ai":{"modelId":"deepseek-ai/DeepSeek-R1-0528","providerModelId":"accounts/fireworks/models/deepseek-r1-0528"} } }
52+
providersMapping={ {"fireworks-ai":{"modelId":"moonshotai/Kimi-K2-Instruct","providerModelId":"accounts/fireworks/models/kimi-k2-instruct"} } }
5353
conversational />
5454

5555

docs/inference-providers/providers/groq.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -60,7 +60,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
6060

6161
<InferenceSnippet
6262
pipeline=text-generation
63-
providersMapping={ {"groq":{"modelId":"meta-llama/Llama-3.3-70B-Instruct","providerModelId":"llama-3.3-70b-versatile"} } }
63+
providersMapping={ {"groq":{"modelId":"moonshotai/Kimi-K2-Instruct","providerModelId":"moonshotai/kimi-k2-instruct"} } }
6464
conversational />
6565

6666

docs/inference-providers/providers/hf-inference.md

Lines changed: 45 additions & 13 deletions
Original file line number | Diff line number | Diff line change
@@ -42,19 +42,31 @@ All supported HF Inference models can be found [here](https://huggingface.co/mod
4242
HF Inference is the serverless Inference API powered by Hugging Face. This service used to be called "Inference API (serverless)" prior to Inference Providers.
4343
If you are interested in deploying models to a dedicated and autoscaling infrastructure managed by Hugging Face, check out [Inference Endpoints](https://huggingface.co/docs/inference-endpoints/index) instead.
4444

45+
As of July 2025, hf-inference focuses mostly on CPU inference (e.g. embedding, text-ranking, text-classification, or smaller LLMs that have historical importance like BERT or GPT-2).
46+
4547
## Supported tasks
4648

4749

4850
### Automatic Speech Recognition
4951

50-
Find out more about Automatic Speech Recognition [here](../tasks/automatic-speech-recognition).
52+
Find out more about Automatic Speech Recognition [here](../tasks/automatic_speech_recognition).
5153

5254
<InferenceSnippet
5355
pipeline=automatic-speech-recognition
5456
providersMapping={ {"hf-inference":{"modelId":"openai/whisper-large-v3","providerModelId":"openai/whisper-large-v3"} } }
5557
/>
5658

5759

60+
### Chat Completion (LLM)
61+
62+
Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
63+
64+
<InferenceSnippet
65+
pipeline=text-generation
66+
providersMapping={ {"hf-inference":{"modelId":"HuggingFaceTB/SmolLM3-3B","providerModelId":"HuggingFaceTB/SmolLM3-3B"} } }
67+
conversational />
68+
69+
5870
### Chat Completion (VLM)
5971

6072
Find out more about Chat Completion (VLM) [here](../tasks/chat-completion).
@@ -67,7 +79,7 @@ conversational />
6779

6880
### Feature Extraction
6981

70-
Find out more about Feature Extraction [here](../tasks/feature-extraction).
82+
Find out more about Feature Extraction [here](../tasks/feature_extraction).
7183

7284
<InferenceSnippet
7385
pipeline=feature-extraction
@@ -77,7 +89,7 @@ Find out more about Feature Extraction [here](../tasks/feature-extraction).
7789

7890
### Fill Mask
7991

80-
Find out more about Fill Mask [here](../tasks/fill-mask).
92+
Find out more about Fill Mask [here](../tasks/fill_mask).
8193

8294
<InferenceSnippet
8395
pipeline=fill-mask
@@ -87,7 +99,7 @@ Find out more about Fill Mask [here](../tasks/fill-mask).
8799

88100
### Image Classification
89101

90-
Find out more about Image Classification [here](../tasks/image-classification).
102+
Find out more about Image Classification [here](../tasks/image_classification).
91103

92104
<InferenceSnippet
93105
pipeline=image-classification
@@ -97,17 +109,17 @@ Find out more about Image Classification [here](../tasks/image-classification).
97109

98110
### Image Segmentation
99111

100-
Find out more about Image Segmentation [here](../tasks/image-segmentation).
112+
Find out more about Image Segmentation [here](../tasks/image_segmentation).
101113

102114
<InferenceSnippet
103115
pipeline=image-segmentation
104-
providersMapping={ {"hf-inference":{"modelId":"mattmdjaga/segformer_b2_clothes","providerModelId":"mattmdjaga/segformer_b2_clothes"} } }
116+
providersMapping={ {"hf-inference":{"modelId":"jonathandinu/face-parsing","providerModelId":"jonathandinu/face-parsing"} } }
105117
/>
106118

107119

108120
### Object Detection
109121

110-
Find out more about Object Detection [here](../tasks/object-detection).
122+
Find out more about Object Detection [here](../tasks/object_detection).
111123

112124
<InferenceSnippet
113125
pipeline=object-detection
@@ -117,7 +129,7 @@ Find out more about Object Detection [here](../tasks/object-detection).
117129

118130
### Question Answering
119131

120-
Find out more about Question Answering [here](../tasks/question-answering).
132+
Find out more about Question Answering [here](../tasks/question_answering).
121133

122134
<InferenceSnippet
123135
pipeline=question-answering
@@ -137,7 +149,7 @@ Find out more about Summarization [here](../tasks/summarization).
137149

138150
### Table Question Answering
139151

140-
Find out more about Table Question Answering [here](../tasks/table-question-answering).
152+
Find out more about Table Question Answering [here](../tasks/table_question_answering).
141153

142154
<InferenceSnippet
143155
pipeline=table-question-answering
@@ -147,17 +159,27 @@ Find out more about Table Question Answering [here](../tasks/table-question-answ
147159

148160
### Text Classification
149161

150-
Find out more about Text Classification [here](../tasks/text-classification).
162+
Find out more about Text Classification [here](../tasks/text_classification).
151163

152164
<InferenceSnippet
153165
pipeline=text-classification
154166
providersMapping={ {"hf-inference":{"modelId":"tabularisai/multilingual-sentiment-analysis","providerModelId":"tabularisai/multilingual-sentiment-analysis"} } }
155167
/>
156168

157169

170+
### Text Generation
171+
172+
Find out more about Text Generation [here](../tasks/text_generation).
173+
174+
<InferenceSnippet
175+
pipeline=text-generation
176+
providersMapping={ {"hf-inference":{"modelId":"HuggingFaceTB/SmolLM3-3B","providerModelId":"HuggingFaceTB/SmolLM3-3B"} } }
177+
/>
178+
179+
158180
### Text To Image
159181

160-
Find out more about Text To Image [here](../tasks/text-to-image).
182+
Find out more about Text To Image [here](../tasks/text_to_image).
161183

162184
<InferenceSnippet
163185
pipeline=text-to-image
@@ -167,7 +189,7 @@ Find out more about Text To Image [here](../tasks/text-to-image).
167189

168190
### Token Classification
169191

170-
Find out more about Token Classification [here](../tasks/token-classification).
192+
Find out more about Token Classification [here](../tasks/token_classification).
171193

172194
<InferenceSnippet
173195
pipeline=token-classification
@@ -181,6 +203,16 @@ Find out more about Translation [here](../tasks/translation).
181203

182204
<InferenceSnippet
183205
pipeline=translation
184-
providersMapping={ {"hf-inference":{"modelId":"google-t5/t5-base","providerModelId":"google-t5/t5-base"} } }
206+
providersMapping={ {"hf-inference":{"modelId":"google-t5/t5-small","providerModelId":"google-t5/t5-small"} } }
207+
/>
208+
209+
210+
### Zero Shot Classification
211+
212+
Find out more about Zero Shot Classification [here](../tasks/zero_shot_classification).
213+
214+
<InferenceSnippet
215+
pipeline=zero-shot-classification
216+
providersMapping={ {"hf-inference":{"modelId":"facebook/bart-large-mnli","providerModelId":"facebook/bart-large-mnli"} } }
185217
/>
186218

docs/inference-providers/providers/hyperbolic.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -88,7 +88,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
8888

8989
<InferenceSnippet
9090
pipeline=text-generation
91-
providersMapping={ {"hyperbolic":{"modelId":"deepseek-ai/DeepSeek-R1-0528","providerModelId":"deepseek-ai/DeepSeek-R1-0528"} } }
91+
providersMapping={ {"hyperbolic":{"modelId":"Qwen/Qwen3-Coder-480B-A35B-Instruct","providerModelId":"Qwen/Qwen3-Coder-480B-A35B-Instruct"} } }
9292
conversational />
9393

9494

docs/inference-providers/providers/nebius.md

Lines changed: 10 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -74,6 +74,16 @@ Find out more about Feature Extraction [here](../tasks/feature_extraction).
7474
/>
7575

7676

77+
### Text Generation
78+
79+
Find out more about Text Generation [here](../tasks/text_generation).
80+
81+
<InferenceSnippet
82+
pipeline=text-generation
83+
providersMapping={ {"nebius":{"modelId":"deepseek-ai/DeepSeek-R1-0528","providerModelId":"deepseek-ai/DeepSeek-R1-0528"} } }
84+
/>
85+
86+
7787
### Text To Image
7888

7989
Find out more about Text To Image [here](../tasks/text_to_image).

docs/inference-providers/providers/novita.md

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -52,7 +52,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
5252

5353
<InferenceSnippet
5454
pipeline=text-generation
55-
providersMapping={ {"novita":{"modelId":"MiniMaxAI/MiniMax-M1-80k","providerModelId":"minimaxai/minimax-m1-80k"} } }
55+
providersMapping={ {"novita":{"modelId":"moonshotai/Kimi-K2-Instruct","providerModelId":"moonshotai/kimi-k2-instruct"} } }
5656
conversational />
5757

5858

@@ -62,7 +62,7 @@ Find out more about Chat Completion (VLM) [here](../tasks/chat-completion).
6262

6363
<InferenceSnippet
6464
pipeline=image-text-to-text
65-
providersMapping={ {"novita":{"modelId":"baidu/ERNIE-4.5-VL-424B-A47B-Base-PT","providerModelId":"baidu/ernie-4.5-vl-424b-a47b"} } }
65+
providersMapping={ {"novita":{"modelId":"THUDM/GLM-4.1V-9B-Thinking","providerModelId":"thudm/glm-4.1v-9b-thinking"} } }
6666
conversational />
6767

6868

docs/inference-providers/providers/together.md

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -50,7 +50,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
5050

5151
<InferenceSnippet
5252
pipeline=text-generation
53-
providersMapping={ {"together":{"modelId":"deepseek-ai/DeepSeek-R1-0528","providerModelId":"deepseek-ai/DeepSeek-R1"} } }
53+
providersMapping={ {"together":{"modelId":"moonshotai/Kimi-K2-Instruct","providerModelId":"moonshotai/Kimi-K2-Instruct"} } }
5454
conversational />
5555

5656

@@ -70,7 +70,7 @@ Find out more about Text Generation [here](../tasks/text_generation).
7070

7171
<InferenceSnippet
7272
pipeline=text-generation
73-
providersMapping={ {"together":{"modelId":"deepseek-ai/DeepSeek-R1-0528","providerModelId":"deepseek-ai/DeepSeek-R1"} } }
73+
providersMapping={ {"together":{"modelId":"moonshotai/Kimi-K2-Instruct","providerModelId":"moonshotai/Kimi-K2-Instruct"} } }
7474
/>
7575

7676

0 commit comments

Comments
 (0)