huggingface
diff --git a/docs/inference-providers/providers/cerebras.md b/docs/inference-providers/providers/cerebras.md
Lines changed: 1 addition & 1 deletion
diff --git a/docs/inference-providers/providers/fal-ai.md b/docs/inference-providers/providers/fal-ai.md
Lines changed: 1 addition & 1 deletion
diff --git a/docs/inference-providers/providers/featherless-ai.md b/docs/inference-providers/providers/featherless-ai.md
Lines changed: 3 additions & 3 deletions
diff --git a/docs/inference-providers/providers/fireworks-ai.md b/docs/inference-providers/providers/fireworks-ai.md
Lines changed: 1 addition & 1 deletion
diff --git a/docs/inference-providers/providers/groq.md b/docs/inference-providers/providers/groq.md
Lines changed: 1 addition & 1 deletion
diff --git a/docs/inference-providers/providers/hf-inference.md b/docs/inference-providers/providers/hf-inference.md
Lines changed: 45 additions & 13 deletions
diff --git a/docs/inference-providers/providers/hyperbolic.md b/docs/inference-providers/providers/hyperbolic.md
Lines changed: 1 addition & 1 deletion
diff --git a/docs/inference-providers/providers/nebius.md b/docs/inference-providers/providers/nebius.md
Lines changed: 10 additions & 0 deletions
diff --git a/docs/inference-providers/providers/novita.md b/docs/inference-providers/providers/novita.md
Lines changed: 2 additions & 2 deletions
diff --git a/docs/inference-providers/providers/together.md b/docs/inference-providers/providers/together.md
Lines changed: 2 additions & 2 deletions
@@ -50,7 +50,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
 
 <InferenceSnippet
     pipeline=text-generation
-    providersMapping={ {"cerebras":{"modelId":"meta-llama/Llama-3.3-70B-Instruct","providerModelId":"llama-3.3-70b"} } }
+    providersMapping={ {"cerebras":{"modelId":"meta-llama/Llama-3.1-8B-Instruct","providerModelId":"llama3.1-8b"} } }
 conversational />
 
 
 
@@ -80,6 +80,6 @@ Find out more about Text To Video [here](../tasks/text_to_video).
 
 <InferenceSnippet
     pipeline=text-to-video
-    providersMapping={ {"fal-ai":{"modelId":"tencent/HunyuanVideo","providerModelId":"fal-ai/hunyuan-video"} } }
+    providersMapping={ {"fal-ai":{"modelId":"Wan-AI/Wan2.1-T2V-14B","providerModelId":"fal-ai/wan-t2v"} } }
 />
 
@@ -52,7 +52,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
 
 <InferenceSnippet
     pipeline=text-generation
-    providersMapping={ {"featherless-ai":{"modelId":"mistralai/Magistral-Small-2506","providerModelId":"mistralai/Magistral-Small-2506"} } }
+    providersMapping={ {"featherless-ai":{"modelId":"meta-llama/Llama-3.1-8B-Instruct","providerModelId":"meta-llama/Meta-Llama-3.1-8B-Instruct"} } }
 conversational />
 
 
@@ -62,7 +62,7 @@ Find out more about Chat Completion (VLM) [here](../tasks/chat-completion).
 
 <InferenceSnippet
     pipeline=image-text-to-text
-    providersMapping={ {"featherless-ai":{"modelId":"CEIA-UFG/Gemma-3-Gaia-PT-BR-4b-it","providerModelId":"CEIA-UFG/Gemma-3-Gaia-PT-BR-4b-it"} } }
+    providersMapping={ {"featherless-ai":{"modelId":"google/gemma-3-27b-it","providerModelId":"google/gemma-3-27b-it"} } }
 conversational />
 
 
@@ -72,6 +72,6 @@ Find out more about Text Generation [here](../tasks/text_generation).
 
 <InferenceSnippet
     pipeline=text-generation
-    providersMapping={ {"featherless-ai":{"modelId":"mistralai/Magistral-Small-2506","providerModelId":"mistralai/Magistral-Small-2506"} } }
+    providersMapping={ {"featherless-ai":{"modelId":"meta-llama/Llama-3.1-8B-Instruct","providerModelId":"meta-llama/Meta-Llama-3.1-8B-Instruct"} } }
 />
 
@@ -49,7 +49,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
 
 <InferenceSnippet
     pipeline=text-generation
-    providersMapping={ {"fireworks-ai":{"modelId":"deepseek-ai/DeepSeek-R1-0528","providerModelId":"accounts/fireworks/models/deepseek-r1-0528"} } }
+    providersMapping={ {"fireworks-ai":{"modelId":"moonshotai/Kimi-K2-Instruct","providerModelId":"accounts/fireworks/models/kimi-k2-instruct"} } }
 conversational />
 
 
 
@@ -60,7 +60,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
 
 <InferenceSnippet
     pipeline=text-generation
-    providersMapping={ {"groq":{"modelId":"meta-llama/Llama-3.3-70B-Instruct","providerModelId":"llama-3.3-70b-versatile"} } }
+    providersMapping={ {"groq":{"modelId":"moonshotai/Kimi-K2-Instruct","providerModelId":"moonshotai/kimi-k2-instruct"} } }
 conversational />
 
 
 
@@ -42,19 +42,31 @@ All supported HF Inference models can be found [here](https://huggingface.co/mod
 HF Inference is the serverless Inference API powered by Hugging Face. Before Inference Providers was introduced, this service was called "Inference API (serverless)".
 If you are interested in deploying models to a dedicated and autoscaling infrastructure managed by Hugging Face, check out [Inference Endpoints](https://huggingface.co/docs/inference-endpoints/index) instead.
 
+As of July 2025, hf-inference focuses mostly on CPU inference (e.g., embedding, text-ranking, text-classification, or smaller LLMs of historical importance, such as BERT or GPT-2).
+
 ## Supported tasks
 
 
 ### Automatic Speech Recognition
 
-Find out more about Automatic Speech Recognition [here](../tasks/automatic-speech-recognition).
+Find out more about Automatic Speech Recognition [here](../tasks/automatic_speech_recognition).
 
 <InferenceSnippet
     pipeline=automatic-speech-recognition
     providersMapping={ {"hf-inference":{"modelId":"openai/whisper-large-v3","providerModelId":"openai/whisper-large-v3"} } }
 />
 
 
+### Chat Completion (LLM)
+
+Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
+
+<InferenceSnippet
+    pipeline=text-generation
+    providersMapping={ {"hf-inference":{"modelId":"HuggingFaceTB/SmolLM3-3B","providerModelId":"HuggingFaceTB/SmolLM3-3B"} } }
+conversational />
+
+
 ### Chat Completion (VLM)
 
 Find out more about Chat Completion (VLM) [here](../tasks/chat-completion).
@@ -67,7 +79,7 @@ conversational />
 
 ### Feature Extraction
 
-Find out more about Feature Extraction [here](../tasks/feature-extraction).
+Find out more about Feature Extraction [here](../tasks/feature_extraction).
 
 <InferenceSnippet
     pipeline=feature-extraction
@@ -77,7 +89,7 @@ Find out more about Feature Extraction [here](../tasks/feature-extraction).
 
 ### Fill Mask
 
-Find out more about Fill Mask [here](../tasks/fill-mask).
+Find out more about Fill Mask [here](../tasks/fill_mask).
 
 <InferenceSnippet
     pipeline=fill-mask
@@ -87,7 +99,7 @@ Find out more about Fill Mask [here](../tasks/fill-mask).
 
 ### Image Classification
 
-Find out more about Image Classification [here](../tasks/image-classification).
+Find out more about Image Classification [here](../tasks/image_classification).
 
 <InferenceSnippet
     pipeline=image-classification
@@ -97,17 +109,17 @@ Find out more about Image Classification [here](../tasks/image-classification).
 
 ### Image Segmentation
 
-Find out more about Image Segmentation [here](../tasks/image-segmentation).
+Find out more about Image Segmentation [here](../tasks/image_segmentation).
 
 <InferenceSnippet
     pipeline=image-segmentation
-    providersMapping={ {"hf-inference":{"modelId":"mattmdjaga/segformer_b2_clothes","providerModelId":"mattmdjaga/segformer_b2_clothes"} } }
+    providersMapping={ {"hf-inference":{"modelId":"jonathandinu/face-parsing","providerModelId":"jonathandinu/face-parsing"} } }
 />
 
 
 ### Object Detection
 
-Find out more about Object Detection [here](../tasks/object-detection).
+Find out more about Object Detection [here](../tasks/object_detection).
 
 <InferenceSnippet
     pipeline=object-detection
@@ -117,7 +129,7 @@ Find out more about Object Detection [here](../tasks/object-detection).
 
 ### Question Answering
 
-Find out more about Question Answering [here](../tasks/question-answering).
+Find out more about Question Answering [here](../tasks/question_answering).
 
 <InferenceSnippet
     pipeline=question-answering
@@ -137,7 +149,7 @@ Find out more about Summarization [here](../tasks/summarization).
 
 ### Table Question Answering
 
-Find out more about Table Question Answering [here](../tasks/table-question-answering).
+Find out more about Table Question Answering [here](../tasks/table_question_answering).
 
 <InferenceSnippet
     pipeline=table-question-answering
@@ -147,17 +159,27 @@ Find out more about Table Question Answering [here](../tasks/table-question-answ
 
 ### Text Classification
 
-Find out more about Text Classification [here](../tasks/text-classification).
+Find out more about Text Classification [here](../tasks/text_classification).
 
 <InferenceSnippet
     pipeline=text-classification
     providersMapping={ {"hf-inference":{"modelId":"tabularisai/multilingual-sentiment-analysis","providerModelId":"tabularisai/multilingual-sentiment-analysis"} } }
 />
 
 
+### Text Generation
+
+Find out more about Text Generation [here](../tasks/text_generation).
+
+<InferenceSnippet
+    pipeline=text-generation
+    providersMapping={ {"hf-inference":{"modelId":"HuggingFaceTB/SmolLM3-3B","providerModelId":"HuggingFaceTB/SmolLM3-3B"} } }
+/>
+
+
 ### Text To Image
 
-Find out more about Text To Image [here](../tasks/text-to-image).
+Find out more about Text To Image [here](../tasks/text_to_image).
 
 <InferenceSnippet
     pipeline=text-to-image
@@ -167,7 +189,7 @@ Find out more about Text To Image [here](../tasks/text-to-image).
 
 ### Token Classification
 
-Find out more about Token Classification [here](../tasks/token-classification).
+Find out more about Token Classification [here](../tasks/token_classification).
 
 <InferenceSnippet
     pipeline=token-classification
@@ -181,6 +203,16 @@ Find out more about Translation [here](../tasks/translation).
 
 <InferenceSnippet
     pipeline=translation
-    providersMapping={ {"hf-inference":{"modelId":"google-t5/t5-base","providerModelId":"google-t5/t5-base"} } }
+    providersMapping={ {"hf-inference":{"modelId":"google-t5/t5-small","providerModelId":"google-t5/t5-small"} } }
+/>
+
+
+### Zero Shot Classification
+
+Find out more about Zero Shot Classification [here](../tasks/zero_shot_classification).
+
+<InferenceSnippet
+    pipeline=zero-shot-classification
+    providersMapping={ {"hf-inference":{"modelId":"facebook/bart-large-mnli","providerModelId":"facebook/bart-large-mnli"} } }
 />
 
@@ -88,7 +88,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
 
 <InferenceSnippet
     pipeline=text-generation
-    providersMapping={ {"hyperbolic":{"modelId":"deepseek-ai/DeepSeek-R1-0528","providerModelId":"deepseek-ai/DeepSeek-R1-0528"} } }
+    providersMapping={ {"hyperbolic":{"modelId":"Qwen/Qwen3-Coder-480B-A35B-Instruct","providerModelId":"Qwen/Qwen3-Coder-480B-A35B-Instruct"} } }
 conversational />
 
 
 
@@ -74,6 +74,16 @@ Find out more about Feature Extraction [here](../tasks/feature_extraction).
 />
 
 
+### Text Generation
+
+Find out more about Text Generation [here](../tasks/text_generation).
+
+<InferenceSnippet
+    pipeline=text-generation
+    providersMapping={ {"nebius":{"modelId":"deepseek-ai/DeepSeek-R1-0528","providerModelId":"deepseek-ai/DeepSeek-R1-0528"} } }
+/>
+
+
 ### Text To Image
 
 Find out more about Text To Image [here](../tasks/text_to_image).
 
@@ -52,7 +52,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
 
 <InferenceSnippet
     pipeline=text-generation
-    providersMapping={ {"novita":{"modelId":"MiniMaxAI/MiniMax-M1-80k","providerModelId":"minimaxai/minimax-m1-80k"} } }
+    providersMapping={ {"novita":{"modelId":"moonshotai/Kimi-K2-Instruct","providerModelId":"moonshotai/kimi-k2-instruct"} } }
 conversational />
 
 
@@ -62,7 +62,7 @@ Find out more about Chat Completion (VLM) [here](../tasks/chat-completion).
 
 <InferenceSnippet
     pipeline=image-text-to-text
-    providersMapping={ {"novita":{"modelId":"baidu/ERNIE-4.5-VL-424B-A47B-Base-PT","providerModelId":"baidu/ernie-4.5-vl-424b-a47b"} } }
+    providersMapping={ {"novita":{"modelId":"THUDM/GLM-4.1V-9B-Thinking","providerModelId":"thudm/glm-4.1v-9b-thinking"} } }
 conversational />
 
 
 
@@ -50,7 +50,7 @@ Find out more about Chat Completion (LLM) [here](../tasks/chat-completion).
 
 <InferenceSnippet
     pipeline=text-generation
-    providersMapping={ {"together":{"modelId":"deepseek-ai/DeepSeek-R1-0528","providerModelId":"deepseek-ai/DeepSeek-R1"} } }
+    providersMapping={ {"together":{"modelId":"moonshotai/Kimi-K2-Instruct","providerModelId":"moonshotai/Kimi-K2-Instruct"} } }
 conversational />
 
 
@@ -70,7 +70,7 @@ Find out more about Text Generation [here](../tasks/text_generation).
 
 <InferenceSnippet
     pipeline=text-generation
-    providersMapping={ {"together":{"modelId":"deepseek-ai/DeepSeek-R1-0528","providerModelId":"deepseek-ai/DeepSeek-R1"} } }
+    providersMapping={ {"together":{"modelId":"moonshotai/Kimi-K2-Instruct","providerModelId":"moonshotai/Kimi-K2-Instruct"} } }
 />