Commit 496a4f6
File tree
- .claude/skills
- add-jit-kernel
- add-sgl-kernel
- ci-workflow-guide
- debug-cuda-crash
- generate-profile
- sglang-bisect-ci-regression
- write-sglang-test
- .github
- actions
- check-maintenance
- check-stage-health
- upload-cuda-coredumps
- wait-for-jobs
- linters
- workflows
- 3rdparty/amd
- sgl-kernel
- tuning
- wheel
- sgl-kernel
- sglang
- benchmark
- asr
- bench_linear_attention
- blog_v0_2
- deepseek_v3
- fla
- gsm8k
- hicache
- kernels
- all_reduce
- deepep
- deepseek
- elementwise
- flashinfer_allreduce_fusion
- fused_moe_triton
- quantization
- scheduler_batch
- sliding_window_attention_triton
- lora
- mmlu
- mmmu
- tip_suggestion
- docker
- docs
- _static/image
- advanced_features
- basic_usage
- developer_guide
- diffusion
- api
- performance
- cache
- get_started
- performance_dashboard
- platforms
- references
- frontend
- multi_node_deployment
- release_lookup
- supported_models
- extending
- image_generation
- retrieval_ranking
- specialized
- text_generation
- examples
- frontend_language/usage/rag_using_parea
- profiler/nsys_profile_tools
- runtime
- engine
- multimodal
- token_in_token_out
- python
- sglang
- benchmark
- datasets
- cli
- eval
- jit_kernel
- benchmark
- diffusion
- csrc
- diffusion
- distributed
- elementwise
- fast-hadamard-transform
- gemm
- marlin_moe
- marlin
- nvfp4
- lora
- moe
- nsa
- diffusion
- cutedsl
- triton
- flash_attention/cute
- include/sgl_kernel
- distributed
- tests
- diffusion
- triton
- lang
- backend
- multimodal_gen
- .claude
- skills
- sglang-diffusion-add-model
- sglang-diffusion-ako4all-kernel
- references
- scripts
- sglang-diffusion-benchmark-profile
- scripts
- sglang-diffusion-cuda-kernel
- references
- sglang-diffusion-performance
- sglang-diffusion-triton-kernel
- apps
- ComfyUI_SGLDiffusion
- test
- webui
- benchmarks
- configs
- models
- adapter
- dits
- encoders
- vaes
- pipeline_configs
- quantization
- sample
- csrc
- attn/vmoba_attn/tests
- render
- hunyuan3d_rasterizer
- mesh_processor
- docs
- cache
- runtime
- cache
- distributed
- entrypoints
- cli
- openai
- post_training
- layers
- attention
- backends
- lora
- quantization
- configs
- rotary_embedding
- loader
- component_loaders
- managers
- models
- adapter
- bridges
- dits
- encoders
- schedulers
- vaes
- parallel
- pipelines_core
- executors
- stages
- model_specific_stages
- pipelines
- platforms
- postprocess
- utils
- test
- cli
- manual
- scripts
- server
- ascend
- unit
- third_party
- tools
- srt
- batch_invariant_ops
- batch_overlap
- checkpoint_engine
- compilation
- configs
- connector
- constrained
- debug_utils
- comparator
- aligner
- entrypoint
- reorderer
- token_aligner
- concat_steps
- smart
- unsharder
- dims_spec
- tensor_comparator
- visualizer
- source_patcher
- disaggregation
- ascend
- base
- common
- fake
- mooncake
- mori
- nixl
- distributed
- device_communicators
- dllm
- algorithm
- mixin
- elastic_ep
- entrypoints
- anthropic
- openai
- eplb
- eplb_algorithms
- function_call
- grpc
- hardware_backend
- mlx
- npu
- attention
- graph_runner
- modules
- moe
- quantization
- layers
- attention
- fla
- linear
- kernels
- mamba
- ops
- nsa
- triton_ops
- wave_ops
- deep_gemm_wrapper
- moe
- ep_moe
- fused_moe_triton
- configs
- triton_3_4_0
- triton_3_5_1
- moe_runner
- token_dispatcher
- quantization
- compressed_tensors
- schemes
- configs
- modelslim
- schemes
- quark
- schemes
- rotary_embedding
- utils
- lora
- backend
- torch_ops
- triton_ops
- managers
- mem_cache
- hybrid_cache
- sparsity
- core
- storage
- hf3fs
- mooncake_store
- nixl
- model_executor
- model_loader
- models
- deepseek_common
- attention_forward_methods
- multimodal
- processors
- observability
- parser
- ray
- sampling
- speculative
- cpp_ngram
- tracing
- utils
- test
- ascend
- attention
- ci
- kits
- server_fixtures
- scripts
- ci_monitor
- ci
- amd
- cuda
- musa
- npu
- utils
- diffusion
- code_sync
- playground
- release
- sgl-kernel
- benchmark
- csrc
- attention
- cpu
- elementwise
- expert_specialization
- gemm
- marlin
- kvcacheio
- memory
- moe/marlin_moe_wna16
- include
- python/sgl_kernel
- testing
- tests
- spatial
- speculative
- sgl-model-gateway
- benches
- bindings
- golang/src
- python/src
- sglang_router
- src
- config
- core
- steps
- worker
- external
- local
- grpc_client
- observability
- policies
- proto
- routers
- conversations
- grpc
- common
- responses
- stages
- harmony
- responses
- regular
- responses
- openai
- responses
- tests
- api
- common
- routing
- test
- lm_eval_configs
- manual
- ep
- hicache
- layers/attention/nsa
- lora
- nightly
- piecewise_cudagraph
- quant
- vlm
- registered
- 4-gpu-models
- 8-gpu-models
- amd
- accuracy
- mi30x
- mi35x
- disaggregation
- perf/mi35x
- ascend
- basic_function
- HiCache
- parallel_strategy/expert_parallelism
- parameter
- speculative_inference
- embedding_models
- interface
- llm_models
- rerank_models
- reward_models
- vlm_models
- attention
- backends
- bench_fn
- constrained_decoding
- core
- cp
- cuda_graph
- debug_utils
- comparator
- aligner
- entrypoint
- reorderer
- token_aligner
- unsharder
- dims_spec
- tensor_comparator
- source_patcher
- disaggregation
- distributed
- dllm
- embedding
- ep
- eval
- function_call
- hicache
- kernels
- language
- layers
- mamba
- lora
- metrics
- mla
- model_loading
- models
- moe
- openai_server
- basic
- features
- function_call
- validation
- ops
- parser
- perf
- piecewise_cuda_graph
- profiling
- quant
- radix_cache
- rl
- rotary
- sampling
- scheduler
- sessions
- spec
- eagle
- utils
- tokenizer
- unit
- batch_invariant_ops
- constrained
- entrypoints
- openai
- function_call
- layers
- managers
- mem_cache
- model_executor
- model_loader
- observability
- parser
- sampling
- server_args
- utils
- utils
- vlm
- srt
- ascend
- cpu
- models
Some content is hidden
Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.
Large diffs are not rendered by default.
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
| 1 | + | |
| 2 | + | |
| 3 | + | |
| 4 | + | |
| 5 | + | |
| 6 | + | |
| 7 | + | |
| 8 | + | |
| 9 | + | |
| 10 | + | |
| 11 | + | |
| 12 | + | |
| 13 | + | |
| 14 | + | |
| 15 | + | |
| 16 | + | |
| 17 | + | |
| 18 | + | |
| 19 | + | |
| 20 | + | |
| 21 | + | |
| 22 | + | |
| 23 | + | |
| 24 | + | |
| 25 | + | |
| 26 | + | |
| 27 | + | |
| 28 | + | |
| 29 | + | |
| 30 | + | |
| 31 | + | |
| 32 | + | |
| 33 | + | |
| 34 | + | |
| 35 | + | |
| 36 | + | |
| 37 | + | |
| 38 | + | |
| 39 | + | |
| 40 | + | |
| 41 | + | |
| 42 | + | |
| 43 | + | |
| 44 | + | |
| 45 | + | |
| 46 | + | |
| 47 | + | |
| 48 | + | |
| 49 | + | |
| 50 | + | |
| 51 | + | |
| 52 | + | |
| 53 | + | |
| 54 | + | |
| 55 | + | |
| 56 | + | |
| 57 | + | |
| 58 | + | |
| 59 | + | |
| 60 | + | |
| 61 | + | |
| 62 | + | |
| 63 | + | |
| 64 | + | |
| 65 | + | |
| 66 | + | |
| 67 | + | |
| 68 | + | |
| 69 | + | |
| 70 | + | |
| 71 | + | |
| 72 | + | |
| 73 | + | |
| 74 | + | |
| 75 | + | |
| 76 | + | |
| 77 | + | |
| 78 | + | |
| 79 | + | |
| 80 | + | |
| 81 | + | |
| 82 | + | |
| 83 | + | |
| 84 | + | |
| 85 | + | |
| 86 | + | |
| 87 | + | |
| 88 | + | |
| 89 | + | |
| 90 | + | |
| 91 | + | |
| 92 | + | |
| 93 | + | |
| 94 | + | |
| 95 | + | |
| 96 | + | |
| 97 | + | |
| 98 | + | |
| 99 | + | |
| 100 | + | |
| 101 | + | |
| 102 | + | |
| 103 | + | |
| 104 | + | |
| 105 | + | |
| 106 | + | |
| 107 | + | |
| 108 | + | |
| 109 | + | |
| 110 | + | |
| 111 | + | |
| 112 | + | |
| 113 | + | |
| 114 | + | |
| 115 | + | |
| 116 | + | |
| 117 | + | |
| 118 | + | |
| 119 | + | |
| 120 | + | |
| 121 | + | |
| 122 | + | |
| 123 | + | |
| 124 | + | |
| 125 | + | |
| 126 | + | |
| 127 | + | |
| 128 | + | |
| 129 | + | |
| 130 | + | |
| 131 | + | |
| 132 | + | |
| 133 | + | |
| 134 | + | |
| 135 | + | |
| 136 | + | |
| 137 | + | |
| 138 | + | |
| 139 | + | |
| 140 | + | |
| 141 | + | |
| 142 | + | |
| 143 | + | |
| 144 | + | |
| 145 | + | |
| 146 | + | |
| 147 | + | |
| 148 | + | |
| 149 | + | |
| 150 | + | |
| 151 | + | |
| 152 | + | |
| 153 | + | |
| 154 | + | |
| 155 | + | |
| 156 | + | |
| 157 | + | |
| 158 | + | |
| 159 | + | |
| 160 | + | |
| 161 | + | |
| 162 | + | |
| 163 | + | |
| 164 | + | |
| 165 | + | |
| 166 | + | |
| 167 | + | |
| 168 | + | |
| 169 | + | |
| 170 | + | |
| 171 | + | |
| 172 | + | |
| 173 | + | |
| 174 | + | |
| 175 | + | |
| 176 | + | |
| 177 | + | |
| 178 | + | |
| 179 | + | |
| 180 | + | |
| 181 | + | |
| 182 | + | |
| 183 | + | |
| 184 | + | |
| 185 | + | |
| 186 | + | |
| 187 | + | |
| 188 | + | |
| 189 | + | |
| 190 | + | |
| 191 | + | |
| 192 | + | |
| 193 | + | |
| 194 | + | |
| 195 | + | |
| 196 | + | |
| 197 | + | |
| 198 | + | |
| 199 | + | |
| 200 | + | |
| 201 | + | |
| 202 | + | |
| 203 | + | |
| 204 | + | |
| 205 | + | |
| 206 | + | |
| 207 | + | |
| 208 | + | |
| 209 | + | |
| 210 | + | |
| 211 | + | |
| 212 | + | |
| 213 | + | |
| 214 | + | |
| 215 | + | |
| 216 | + | |
| 217 | + | |
| 218 | + | |
| 219 | + | |
| 220 | + | |
| 221 | + | |
| 222 | + | |
| 223 | + | |
| 224 | + | |
| 225 | + | |
| 226 | + | |
| 227 | + | |
| 228 | + | |
| 229 | + | |
| 230 | + | |
| 231 | + | |
| 232 | + | |
| 233 | + | |
| 234 | + | |
| 235 | + | |
| 236 | + | |
| 237 | + | |
| 238 | + | |
| 239 | + | |
| 240 | + | |
| 241 | + | |
| 242 | + | |
| 243 | + | |
| 244 | + | |
| 245 | + | |
| 246 | + | |
| 247 | + | |
| 248 | + | |
| 249 | + | |
| 250 | + | |
| 251 | + | |
| 252 | + | |
| 253 | + | |
| 254 | + | |
| 255 | + | |
| 256 | + | |
| 257 | + | |
| 258 | + | |
| 259 | + | |
| 260 | + | |
| 261 | + | |
| 262 | + | |
| 263 | + | |
| 264 | + | |
| 265 | + | |
| 266 | + | |
| 267 | + | |
| 268 | + | |
| 269 | + | |
| 270 | + | |
| 271 | + | |
| 272 | + | |
| 273 | + | |
| 274 | + | |
| 275 | + | |
| 276 | + | |
| 277 | + | |
| 278 | + | |
| 279 | + | |
| 280 | + | |
| 281 | + | |
| 282 | + | |
| 283 | + | |
| 284 | + | |
| 285 | + | |
| 286 | + | |
| 287 | + | |
| 288 | + | |
| 289 | + | |
| 290 | + | |
| 291 | + | |
| 292 | + | |
| 293 | + | |
| 294 | + | |
| 295 | + | |
| 296 | + | |
| 297 | + | |
| 298 | + | |
| 299 | + | |
| 300 | + | |
| 301 | + | |
| 302 | + | |
| 303 | + | |
| 304 | + | |
| 305 | + | |
| 306 | + | |
| 307 | + | |
| 308 | + | |
| 309 | + | |
| 310 | + | |
| 311 | + | |
| 312 | + | |
| 313 | + | |
| 314 | + | |
| 315 | + | |
| 316 | + | |
| 317 | + | |
| 318 | + | |
| 319 | + | |
| 320 | + | |
| 321 | + | |
| 322 | + | |
| 323 | + | |
| 324 | + | |
| 325 | + | |
| 326 | + | |
| 327 | + | |
| 328 | + | |
| 329 | + | |
| 330 | + | |
| 331 | + | |
| 332 | + | |
| 333 | + | |
| 334 | + | |
| 335 | + | |
| 336 | + | |
| 337 | + | |
| 338 | + | |
| 339 | + | |
| 340 | + | |
| 341 | + | |
| 342 | + | |
| 343 | + | |
| 344 | + | |
| 345 | + | |
| 346 | + | |
| 347 | + | |
| 348 | + | |
| 349 | + | |
| 350 | + | |
| 351 | + | |
| 352 | + | |
| 353 | + | |
| 354 | + | |
| 355 | + | |
| 356 | + | |
| 357 | + | |
| 358 | + | |
| 359 | + | |
| 360 | + | |
| 361 | + | |
| 362 | + | |
| 363 | + | |
0 commit comments