Skip to content

Commit 308858a

Browse files
committed
pageattn ver
1 parent e548164 commit 308858a

1 file changed

Lines changed: 1 addition & 0 deletions

File tree

onnxruntime/contrib_ops/cuda/bert/paged_attention.cc

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -51,6 +51,7 @@ struct THEvent {
5151
};
5252

5353
struct InputMetadata {
54+
int64_t schedule_type; // 0: vllm, 1: sarathi, 2: custom, 3: self-build
5455
int64_t block_tables;
5556
int64_t max_num_blocks_per_seq;
5657
int64_t context_lens;

0 commit comments

Comments
 (0)