We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent d7f9a40 commit 02e887b (Copy full SHA for 02e887b)
1 file changed
onnxruntime/python/tools/transformers/large_model_exporter.py
@@ -213,6 +213,7 @@ def fetch_onnx_inputs_outputs_name(
213
):
214
"""fetch onnx inputs and outputs name"""
215
num_of_past_key = 0
216
+ kv_cache_axis = {0: "batch_size"}
217
# try get num_of_past_key and shape of past_key_value
218
if past_key_values is not None:
219
num_of_past_key = len(past_key_values)
0 commit comments