Skip to content

Commit c095cf1

Browse files
committed
add variant
1 parent 37c2315 commit c095cf1

File tree

1 file changed

+6
-6
lines changed

1 file changed

+6
-6
lines changed

optimum/exporters/onnx/model_configs.py

+6-6
Original file line numberDiff line numberDiff line change
@@ -1890,15 +1890,15 @@ class LlavaOnnxConfig(OnnxConfigWithPast):
18901890

18911891
VARIANTS = {
18921892
"default": "The export follows the Transformers implementation of forward in LlavaForConditionalGeneration, with the following components exported:\n\t - "
1893-
"model.onnx: corresponds to the vision encoder + projection + decoder in a single file without past key value support in https://github.com/huggingface/transformers/blob/v4.33.2/src/transformers/models/speecht5/modeling_speecht5.py#L2544-L2556.\n\t - "
1894-
"decoder_model.onnx: corresponds to the decoder part in with past_key_values input https://github.com/huggingface/transformers/blob/v4.33.2/src/transformers/models/speecht5/modeling_speecht5.py#L2572-L2602.",
1893+
"model.onnx: corresponds to the vision encoder + projection + decoder in a single file without past key value support in https://github.com/huggingface/transformers/blob/v4.39.3/src/transformers/models/llava/modeling_llava.py#L360-L519.\n\t - "
1894+
"decoder_model.onnx: corresponds to the decoder part with past_key_values input in https://github.com/huggingface/transformers/blob/v4.39.3/src/transformers/models/llava/modeling_llava.py#L449-L489.",
18951895
"optimized": "The export follows the memory optimized implementation of Transformers forward. This is a recommended export as the decoder is exported only once. It has the following components exported:\n\t - "
1896-
"encoder_model.onnx: corresponds to the vision encoder + projection + decoder in https://github.com/huggingface/transformers/blob/v4.33.2/src/transformers/models/speecht5/modeling_speecht5.py#L2544-L2556.\n\t - "
1897-
"decoder_model.onnx: corresponds to the decoder part in https://github.com/huggingface/transformers/blob/v4.33.2/src/transformers/models/speecht5/modeling_speecht5.py#L2572-L2602.\n\t - "
1898-
"attention_position_id_generator.onnx: corresponds to attention_mask and position_ids generation when past_key_values is provided in https://github.com/huggingface/transformers/blob/v4.33.2/src/transformers/models/speecht5/modeling_speecht5.py#L2572-L2602.",
1896+
"encoder_model.onnx: corresponds to the vision encoder + projection + decoder in https://github.com/huggingface/transformers/blob/v4.39.3/src/transformers/models/llava/modeling_llava.py#L421-L445.\n\t - "
1897+
"decoder_model.onnx: corresponds to the decoder part in https://github.com/huggingface/transformers/blob/v4.39.3/src/transformers/models/llava/modeling_llava.py#L480-L489.\n\t - "
1898+
"attention_position_id_generator.onnx: corresponds to attention_mask and position_ids generation when past_key_values is provided in https://github.com/huggingface/transformers/blob/v4.39.3/src/transformers/models/llava/modeling_llava.py#L421-L478.",
18991899
}
19001900

1901-
DEFAULT_VARIANT = "default"
1901+
DEFAULT_VARIANT = "optimized"
19021902

19031903
def __init__(
19041904
self,

0 commit comments

Comments
 (0)