3131 CustomOpTransform ,
3232 FP16ClipTransform ,
3333 OnnxSlimTransform ,
34+ RenameFunctionOutputsTransform ,
3435 SplitTensorsTransform ,
3536)
3637from QEfficient .base .pytorch_transforms import SplitGateUpWeightsTransform
@@ -2116,7 +2117,13 @@ class QEFFAutoModelForCausalLM(QEFFBaseModel):
21162117 SplitGateUpWeightsTransform ,
21172118 KVCacheExternalModuleMapperTransform ,
21182119 ]
2119- _onnx_transforms = [FP16ClipTransform , CustomOpTransform , OnnxSlimTransform , SplitTensorsTransform ]
2120+ _onnx_transforms = [
2121+ FP16ClipTransform ,
2122+ CustomOpTransform ,
2123+ RenameFunctionOutputsTransform ,
2124+ OnnxSlimTransform ,
2125+ SplitTensorsTransform ,
2126+ ]
21202127
21212128 def __init__ (
21222129 self ,
@@ -2364,7 +2371,7 @@ def export(self, export_dir: Optional[str] = None) -> str:
23642371 for kv in ["key" , "value" ]:
23652372 example_inputs ["past_key_values" ][i ].append (torch .zeros (pkv_cache [0 ][0 ].shape , dtype = torch .float32 ))
23662373 dynamic_axes [f"past_{ kv } .{ i } " ] = pkv_dynamic_axes
2367- output_names .append (f"past_{ kv } .{ i } _RetainedState " )
2374+ output_names .append (f"past_{ kv } .{ i } _InternalRetainedState " )
23682375
23692376 else :
23702377 # HACK: create common function for this including above if condition code
@@ -2381,8 +2388,8 @@ def export(self, export_dir: Optional[str] = None) -> str:
23812388 pkv_dynamic_axes [i ][0 ] = "full_batch_size" if self .continuous_batching else "batch_size"
23822389 for kv in ["key" , "value" ]:
23832390 example_inputs ["past_key_values" ][i ].append (torch .zeros (kv_cache_shape , dtype = torch .float32 ))
2384- dynamic_axes [f"past_{ kv } .{ i } " ] = pkv_dynamic_axes [ i ]
2385- output_names .append (f"past_{ kv } .{ i } _RetainedState " )
2391+ dynamic_axes [f"past_{ kv } .{ i } " ] = pkv_dynamic_axes
2392+ output_names .append (f"past_{ kv } .{ i } _InternalRetainedState " )
23862393
23872394 if self .continuous_batching :
23882395 example_inputs ["batch_index" ] = torch .arange (bs ).view (bs , 1 )
0 commit comments