cbensimon HF Staff committed on
Commit
6ff4937
·
1 Parent(s): fee4cc2
Files changed (1) hide show
  1. optimization.py +1 -0
optimization.py CHANGED
@@ -50,6 +50,7 @@ def optimize_pipeline_(pipeline: Callable[P, Any], *args: P.args, **kwargs: P.kw
50
  dynamic_shapes |= TRANSFORMER_DYNAMIC_SHAPES
51
 
52
  quantize_(pipeline.transformer, Float8DynamicActivationFloat8WeightConfig())
 
53
 
54
  hidden_states: torch.Tensor = call.kwargs['hidden_states']
55
  hidden_states_transposed = hidden_states.transpose(-1, -2).contiguous()
 
50
  dynamic_shapes |= TRANSFORMER_DYNAMIC_SHAPES
51
 
52
  quantize_(pipeline.transformer, Float8DynamicActivationFloat8WeightConfig())
53
+ quantize_(pipeline.transformer_2, Float8DynamicActivationFloat8WeightConfig())
54
 
55
  hidden_states: torch.Tensor = call.kwargs['hidden_states']
56
  hidden_states_transposed = hidden_states.transpose(-1, -2).contiguous()