We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 66ea9d7 · commit e324df8 · Copy full SHA for e324df8
models/tt_transformers/tt/generator_vllm.py
@@ -391,7 +391,7 @@ def initialize_vllm_model(
  max_seq_len=max_seq_len,
  n_layers=n_layers,
  dtype=ttnn.bfloat16,
- optimizations=DecodersPrecision.performance,
+ optimizations=DecodersPrecision.accuracy,
  )
  return cls(tt_model, model_args, mesh_device)
  
0 commit comments