@@ -955,7 +955,15 @@ def test_demo_text(
955955 )
956956
957957 # Benchmark targets
958- supported_models = ["Llama-3.2-1B" , "Llama-3.2-3B" , "Llama-3.1-8B" , "Llama-3.2-11B" , "Llama-3.1-70B" , "Mistral-7B" ]
958+ supported_models = [
959+ "Llama-3.2-1B" ,
960+ "Llama-3.2-3B" ,
961+ "Llama-3.1-8B" ,
962+ "Llama-3.2-11B" ,
963+ "Llama-3.1-70B" ,
964+ "Mistral-7B" ,
965+ "Mistral-Small-3.1-24B" ,
966+ ]
959967 supported_devices = ["N150" , "P100" , "P150" , "P300" , "N300" , "P150x4" , "P150x8" , "T3K" , "TG" ]
960968
961969 tt_device_name = determine_device_name (mesh_device ) # submesh device should not decide performance target
@@ -1004,6 +1012,7 @@ def test_demo_text(
10041012 "N300_Mistral-7B" : 38 , # TODO Update target
10051013 "T3K_Mistral-7B" : 45 , # TODO Update target
10061014 "TG_Mistral-7B" : 45 , # TODO Update target
1015+ "T3K_Mistral-Small-3.1-24B" : 33 , # TODO Update target
10071016 }
10081017 if model_device_key in dict_target_decode_tok_s_u :
10091018 target_decode_tok_s_u = dict_target_decode_tok_s_u [model_device_key ]
@@ -1099,6 +1108,7 @@ def test_demo_text(
10991108 # "T3K_Qwen2.5-72B": 13, # too much variability in CI (https://github.com/tenstorrent/tt-metal/issues/24303)
11001109 "T3K_Qwen2.5-Coder-32B" : 21 ,
11011110 # "T3K_Qwen3-32B": 20, # too much variability in CI (https://github.com/tenstorrent/tt-metal/issues/24303)
1111+ "T3K_Mistral-Small-3.1-24B" : 33 , # TODO Update target
11021112 }
11031113
11041114 # Only call verify_perf if the model_device_key exists in the targets
0 commit comments