@@ -142,11 +142,11 @@ def main():
142
142
if mem_place == "none" :
143
143
cmd = ["numactl" , f"--physcpubind={ gen_threads_config (args .num_threads , n )} " ,
144
144
"/llm/llama-batched-bench" , "-m" , args .model , "-c" , str (args .kv_cache ), "-b" , "2048" , "-ub" , "512" , "-npp" , str (args .prompt_size ), "-ntg" , str (TOKENS ),
145
- "-npl" , str (args .batch_size ), "-t" , str (args .num_threads ), "-tb" , str (args .num_threads )]
145
+ "-npl" , str (args .batch_size ), "-t" , str (args .num_threads ), "-tb" , str (args .num_threads ), "--no-mmap" ]
146
146
else :
147
147
cmd = ["numactl" , f"--physcpubind={ gen_threads_config (args .num_threads , n )} " ,str (mem_place ),
148
148
"/llm/llama-batched-bench" , "-m" , args .model , "-c" , str (args .kv_cache ), "-b" , "2048" , "-ub" , "512" , "-npp" , str (args .prompt_size ), "-ntg" , str (TOKENS ),
149
- "-npl" , str (args .batch_size ), "-t" , str (args .num_threads ), "-tb" , str (args .num_threads )]
149
+ "-npl" , str (args .batch_size ), "-t" , str (args .num_threads ), "-tb" , str (args .num_threads ), "--no-mmap" ]
150
150
151
151
else :
152
152
print ("FAIL: batched-bench not found!" )
0 commit comments