diff --git a/examples/cpp/llama/llama_config.ini b/examples/cpp/llama/llama_config.ini index ef789d35d..3e9ea8c92 100644 --- a/examples/cpp/llama/llama_config.ini +++ b/examples/cpp/llama/llama_config.ini @@ -6,7 +6,7 @@ tensor_para_size=1 pipeline_para_size=1 model_name=llama_7b -model_dir=/notebooks/llama-2-70b-hf-ft-tp-1_llama_decoder/1/1-gpu/ +model_dir=/notebooks/code-llama-ft/code-llama-34b/code-llama-34b_llama_decoder/1/1-gpu [request] beam_width=1 # beam width for beam search @@ -17,14 +17,14 @@ repetition_penalty=1.0 ; Use for sampling presence_penalty=0.0 ; Only one of repetition_penalty and presence_penalty are allowed. len_penalty=0.0 beam_search_diversity_rate=0.0 -request_batch_size=8 # determine by the request +request_batch_size=1 # determine by the request request_output_len=32 # determine by the request [llama_7b] head_num = 64 kv_head_num = 8 size_per_head = 128 -inter_size = 28672 +inter_size = 22016 num_layer = 3 rotary_embedding = 128 layernorm_eps = 1e-05 diff --git a/examples/cpp/llama/llama_example.cc b/examples/cpp/llama/llama_example.cc index 84a0b54aa..00fa5bad5 100644 --- a/examples/cpp/llama/llama_example.cc +++ b/examples/cpp/llama/llama_example.cc @@ -44,7 +44,7 @@ int main(int argc, char* argv[]) ini_name = std::string(argv[1]); } else { - ini_name = "/notebooks/FasterTransformer/examples/cpp/llama/llama_config.ini"; + ini_name = "/notebooks/tmp/FasterTransformer/examples/cpp/llama/llama_config.ini"; } INIReader reader = INIReader(ini_name); diff --git a/examples/cpp/llama/start_ids.csv b/examples/cpp/llama/start_ids.csv index 6b8b9c375..612c85964 100644 --- a/examples/cpp/llama/start_ids.csv +++ b/examples/cpp/llama/start_ids.csv @@ -1,8 +1 @@ 1, 18637, 29892, 526, 366, 1136, 455, 2470, 29973, 1815, 366, 5193, 304, 592, 29973 -1, 18637 -1, 18637, 29892, 526, 366, 1136, 455, 2470, 29973, 1815, 366, 5193, 304, 592, 29973 -1, 18637, 29892, 526, 366, 1136, 455, 2470, 29973, 1815, 366, 5193, 304, 592, 29973 -1, 18637, 29892, 526, 366, 1136, 455, 2470, 29973, 1815, 366, 5193, 304, 592, 29973 -1, 18637, 29892, 526, 366, 1136, 455, 2470, 29973, 1815, 366, 5193, 304, 592, 29973 -1, 18637, 29892, 526, 366, 1136, 455, 2470, 29973, 1815, 366, 5193, 304, 592, 29973 -1, 18637, 29892, 526, 366, 1136