diff --git a/tests/multi_card_tests/pipeline_parallel/test_gpt_pp.py b/tests/multi_card_tests/pipeline_parallel/test_gpt_pp.py index 5d9796844..0f4e30bc6 100644 --- a/tests/multi_card_tests/pipeline_parallel/test_gpt_pp.py +++ b/tests/multi_card_tests/pipeline_parallel/test_gpt_pp.py @@ -198,23 +198,23 @@ def test_pp(self): if paddle.distributed.get_rank() == 0: baseline = { - "_layers.9.0.input_layernorm.weight": "b75652fc8c6d4bba4513e90a2c5a7596", - "_layers.9.0.mlp.down_proj.weight": "7becd6a8b649192155befc2ec16fe250", - "_layers.9.0.mlp.up_gate_proj.weight": "121d4eb684ed0c9f63b357bc00f4815a", - "_layers.9.0.post_attention_layernorm.weight": "4c3f808bf274eddd33dad2d96f4b8804", - "_layers.9.0.self_attn.k_norm.weight": "8a94851abc94463b6eee1e18440ad6ef", - "_layers.9.0.self_attn.o_proj.weight": "1d2477b05c078e71bacd435fac5731e8", - "_layers.9.0.self_attn.q_norm.weight": "ac1adb34d94a0cf8e9154ed3cbf097c0", - "_layers.9.0.self_attn.qkv_proj.weight": "1a6e380b99c46f8f360bec6dc4bbea33", - "_layers.9.1.input_layernorm.weight": "74e13bcebc22f55da1ea996996faa1f1", - "_layers.9.1.mlp.down_proj.weight": "bd18ba2e343c07ddcb43133995917c03", - "_layers.9.1.mlp.up_gate_proj.weight": "f1d4215e022a65e3401ae3e2c80fb4ba", - "_layers.9.1.post_attention_layernorm.weight": "91df0009a11c69192fafa1dd13690bff", - "_layers.9.1.self_attn.k_norm.weight": "0a17912c1aaf609354cfdb7ba9289fbb", - "_layers.9.1.self_attn.o_proj.weight": "bb579d22c85c7d7d9b266d2195dc0326", - "_layers.9.1.self_attn.q_norm.weight": "74cc012f0bc84b6aff0c3372bb62c9c4", - "_layers.9.1.self_attn.qkv_proj.weight": "d71928b0d80a20082fd7f9ed794e0cae", - "_layers.shared_layers.embed.embedding.embed_tokens.weight": "ab8ed982bcd685d6617717b0da1aafda", + "_layers.9.0.input_layernorm.weight": "34707dfb7a96f6ac9a11e7fc3713f1ea", + "_layers.9.0.mlp.down_proj.weight": "728d03046bfb2ab0e4f191d3b045c93c", + "_layers.9.0.mlp.up_gate_proj.weight": "9fdb6a2101890e7adef7b1ebbf353714", + "_layers.9.0.post_attention_layernorm.weight": "fb5064a5a66b476bec0419b3687e14bf", + "_layers.9.0.self_attn.k_norm.weight": "fde5089a9ba2b68900b994179ec0598d", + "_layers.9.0.self_attn.o_proj.weight": "76866f06592ebadcd9b9a2c55f02cb44", + "_layers.9.0.self_attn.q_norm.weight": "897588977d1854c1a1b7db8cd654107c", + "_layers.9.0.self_attn.qkv_proj.weight": "9d04ca986be4a71fee8a18254014f30e", + "_layers.9.1.input_layernorm.weight": "405839bc23ff3aef9604824c60f8f3ba", + "_layers.9.1.mlp.down_proj.weight": "b89aa17a9e18ccaa09859bea25229e05", + "_layers.9.1.mlp.up_gate_proj.weight": "e0834ac457fa687903cdb2dbb8178400", + "_layers.9.1.post_attention_layernorm.weight": "8cb08725344776fc41659930b700c337", + "_layers.9.1.self_attn.k_norm.weight": "81af5c50e3fff9ca35b6cd10050330be", + "_layers.9.1.self_attn.o_proj.weight": "6d0f4851c8f63ea3435296248992c68f", + "_layers.9.1.self_attn.q_norm.weight": "cb16a452bd7fb5fd4466d7cedca12e20", + "_layers.9.1.self_attn.qkv_proj.weight": "fe969890118275f355692eedeb446083", + "_layers.shared_layers.embed.embedding.embed_tokens.weight": "3f5909c4bd328a15662835e5c566762e", } for name, p in overlap_gpt_model.named_parameters():