diff --git a/tests/test_tipc/static/auto_parallel/llama2/pretrain_config_llama2_7b/pretrain-llama2_7b_dynamic_auto.json b/tests/test_tipc/static/auto_parallel/llama2/pretrain_config_llama2_7b/pretrain-llama2_7b_dynamic_auto.json index c8740be72afb..d8d36a468ba9 100644 --- a/tests/test_tipc/static/auto_parallel/llama2/pretrain_config_llama2_7b/pretrain-llama2_7b_dynamic_auto.json +++ b/tests/test_tipc/static/auto_parallel/llama2/pretrain_config_llama2_7b/pretrain-llama2_7b_dynamic_auto.json @@ -21,12 +21,13 @@ "fuse_attention_qkv": true, "use_fused_rope": true, "fused_linear_param_grad_add": true, + "enable_linear_fused_grad_add": true, "max_seq_length": 4096, "learning_rate": 3e-05, "min_learning_rate": 3e-06, "warmup_steps": 30, - "logging_steps": 2, - "max_steps": 50, + "logging_steps": 10, + "max_steps": 500, "save_steps": 5000, "eval_steps": 1000, "weight_decay": 0.01, @@ -52,4 +53,4 @@ "device": "gpu", "to_static": false, "enable_auto_parallel": true -} \ No newline at end of file +}