We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 64afc81 commit adf2768 · Copy full SHA for adf2768
tests/test_tipc/static/auto_parallel/llama2/benchmark_common/run_benchmark.sh
@@ -265,6 +265,7 @@ export FLAGS_use_cinn=1
265
export FLAGS_dist_prim_all=1
266
export FLAGS_prim_forward_blacklist="pd_op.stack;pd_op.squeeze;pd_op.swiglu;pd_op.squared_l2_norm"
267
export FLAGS_prim_backward_blacklist="swiglu_grad"
268
+export FLAGS_merge_all_horizontal_groups=1
269
270
# run_model.sh parses benchmark-compliant logs with analysis.py to extract
# performance data. If you are not running the integrated benchmark and only
# want the training log, you may comment out the next line; it must be
# re-enabled before submitting.
# The path is quoted so a BENCHMARK_ROOT containing spaces or glob characters
# is not word-split or expanded.
source "${BENCHMARK_ROOT}/scripts/run_model.sh"
271
# Forward this script's positional arguments to _set_params exactly as received.
# Quoting "$@" keeps each argument as a single word (no re-splitting on
# whitespace, no glob expansion) and preserves empty arguments, so positional
# indices are not shifted.
# NOTE(review): _set_params is not defined in this excerpt — presumably defined
# earlier in this script; confirm.
_set_params "$@"
0 commit comments