Skip to content

Commit 23e4c1a

Browse files
authored
[Auto-Parallel] Add ci for tensor_fusion and overlap in auto-dy (#10598)
* Update ci_case_auto.sh
* Update ci_case_auto.sh
* Update ci_case_auto.sh
* Update ci_case_auto.sh
* Update ci_case_auto.sh
* Update ci_case_auto.sh
* Update ci_case_auto.sh
1 parent dbf9c44 commit 23e4c1a

File tree

1 file changed

+10
-4
lines changed

1 file changed

+10
-4
lines changed

scripts/distribute/ci_case_auto.sh

Lines changed: 10 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -221,15 +221,17 @@ function llama_dygraph_auto_bs4_bf16_SD2() {
221221

222222
export CUDA_DEVICE_MAX_CONNECTIONS=1
223223

224-
flags=("" "FLAGS_fuse_allreduce_in_opt" "FLAGS_fuse_reducescatter_in_opt")
224+
flags=("" "FLAGS_fuse_allreduce_in_opt" "FLAGS_fuse_reducescatter_in_opt" "FLAGS_enable_tensor_fusion FLAGS_enable_sharding_overlap")
225225
for i in "${!flags[@]}"; do
226226
flag="${flags[$i]}"
227227

228228
if [ -n "$flag" ]; then
229-
export "$flag=true"
229+
for f in $flag; do
230+
export "$f=true"
231+
done
230232
fi
231233

232-
task_name="llama_dygraph_auto_bs4_bf16_SD2_$flag"
234+
task_name="llama_dygraph_auto_bs4_bf16_SD2_$f"
233235
case_out_dir="output/$task_name"
234236
case_log_dir="output/$task_name""_log"
235237
rm -rf $case_out_dir
@@ -299,6 +301,8 @@ function llama_dygraph_auto_bs4_bf16_SD2() {
299301
loss_base=9.23502579
300302
elif [ "$flag" = "FLAGS_fuse_reducescatter_in_opt" ]; then
301303
loss_base=9.23504105
304+
elif [ "$flag" = "FLAGS_enable_tensor_fusion FLAGS_enable_sharding_overlap" ]; then
305+
loss_base=9.23504868
302306
else
303307
loss_base=-1
304308
fi
@@ -308,7 +312,9 @@ function llama_dygraph_auto_bs4_bf16_SD2() {
308312
check_result $FUNCNAME ${loss_base} ${loss} ${ips_base} ${ips} ${mem_base} ${mem}
309313

310314
if [ -n "$flag" ]; then
311-
export "$flag=false"
315+
for f in $flag; do
316+
export "$f=false"
317+
done
312318
fi
313319
done
314320
echo "=========== $FUNCNAME run end ==========="

0 commit comments

Comments
 (0)