@@ -160,11 +160,11 @@ function llm_gpt_case_list_auto() {
160
160
fun_list=(
161
161
# The test name must have "llm_gpt_dygraph_auto_" as a prefix,
162
162
# which will be used for tracking the execution status of the case.
163
- # llm_gpt_dygraph_auto_bs8_fp32_DP2
164
- # llm_gpt_dygraph_auto_bs8_fp32_DP2-MP2
165
- # llm_gpt_dygraph_auto_bs8_fp32_DP2-MP2-PP2
166
- # llm_gpt_dygraph_auto_bs8_fp16_DP2-MP2-PP2
167
- # llm_gpt_dygraph_auto_bs8_fp16_DP2-MP2-PP2_intermediate
163
+ llm_gpt_dygraph_auto_bs8_fp32_DP2
164
+ llm_gpt_dygraph_auto_bs8_fp32_DP2-MP2
165
+ llm_gpt_dygraph_auto_bs8_fp32_DP2-MP2-PP2
166
+ llm_gpt_dygraph_auto_bs8_fp16_DP2-MP2-PP2
167
+ llm_gpt_dygraph_auto_bs8_fp16_DP2-MP2-PP2_intermediate
168
168
llm_gpt_pir_auto_bs4_TP2
169
169
llm_gpt_pir_auto_bs4_TP2_PP2
170
170
llm_gpt_pir_auto_bs8_DP2_TP2_PP2
@@ -2293,11 +2293,11 @@ function llm_gpt_dygraph_auto_bs8_fp32_DP2() {
2293
2293
ips=-1
2294
2294
mem=-1
2295
2295
echo " result: loss=$loss ips=$ips mem=$mem loss_md5=$loss_md5 "
2296
- loss_base=10.55848312 # output of dropout is different after supporting spmd
2296
+ loss_base=10.55853653 # output of dropout is different after supporting spmd
2297
2297
ips_base=-1
2298
2298
mem_base=-1
2299
2299
if [ $IS_A100 -ne 0 ]; then
2300
- loss_base=10.55920792 # after add dropout spmd
2300
+ loss_base=10.56019211 # after add dropout spmd
2301
2301
fi
2302
2302
check_result $FUNCNAME ${loss_base} ${loss} ${ips_base} ${ips} ${mem_base} ${mem}
2303
2303
echo " =========== $FUNCNAME run end ==========="
@@ -2365,11 +2365,11 @@ function llm_gpt_dygraph_auto_bs8_fp32_DP2-MP2() {
2365
2365
ips=-1
2366
2366
mem=-1
2367
2367
echo " result: loss=$loss ips=$ips mem=$mem loss_md5=$loss_md5 "
2368
- loss_base=10.56786537 # output of dropout is different after supporting spmd
2368
+ loss_base=10.5657959 # output of dropout is different after supporting spmd
2369
2369
ips_base=-1
2370
2370
mem_base=-1
2371
2371
if [ $IS_A100 -ne 0 ]; then
2372
- loss_base=10.57873726 # after add dropout spmd
2372
+ loss_base=10.5760107 # after add dropout spmd
2373
2373
fi
2374
2374
check_result $FUNCNAME ${loss_base} ${loss} ${ips_base} ${ips} ${mem_base} ${mem}
2375
2375
echo " =========== $FUNCNAME run end ==========="
@@ -2438,11 +2438,11 @@ function llm_gpt_dygraph_auto_bs8_fp32_DP2-MP2-PP2() {
2438
2438
mem=-1
2439
2439
echo " result: loss=$loss ips=$ips mem=$mem loss_md5=$loss_md5 "
2440
2440
# loss_base=10.59993172 # note: need to debug
2441
- loss_base=10.57312012 # output of dropout is different after supporting spmd
2441
+ loss_base=10.57174778 # output of dropout is different after supporting spmd
2442
2442
ips_base=-1
2443
2443
mem_base=-1
2444
2444
if [ $IS_A100 -ne 0 ]; then
2445
- loss_base=10.5769043 # after add dropout spmd
2445
+ loss_base=10.57701015 # after add dropout spmd
2446
2446
fi
2447
2447
check_result $FUNCNAME ${loss_base} ${loss} ${ips_base} ${ips} ${mem_base} ${mem}
2448
2448
echo " =========== $FUNCNAME run end ==========="
@@ -2511,11 +2511,11 @@ function llm_gpt_dygraph_auto_bs8_fp16_DP2-MP2-PP2() {
2511
2511
mem=-1
2512
2512
echo " result: loss=$loss ips=$ips mem=$mem loss_md5=$loss_md5 "
2513
2513
# loss_base=10.58456802 # note: need to debug
2514
- loss_base=10.57452488
2514
+ loss_base=10.57304478
2515
2515
ips_base=-1
2516
2516
mem_base=-1
2517
2517
if [ $IS_A100 -ne 0 ]; then
2518
- loss_base=10.57843781 # after add dropout spmd
2518
+ loss_base=10.57861042 # after add dropout spmd
2519
2519
fi
2520
2520
check_result $FUNCNAME ${loss_base} ${loss} ${ips_base} ${ips} ${mem_base} ${mem}
2521
2521
echo " =========== $FUNCNAME run end ==========="
@@ -2585,11 +2585,11 @@ function llm_gpt_dygraph_auto_bs8_fp16_DP2-MP2-PP2_intermediate() {
2585
2585
mem=-1
2586
2586
echo " result: loss=$loss ips=$ips mem=$mem loss_md5=$loss_md5 "
2587
2587
# loss_base=10.58456802 # note: need to debug
2588
- loss_base=10.566679
2588
+ loss_base=10.56716251
2589
2589
ips_base=-1
2590
2590
mem_base=-1
2591
2591
if [ $IS_A100 -ne 0 ]; then
2592
- loss_base=10.56109619 # after add dropout spmd
2592
+ loss_base=10.56166935 # after add dropout spmd
2593
2593
fi
2594
2594
check_result $FUNCNAME ${loss_base} ${loss} ${ips_base} ${ips} ${mem_base} ${mem}
2595
2595
echo " =========== $FUNCNAME run end ==========="
0 commit comments