diff --git a/training/nvidia/transformer_xl-pytorch/README.md b/training/nvidia/transformer_xl-pytorch/README.md index b43805b40..8b960c7d1 100644 --- a/training/nvidia/transformer_xl-pytorch/README.md +++ b/training/nvidia/transformer_xl-pytorch/README.md @@ -46,4 +46,5 @@ | 配置 | precision | fix_hp | e2e_time | p_whole | p_train | p_core | ppl | mem | |----------------|-----------|------------------|----------|---------|---------|--------|------|-----------| +| A100单机单卡(1x1) | fp32 | bs=60,lr=0.00025 | - | 110 | 110 | 112 | - | 15.4/40.0 | | A100单机8卡(1x8) | fp32 | bs=60,lr=0.00025 | 2412 | 873 | 873 | 890 | 49.8 | 15.6/40.0 | diff --git a/training/run_benchmarks/config/test_conf.py b/training/run_benchmarks/config/test_conf.py index 617e6ce98..1c988f61d 100644 --- a/training/run_benchmarks/config/test_conf.py +++ b/training/run_benchmarks/config/test_conf.py @@ -74,5 +74,5 @@ # "transformer:pytorch_1.13:A100:1:8:1": "/home/datasets_ckpt/transformer/train/", # "swin_transformer:pytorch_1.8:A100:1:8:1": "/raid/dataset/ImageNet_1k_2012/", - # "transformer_xl:pytorch_1.8:A100:1:8:1": "/raid/dataset/transformer_xl/coco2017/", + # "transformer_xl:pytorch_1.8:A100:1:8:1": "/raid/dataset/transformer_xl/", }