From b95d1fcba703e229a2070f7555e9e87e8a56ee68 Mon Sep 17 00:00:00 2001 From: zhouyu Date: Tue, 15 Aug 2023 11:24:43 +0800 Subject: [PATCH] add cpu model for nvidia training case readme --- training/nvidia/README.md | 3 ++- training/nvidia/WaveGlow-pytorch/README.md | 4 +++- training/nvidia/bert-paddle/README.md | 4 +++- training/nvidia/bert-pytorch/README.md | 4 +++- training/nvidia/bigtransfer-pytorch/README.md | 4 +++- training/nvidia/cpm-pytorch/README.md | 4 +++- training/nvidia/efficientnet-pytorch/README.md | 4 +++- training/nvidia/faster_rcnn-pytorch/README.md | 4 +++- training/nvidia/glm-pytorch/README.md | 4 +++- training/nvidia/mask_rcnn-pytorch/README.md | 4 +++- training/nvidia/mobilenetv2-pytorch/README.md | 4 +++- training/nvidia/resnet50-pytorch/README.md | 4 +++- training/nvidia/retinanet-pytorch/README.md | 4 +++- training/nvidia/swin_transformer-pytorch/README.md | 4 +++- training/nvidia/tacotron2-pytorch/README.md | 4 +++- training/nvidia/transformer-pytorch/README.md | 5 +++-- training/nvidia/vit-pytorch/README.md | 4 +++- 17 files changed, 50 insertions(+), 18 deletions(-) diff --git a/training/nvidia/README.md b/training/nvidia/README.md index 5b8c27fb9..3fdacb0e1 100644 --- a/training/nvidia/README.md +++ b/training/nvidia/README.md @@ -9,8 +9,9 @@ NVIDIA 是人工智能计算领域的领导者。率先采用加速计算,以 # FlagPerf适配验证环境说明 ## 环境配置参考 - 硬件 - - 机器型号: NVIDIA A100 + - 机器型号: NVIDIA DGX A100(40G) - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号:AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,2x200 Gb/s - 软件 - OS版本:Ubuntu 20.04 diff --git a/training/nvidia/WaveGlow-pytorch/README.md b/training/nvidia/WaveGlow-pytorch/README.md index 4d9611321..cc90a30ee 100644 --- a/training/nvidia/WaveGlow-pytorch/README.md +++ b/training/nvidia/WaveGlow-pytorch/README.md @@ -6,7 +6,9 @@ #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 diff --git a/training/nvidia/bert-paddle/README.md b/training/nvidia/bert-paddle/README.md index 4838a1279..1fee876b7 100644 --- a/training/nvidia/bert-paddle/README.md +++ b/training/nvidia/bert-paddle/README.md @@ -60,7 +60,9 @@ python run_pretraining.py ### Nvidia GPU配置与运行信息参考 #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 - OS版本:Ubuntu 20.04 diff --git a/training/nvidia/bert-pytorch/README.md b/training/nvidia/bert-pytorch/README.md index 0cfc3ef5f..7634e2069 100644 --- a/training/nvidia/bert-pytorch/README.md +++ b/training/nvidia/bert-pytorch/README.md @@ -4,7 +4,9 @@ ### Nvidia GPU配置与运行信息参考 #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 - OS版本:Ubuntu 20.04 diff --git a/training/nvidia/bigtransfer-pytorch/README.md b/training/nvidia/bigtransfer-pytorch/README.md index 9ba35e6d9..c3bc2115c 100644 --- a/training/nvidia/bigtransfer-pytorch/README.md +++ b/training/nvidia/bigtransfer-pytorch/README.md @@ -9,7 +9,9 @@ #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 diff --git a/training/nvidia/cpm-pytorch/README.md b/training/nvidia/cpm-pytorch/README.md index b6dcafa26..7f26bfccc 100644 --- a/training/nvidia/cpm-pytorch/README.md +++ b/training/nvidia/cpm-pytorch/README.md @@ -10,7 +10,9 @@ ### Nvidia GPU配置与运行信息参考 #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 - OS版本:Ubuntu 20.04 diff --git a/training/nvidia/efficientnet-pytorch/README.md b/training/nvidia/efficientnet-pytorch/README.md index aa6220031..b8cb5ebe9 100644 --- a/training/nvidia/efficientnet-pytorch/README.md +++ b/training/nvidia/efficientnet-pytorch/README.md @@ -4,7 +4,9 @@ ### Nvidia GPU配置与运行信息参考 #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 - OS版本:Ubuntu 20.04 diff --git a/training/nvidia/faster_rcnn-pytorch/README.md b/training/nvidia/faster_rcnn-pytorch/README.md index ac83f7e65..b0139de8a 100644 --- a/training/nvidia/faster_rcnn-pytorch/README.md +++ b/training/nvidia/faster_rcnn-pytorch/README.md @@ -17,7 +17,9 @@ torchvision.models.resnet.__dict__['model_urls'][ #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 diff --git a/training/nvidia/glm-pytorch/README.md b/training/nvidia/glm-pytorch/README.md index 7e325eff0..8507c2b0e 100644 --- a/training/nvidia/glm-pytorch/README.md +++ b/training/nvidia/glm-pytorch/README.md @@ -6,7 +6,9 @@ ### Nvidia GPU配置与运行信息参考 #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 - OS版本:Ubuntu 20.04 diff --git a/training/nvidia/mask_rcnn-pytorch/README.md b/training/nvidia/mask_rcnn-pytorch/README.md index 34e316aaf..19068ccad 100644 --- a/training/nvidia/mask_rcnn-pytorch/README.md +++ b/training/nvidia/mask_rcnn-pytorch/README.md @@ -7,7 +7,9 @@ #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 diff --git a/training/nvidia/mobilenetv2-pytorch/README.md b/training/nvidia/mobilenetv2-pytorch/README.md index 8d75a0ac0..996f2a1a9 100644 --- a/training/nvidia/mobilenetv2-pytorch/README.md +++ b/training/nvidia/mobilenetv2-pytorch/README.md @@ -4,7 +4,9 @@ ### Nvidia GPU配置与运行信息参考 #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 - OS版本:Ubuntu 20.04 diff --git a/training/nvidia/resnet50-pytorch/README.md b/training/nvidia/resnet50-pytorch/README.md index f71832323..c5c46a3c9 100644 --- a/training/nvidia/resnet50-pytorch/README.md +++ b/training/nvidia/resnet50-pytorch/README.md @@ -4,7 +4,9 @@ ### 2. Nvidia GPU配置与运行信息参考 #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 - OS版本:Ubuntu 20.04 diff --git a/training/nvidia/retinanet-pytorch/README.md b/training/nvidia/retinanet-pytorch/README.md index 913a26d4d..f6c58c8e4 100644 --- a/training/nvidia/retinanet-pytorch/README.md +++ b/training/nvidia/retinanet-pytorch/README.md @@ -17,7 +17,9 @@ torchvision.models.resnet.__dict__['model_urls'][ #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 diff --git a/training/nvidia/swin_transformer-pytorch/README.md b/training/nvidia/swin_transformer-pytorch/README.md index 044367102..46ac31803 100644 --- a/training/nvidia/swin_transformer-pytorch/README.md +++ b/training/nvidia/swin_transformer-pytorch/README.md @@ -4,7 +4,9 @@ ### Nvidia GPU配置与运行信息参考 #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 - OS版本:Ubuntu 20.04 diff --git a/training/nvidia/tacotron2-pytorch/README.md b/training/nvidia/tacotron2-pytorch/README.md index 4f196a543..bde167837 100644 --- a/training/nvidia/tacotron2-pytorch/README.md +++ b/training/nvidia/tacotron2-pytorch/README.md @@ -6,7 +6,9 @@ #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 diff --git a/training/nvidia/transformer-pytorch/README.md b/training/nvidia/transformer-pytorch/README.md index 50dae9fb5..775cbe3bb 100644 --- a/training/nvidia/transformer-pytorch/README.md +++ b/training/nvidia/transformer-pytorch/README.md @@ -7,8 +7,9 @@ #### 环境配置 - ##### 硬件环境 - - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 diff --git a/training/nvidia/vit-pytorch/README.md b/training/nvidia/vit-pytorch/README.md index 83d2f81f8..555a577b3 100644 --- a/training/nvidia/vit-pytorch/README.md +++ b/training/nvidia/vit-pytorch/README.md @@ -4,7 +4,9 @@ ### Nvidia GPU配置与运行信息参考 #### 环境配置 - ##### 硬件环境 - - 机器、加速卡型号: NVIDIA_A100-SXM4-40GB + - 机器型号: NVIDIA DGX A100(40G) + - 加速卡型号: NVIDIA_A100-SXM4-40GB + - CPU型号: AMD EPYC7742-64core@1.5G - 多机网络类型、带宽: InfiniBand,200Gb/s - ##### 软件环境 - OS版本:Ubuntu 20.04