FlagOpen · yuzhou03 · Dec 6, 2023 · Dec 1, 2023 · Dec 1, 2023 · Dec 4, 2023
diff --git a/training/benchmarks/tacotron2/pytorch/model/data/data_function.py b/training/benchmarks/tacotron2/pytorch/model/data/data_function.py
@@ -74,7 +74,7 @@ def get_mel(self, filename):
             melspec = self.stft.mel_spectrogram(audio_norm)
             melspec = torch.squeeze(melspec, 0)
         else:
-            melspec = torch.load(filename)
+            melspec = torch.load(filename, map_location='cpu')
             assert melspec.size(0) == self.stft.n_mel_channels, (
                 'Mel dimension mismatch: given {}, expected {}'.format(
                     melspec.size(0), self.stft.n_mel_channels))

diff --git a/training/kunlunxin/tacotron2-pytorch/README.md b/training/kunlunxin/tacotron2-pytorch/README.md
@@ -18,12 +18,31 @@
 
 
 ### 运行情况
-| 训练资源 | 配置文件        | 运行时长(s) | 目标val_loss | 收敛val_loss | epoch数 | 性能(samples/s) |
-| -------- | --------------- | ----------- | ------------ | ------------ | ------- | --------------- |
-| 单机1卡  | config_R300x1x1 | /           |              | /            |         |                 |
-| 单机8卡  | config_R300x1x8 |             | 0.4852(fp32) | 0.4271(fp32) | 1235    |                 |
-| 两机8卡  | config_R300x2x8 | /           |              | /            |         |                 |
+* 通用指标
 
+| 指标名称       | 指标值                  | 特殊说明                                    |
+| -------------- | ----------------------- | ------------------------------------------- |
+| 任务类别       | SpeechSynthesis         |                                             |
+| 模型           | tacotron2               |                                             |
+| 数据集         | LJSpeech                |                                             |
+| 数据精度       | precision,见“性能指标”  | 可选fp32/amp/fp16/tf32                      |
+| 超参修改       | fix_hp,见“性能指标”     | 跑满硬件设备评测吞吐量所需特殊超参          |
+| 硬件设备简称   | Kunlunxin R300          |                                             |
+| 硬件存储使用   | mem,见“性能指标”        | 通常称为“显存”,单位为GiB                    |
+| 端到端时间     | e2e_time,见“性能指标”   | 总时间+Perf初始化等时间                     |
+| 总吞吐量       | p_whole,见“性能指标”    | 实际训练样本数除以总时间(performance_whole) |
+| 训练吞吐量     | p_train,见“性能指标”    | 不包含每个epoch末尾的评估部分耗时           |
+| **计算吞吐量** | **p_core,见“性能指标”** | 不包含数据IO部分的耗时(p_core>p_train>p_whole) |
+| 训练结果       | val_loss,见“性能指标”   | 验证loss                                    |
+| 额外修改项     | 无                      |                                             |
+
+* 性能指标
+
+| 配置                 | precision | fix_hp           | e2e_time | p_whole | p_train | p_core | val_loss | mem       |
+| -------------------- | --------- | ---------------- | -------- | ------- | ------- | ------ | -------- | --------- |
+| R300单机8卡(1x8)     | fp32      | bs=96, lr=0.001  | /        | /       | /       | /      | 0.4801   | 26.3/32.0 |
+| R300双机8卡(2x8)     | fp32      | bs=96, lr=0.001  | /        | /       | /       | /      | /        | 25.0/32.0 |
+| R300单机单卡(1x1)    | fp32      | bs=128, lr=0.001 | /        | /       | /       | /      | /        | 30.5/32.0 |
 ### 许可证
 
 Apache 2.0 license。
diff --git a/training/kunlunxin/tacotron2-pytorch/config/config_R300x1x1.py b/training/kunlunxin/tacotron2-pytorch/config/config_R300x1x1.py
@@ -0,0 +1,9 @@
+from config_common import *
+
+train_batch_size = 128
+eval_batch_size = train_batch_size
+
+warmup = 0.2
+learning_rate = 1e-3
+
+seed = 23333
diff --git a/training/kunlunxin/tacotron2-pytorch/config/config_R300x1x8.py b/training/kunlunxin/tacotron2-pytorch/config/config_R300x1x8.py
@@ -1,6 +1,6 @@
 from config_common import *
 
-train_batch_size = 48
+train_batch_size = 96
 eval_batch_size = train_batch_size
 
 warmup = 0.2

diff --git a/training/kunlunxin/tacotron2-pytorch/config/config_R300x2x8.py b/training/kunlunxin/tacotron2-pytorch/config/config_R300x2x8.py
@@ -0,0 +1,9 @@
+from config_common import *
+
+train_batch_size = 96
+eval_batch_size = train_batch_size
+
+warmup = 0.2
+learning_rate = 1e-3
+
+seed = 23333
diff --git a/training/kunlunxin/tacotron2-pytorch/config/environment_variables.sh b/training/kunlunxin/tacotron2-pytorch/config/environment_variables.sh
@@ -0,0 +1,4 @@
+export XACC=1
+export BKCL_PCIE_RING=1
+export BKCL_TIMEOUT=1800
+export XMLIR_D_XPU_L3_SIZE=10485760
diff --git a/training/run_benchmarks/config/test_conf.py b/training/run_benchmarks/config/test_conf.py
@@ -115,6 +115,7 @@
     # "bert:pytorch:R300:1:8:1": "/raid/dataset/bert_large/train",
     # "longformer:pytorch:R300:1:8:1": "/raid/dataset/longformer_train",
     # "distilbert:pytorch:R300:1:8:1": "/raid/dataset/distilbert/",
-    # "swin_transformer:pytorch:R300:1:8:1": "/raid/dataset/ImageNet_1k_2012/"
+    # "swin_transformer:pytorch:R300:1:8:1": "/raid/dataset/ImageNet_1k_2012/",
+    # "tacotron2:pytorch:R300:1:8:1": "/raid/dataset/tacotron2/LJSpeech/"
 }