From aab02997f920d543c0ecf36b81bfaa032f46186f Mon Sep 17 00:00:00 2001
From: Hui Zhang <zhtclz@foxmail.com>
Date: Mon, 23 Aug 2021 06:47:36 +0000
Subject: [PATCH] fix specaug config

---
 deepspeech/frontend/augmentor/spec_augment.py  |  2 ++
 examples/aishell/s0/conf/augmentation.json     | 11 ++++++-----
 examples/aishell/s1/conf/augmentation.json     |  3 ++-
 examples/augmentation/augmentation.json        |  9 +++++----
 examples/librispeech/s0/conf/augmentation.json |  3 ++-
 examples/librispeech/s1/conf/augmentation.json |  3 ++-
 examples/librispeech/s2/conf/augmentation.json |  3 ++-
 examples/timit/s1/conf/augmentation.json       |  3 ++-
 examples/tiny/s0/conf/augmentation.json        | 12 +++++++-----
 examples/tiny/s1/conf/augmentation.json        |  3 ++-
 10 files changed, 32 insertions(+), 20 deletions(-)

diff --git a/deepspeech/frontend/augmentor/spec_augment.py b/deepspeech/frontend/augmentor/spec_augment.py
index a3f4e268..7c23b628 100644
--- a/deepspeech/frontend/augmentor/spec_augment.py
+++ b/deepspeech/frontend/augmentor/spec_augment.py
@@ -245,6 +245,8 @@ class SpecAugmentor(AugmentorBase):
         Returns:
             x (np.ndarray): `[T, F]`
         """
+        assert isinstance(x, np.ndarray)
+        assert x.ndim == 2
         x = self.time_warp(x, self.mode)
         x = self.mask_freq(x, self.replace_with_zero)
         x = self.mask_time(x, self.replace_with_zero)
diff --git a/examples/aishell/s0/conf/augmentation.json b/examples/aishell/s0/conf/augmentation.json
index 81d110b0..39afe4e6 100644
--- a/examples/aishell/s0/conf/augmentation.json
+++ b/examples/aishell/s0/conf/augmentation.json
@@ -19,17 +19,18 @@
   {
     "type": "specaug",
     "params": {
-      "F": 10,
-      "T": 50,
+      "W": 5,
+      "warp_mode": "PIL",
+      "F": 30,
       "n_freq_masks": 2,
+      "T": 40,
       "n_time_masks": 2,
       "p": 1.0,
-      "W": 80,
       "adaptive_number_ratio": 0,
       "adaptive_size_ratio": 0,
       "max_n_time_masks": 20,
-      "replace_with_zero": true
+      "replace_with_zero": false
     },
     "prob": 1.0
   }
 ]
diff --git a/examples/aishell/s1/conf/augmentation.json b/examples/aishell/s1/conf/augmentation.json
index 81d110b0..d0409b14 100644
--- a/examples/aishell/s1/conf/augmentation.json
+++ b/examples/aishell/s1/conf/augmentation.json
@@ -28,7 +28,8 @@
       "adaptive_number_ratio": 0,
       "adaptive_size_ratio": 0,
       "max_n_time_masks": 20,
-      "replace_with_zero": true
+      "replace_with_zero": true,
+      "warp_mode": "PIL"
     },
     "prob": 1.0
   }
diff --git a/examples/augmentation/augmentation.json b/examples/augmentation/augmentation.json
index baf2cac3..c99299d6 100644
--- a/examples/augmentation/augmentation.json
+++ b/examples/augmentation/augmentation.json
@@ -52,17 +52,18 @@
   {
     "type": "specaug",
     "params": {
+      "W": 80,
+      "warp_mode": "PIL",
       "F": 10,
-      "T": 50,
       "n_freq_masks": 2,
+      "T": 50,
       "n_time_masks": 2,
       "p": 1.0,
-      "W": 80,
       "adaptive_number_ratio": 0,
       "adaptive_size_ratio": 0,
       "max_n_time_masks": 20,
-      "replace_with_zero": true
+      "replace_with_zero": false
     },
-    "prob": 0.0
+    "prob": 1.0
   }
 ]
diff --git a/examples/librispeech/s0/conf/augmentation.json b/examples/librispeech/s0/conf/augmentation.json
index 81d110b0..d0409b14 100644
--- a/examples/librispeech/s0/conf/augmentation.json
+++ b/examples/librispeech/s0/conf/augmentation.json
@@ -28,7 +28,8 @@
       "adaptive_number_ratio": 0,
       "adaptive_size_ratio": 0,
       "max_n_time_masks": 20,
-      "replace_with_zero": true
+      "replace_with_zero": true,
+      "warp_mode": "PIL"
     },
     "prob": 1.0
   }
diff --git a/examples/librispeech/s1/conf/augmentation.json b/examples/librispeech/s1/conf/augmentation.json
index 7dd158eb..8e6e9704 100644
--- a/examples/librispeech/s1/conf/augmentation.json
+++ b/examples/librispeech/s1/conf/augmentation.json
@@ -28,7 +28,8 @@
       "adaptive_number_ratio": 0,
       "adaptive_size_ratio": 0,
       "max_n_time_masks": 20,
-      "replace_with_zero": true
+      "replace_with_zero": true,
+      "warp_mode": "PIL"
     },
     "prob": 1.0
   }
diff --git a/examples/librispeech/s2/conf/augmentation.json b/examples/librispeech/s2/conf/augmentation.json
index cc8c7e00..e20fc199 100644
--- a/examples/librispeech/s2/conf/augmentation.json
+++ b/examples/librispeech/s2/conf/augmentation.json
@@ -11,7 +11,8 @@
       "adaptive_number_ratio": 0,
       "adaptive_size_ratio": 0,
       "max_n_time_masks": 20,
-      "replace_with_zero": true
+      "replace_with_zero": true,
+      "warp_mode": "PIL"
     },
     "prob": 1.0
   }
diff --git a/examples/timit/s1/conf/augmentation.json b/examples/timit/s1/conf/augmentation.json
index 7dd158eb..8e6e9704 100644
--- a/examples/timit/s1/conf/augmentation.json
+++ b/examples/timit/s1/conf/augmentation.json
@@ -28,7 +28,8 @@
       "adaptive_number_ratio": 0,
       "adaptive_size_ratio": 0,
       "max_n_time_masks": 20,
-      "replace_with_zero": true
+      "replace_with_zero": true,
+      "warp_mode": "PIL"
     },
     "prob": 1.0
   }
diff --git a/examples/tiny/s0/conf/augmentation.json b/examples/tiny/s0/conf/augmentation.json
index 8f9ff7fd..83705516 100644
--- a/examples/tiny/s0/conf/augmentation.json
+++ b/examples/tiny/s0/conf/augmentation.json
@@ -6,7 +6,7 @@
       "max_speed_rate": 1.1,
       "num_rates": 3
     },
-    "prob": 1.0
+    "prob": 0.0
   },
   {
     "type": "shift",
@@ -19,16 +19,17 @@
   {
     "type": "specaug",
     "params": {
-      "F": 10,
-      "T": 50,
+      "W": 5,
+      "warp_mode": "PIL",
+      "F": 30,
       "n_freq_masks": 2,
+      "T": 40,
       "n_time_masks": 2,
       "p": 1.0,
-      "W": 80,
       "adaptive_number_ratio": 0,
       "adaptive_size_ratio": 0,
       "max_n_time_masks": 20,
       "replace_with_zero": true
     },
     "prob": 1.0
   }
diff --git a/examples/tiny/s1/conf/augmentation.json b/examples/tiny/s1/conf/augmentation.json
index 8f9ff7fd..6010c2e4 100644
--- a/examples/tiny/s1/conf/augmentation.json
+++ b/examples/tiny/s1/conf/augmentation.json
@@ -28,7 +28,8 @@
       "adaptive_number_ratio": 0,
       "adaptive_size_ratio": 0,
       "max_n_time_masks": 20,
-      "replace_with_zero": true
+      "replace_with_zero": true,
+      "warp_mode": "PIL"
     },
     "prob": 1.0
   }