diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer.py index 01ba1f1b6..9178527a6 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer.py @@ -65,6 +65,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.encoder = nn.ConformerEncoder( in_dim, nn.FeatureDim("enc", 512), diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_d384_h6_wd0_nopre_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_d384_h6_wd0_nopre_blstmf_specaug.py index 335f89588..fbe552b72 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_d384_h6_wd0_nopre_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_d384_h6_wd0_nopre_blstmf_specaug.py @@ -81,6 +81,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_d384_h6_wd0_nopre_blstmf_specaug_mgpupe4.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_d384_h6_wd0_nopre_blstmf_specaug_mgpupe4.py index 3ef0cb676..443f08443 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_d384_h6_wd0_nopre_blstmf_specaug_mgpupe4.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_d384_h6_wd0_nopre_blstmf_specaug_mgpupe4.py @@ -87,6 +87,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_d384_h6_wd0_nopre_lrd07_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_d384_h6_wd0_nopre_lrd07_blstmf_specaug.py index 6e709d3fc..9de16b0ee 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_d384_h6_wd0_nopre_lrd07_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_d384_h6_wd0_nopre_lrd07_blstmf_specaug.py @@ -81,6 +81,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_import_old_nick_att_conformer_lrs2.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_import_old_nick_att_conformer_lrs2.py index 5397946bd..95fe88a22 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_import_old_nick_att_conformer_lrs2.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_import_old_nick_att_conformer_lrs2.py @@ -378,6 +378,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_ln_pre9_d384_h6_wd0_blstmf2_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_ln_pre9_d384_h6_wd0_blstmf2_specaug.py index 09fa86733..9d5adf1c4 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_ln_pre9_d384_h6_wd0_blstmf2_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_ln_pre9_d384_h6_wd0_blstmf2_specaug.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_ln_pre9_lr02_d384_h6_wd0_blstmf2_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_ln_pre9_lr02_d384_h6_wd0_blstmf2_specaug.py index cf537580d..3d0e5d8be 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_ln_pre9_lr02_d384_h6_wd0_blstmf2_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_ln_pre9_lr02_d384_h6_wd0_blstmf2_specaug.py @@ -87,6 +87,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_nopre2_wd0_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_nopre2_wd0_blstmf_specaug.py index ebd42f875..68216d7ca 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_nopre2_wd0_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_nopre2_wd0_blstmf_specaug.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_blstmf_specaug.py index 8f9a897b3..22e957746 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_blstmf_specaug.py @@ -85,6 +85,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp3_attdrop01_aux4812.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp3_attdrop01_aux4812.py index b553cbd8f..564970867 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp3_attdrop01_aux4812.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp3_attdrop01_aux4812.py @@ -87,6 +87,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux24812f.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux24812f.py index dabae4b26..51e45c693 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux24812f.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux24812f.py @@ -87,6 +87,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48.py index 565f57eea..c9a1ffece 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48.py @@ -87,6 +87,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux4812.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux4812.py index e8b264e85..f6ad897bc 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux4812.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux4812.py @@ -87,6 +87,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux4812f.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux4812f.py index 7a69ec7da..93587c01b 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux4812f.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux4812f.py @@ -87,6 +87,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux4812ff.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux4812ff.py index 33de3735c..f46b04f0d 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux4812ff.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux4812ff.py @@ -87,6 +87,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48ff.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48ff.py index ec58d317d..f2dd3c382 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48ff.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48ff.py @@ -87,6 +87,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug.py index a57409e48..0065b0e22 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug.py @@ -86,6 +86,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01.py index 4a83c4322..dd4e31c09 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01.py @@ -86,6 +86,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_attscaledist_aux48ff.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_attscaledist_aux48ff.py index 4f94b6339..e218be387 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_attscaledist_aux48ff.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_attscaledist_aux48ff.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48.py index bda60f058..63a30187e 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48.py @@ -88,6 +88,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48_bpesample01.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48_bpesample01.py index e77a45c40..fbb19355d 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48_bpesample01.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48_bpesample01.py @@ -88,6 +88,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48_encl2_1e_2.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48_encl2_1e_2.py index 6567f1acb..06a7651e0 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48_encl2_1e_2.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48_encl2_1e_2.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, enc_l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48_encl2_1e_3.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48_encl2_1e_3.py index 9ea9d6d25..b4ed70835 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48_encl2_1e_3.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48_encl2_1e_3.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, enc_l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48ff.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48ff.py index 0d5c82d48..476add110 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48ff.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_aux48ff.py @@ -88,6 +88,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48.py index 0a9520f09..7d0d75b61 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux4812.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux4812.py index 2cda8fcc9..7a2a3ddcc 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux4812.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux4812.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux4812f.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux4812f.py index 129049f2c..1ab21db75 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux4812f.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux4812f.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux4812ff.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux4812ff.py index eb4f7e288..1cd3d5084 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux4812ff.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux4812ff.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14.py index 0a9520f09..7d0d75b61 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14_copy1.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14_copy1.py index 0a9520f09..7d0d75b61 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14_copy1.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14_copy1.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14_copy2.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14_copy2.py index 0a9520f09..7d0d75b61 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14_copy2.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14_copy2.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14_copy3.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14_copy3.py index 0a9520f09..7d0d75b61 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14_copy3.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv14_copy3.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv15.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv15.py index 5852c0006..6cc7d8de6 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv15.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv15.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv15_decwd0025.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv15_decwd0025.py index 6337f8c7b..b6ba6be8d 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv15_decwd0025.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_bhv15_decwd0025.py @@ -91,6 +91,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_lr2e_3.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_lr2e_3.py index 5aec460a1..102ff8153 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_lr2e_3.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_lr2e_3.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_lr3e_3.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_lr3e_3.py index 13d918e92..fd9663e4d 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_lr3e_3.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_aux48_lr3e_3.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_vn0025_aux48ff.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_vn0025_aux48ff.py index eb73ee5f7..7cfa005a2 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_vn0025_aux48ff.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_vn0025_aux48ff.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_vn0075_aux48.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_vn0075_aux48.py index 840eaa6c4..5abf23376 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_vn0075_aux48.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_vn0075_aux48.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_wdrop005_aux48ff.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_wdrop005_aux48ff.py index 8b4794512..6712df471 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_wdrop005_aux48ff.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_wdrop005_aux48ff.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_wdrop01_aux48.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_wdrop01_aux48.py index 0a4ca137f..61a5e4f48 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_wdrop01_aux48.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_wdrop01_aux48.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_wdrop01_aux48ff.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_wdrop01_aux48ff.py index 6f8aa0c09..6f3893cfc 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_wdrop01_aux48ff.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_wdrop01_aux48ff.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_win10_aux48_bhv15.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_win10_aux48_bhv15.py index 51806dd8a..b853861ad 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_win10_aux48_bhv15.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_win10_aux48_bhv15.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_win50_aux48_bhv15.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_win50_aux48_bhv15.py index 03d7dd5e5..1c41d08d9 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_win50_aux48_bhv15.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop01_posdrop01_win50_aux48_bhv15.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop02.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop02.py index ebf4c859c..7c49928f9 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop02.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_specaug_attdrop02.py @@ -86,6 +86,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_wdf_specaug_attdrop01_posdrop01_aux48.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_wdf_specaug_attdrop01_posdrop01_aux48.py index eefdac9a1..2b102a864 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_wdf_specaug_attdrop01_posdrop01_aux48.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_d384_h6_blstmf2_wdf_specaug_attdrop01_posdrop01_aux48.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_n8_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_n8_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48.py index 3bbadf56c..524da28f7 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_n8_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_n8_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48.py @@ -87,6 +87,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_n8_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48ff.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_n8_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48ff.py index 9b365107c..2342fd3d4 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_n8_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48ff.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_n8_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux48ff.py @@ -87,6 +87,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_transd30_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux24812f.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_transd30_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux24812f.py index d19521e05..e5c700ff3 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_transd30_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux24812f.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_transd30_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux24812f.py @@ -91,6 +91,8 @@ def __init__(self, in_dim: nn.Dim, *, epoch: int, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_transd30_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux24812ff.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_transd30_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux24812ff.py index df4f59ffa..2a0ea6f17 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_transd30_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux24812ff.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre10_transd30_d384_h6_blstmf2_oldspecaug4a_oldtwarp_attdrop01_aux24812ff.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, epoch: int, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre2_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre2_blstmf_specaug.py index ebc1ae7cc..bd48f9d8e 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre2_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre2_blstmf_specaug.py @@ -69,6 +69,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre3_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre3_blstmf_specaug.py index 0e211c90f..29bd050c2 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre3_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre3_blstmf_specaug.py @@ -73,6 +73,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre4_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre4_blstmf_specaug.py index 7e2ddc1b8..8e4c5ca55 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre4_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre4_blstmf_specaug.py @@ -77,6 +77,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre5_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre5_blstmf_specaug.py index 061c01771..5dc5c582b 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre5_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre5_blstmf_specaug.py @@ -76,6 +76,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre6_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre6_blstmf_specaug.py index 7df8108f0..a5002442a 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre6_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre6_blstmf_specaug.py @@ -77,6 +77,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre7_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre7_blstmf_specaug.py index 49857e58c..329583873 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre7_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre7_blstmf_specaug.py @@ -83,6 +83,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre8_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre8_blstmf_specaug.py index b6bb9ac64..6f8d2fa0c 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre8_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre8_blstmf_specaug.py @@ -88,6 +88,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_blstmf_specaug.py index c7e6d0208..4dc308088 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_blstmf_specaug.py @@ -87,6 +87,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_blstmf2_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_blstmf2_specaug.py index 9a04df3d1..878a34ef1 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_blstmf2_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_blstmf2_specaug.py @@ -88,6 +88,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_ks8_wd0_blstmf2_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_ks8_wd0_blstmf2_specaug.py index 8e59f668c..613dba645 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_ks8_wd0_blstmf2_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_ks8_wd0_blstmf2_specaug.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_relold_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_relold_specaug.py index 17d43c4b7..57a3f9610 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_relold_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_relold_specaug.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug.py index c703768d3..1e74061a3 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug.py @@ -88,6 +88,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_attdrop01_aux48.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_attdrop01_aux48.py index 50861b181..3eb13042d 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_attdrop01_aux48.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_attdrop01_aux48.py @@ -90,6 +90,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_attdrop01_posdrop01_aux48.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_attdrop01_posdrop01_aux48.py index d18eb3d6e..94543d001 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_attdrop01_posdrop01_aux48.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_attdrop01_posdrop01_aux48.py @@ -91,6 +91,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48.py index 56c08d2fc..50c26a934 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48.py @@ -90,6 +90,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux4812.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux4812.py index 8c255b60f..fb924b45e 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux4812.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux4812.py @@ -90,6 +90,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux4812f.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux4812f.py index 3a7551e32..aa4be2465 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux4812f.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux4812f.py @@ -90,6 +90,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48_bhv15.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48_bhv15.py index e57928efd..05691626f 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48_bhv15.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48_bhv15.py @@ -90,6 +90,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48_bhv15_copy1.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48_bhv15_copy1.py index e57928efd..05691626f 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48_bhv15_copy1.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48_bhv15_copy1.py @@ -90,6 +90,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48_bhv15_copy2.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48_bhv15_copy2.py index e57928efd..05691626f 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48_bhv15_copy2.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48_bhv15_copy2.py @@ -90,6 +90,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48ff.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48ff.py index b96461c6d..823090ef6 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48ff.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_aux48ff.py @@ -90,6 +90,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_bhv15.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_bhv15.py index 8c09337a7..0fac3fb14 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_bhv15.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_bhv15.py @@ -90,6 +90,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_bhv15_copy1.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_bhv15_copy1.py index 8c09337a7..0fac3fb14 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_bhv15_copy1.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_bhv15_copy1.py @@ -90,6 +90,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_bhv15_copy2.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_bhv15_copy2.py index 8c09337a7..0fac3fb14 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_bhv15_copy2.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_blstmf2_specaug_bhv15_copy2.py @@ -90,6 +90,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_convwei_specaug_aux48.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_convwei_specaug_aux48.py index f20a4b078..4b0e6cced 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_convwei_specaug_aux48.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_d384_h6_wd0_convwei_specaug_aux48.py @@ -88,6 +88,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_h8_wd0_blstmf2_relold_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_h8_wd0_blstmf2_relold_specaug.py index acd1937bd..a4a86d666 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_h8_wd0_blstmf2_relold_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_h8_wd0_blstmf2_relold_specaug.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_h8_wd0_blstmf2_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_h8_wd0_blstmf2_specaug.py index 19492b5cc..d63c40168 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_h8_wd0_blstmf2_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_h8_wd0_blstmf2_specaug.py @@ -88,6 +88,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_h8_wd0_bnmask_blstmf2_relold_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_h8_wd0_bnmask_blstmf2_relold_specaug.py index 32f911275..e0e836e43 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_h8_wd0_bnmask_blstmf2_relold_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_h8_wd0_bnmask_blstmf2_relold_specaug.py @@ -89,6 +89,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_wd0_blstmf2_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_wd0_blstmf2_specaug.py index f8a076ee2..eef5b3deb 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_wd0_blstmf2_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_wd0_blstmf2_specaug.py @@ -88,6 +88,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_wd0_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_wd0_blstmf_specaug.py index 7cb759861..6133c8cba 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_wd0_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_pre9_wd0_blstmf_specaug.py @@ -87,6 +87,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim, diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_prerep6noreg.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_prerep6noreg.py index 02232157f..e98f8ae53 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_prerep6noreg.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_prerep6noreg.py @@ -67,6 +67,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.encoder = nn.ConformerEncoder( in_dim, nn.FeatureDim("enc", 512), diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_prerep6noreg_blstmf.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_prerep6noreg_blstmf.py index 7243ac55d..76911120f 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_prerep6noreg_blstmf.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_prerep6noreg_blstmf.py @@ -68,6 +68,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.encoder = nn.ConformerEncoder( in_dim, nn.FeatureDim("enc", 512), diff --git a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_prerep6noreg_blstmf_specaug.py b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_prerep6noreg_blstmf_specaug.py index 262eced0d..b9eb15266 100644 --- a/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_prerep6noreg_blstmf_specaug.py +++ b/users/zeyer/experiments/exp2022_07_21_transducer/exp_fs_base/conformer_prerep6noreg_blstmf_specaug.py @@ -69,6 +69,8 @@ def __init__(self, in_dim: nn.Dim, *, l2: float = 0.0001, ): super(Model, self).__init__() + if nn.ConformerEncoderLayer.use_dropout_after_self_att: + nn.ConformerEncoderLayer.use_dropout_after_self_att = False self.in_dim = in_dim self.encoder = nn.ConformerEncoder( in_dim,