Commit 8b11e09

updates

Atticus1806 committed Dec 5, 2023
1 parent bab4c8a commit 8b11e09

Showing 146 changed files with 23,743 additions and 0 deletions.
Empty file.
Empty file.
@@ -0,0 +1 @@
PACKAGE = __package__
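# dotted module path of this package; used as the unhashed package root
# when serializing code imports (see the Import(...) call further down)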
@@ -0,0 +1,156 @@
import copy
from typing import Any, Dict

from i6_core.returnn.config import ReturnnConfig, CodeWrapper

from i6_experiments.common.setups.returnn_pytorch.serialization import (
    Collection as TorchCollection,
)
from i6_experiments.common.setups.serialization import Import
from .data.common import TrainingDatasets
from .serializer import get_pytorch_serializer_v3, PACKAGE


def get_training_config(
    training_datasets: TrainingDatasets,
    network_module: str,
    net_args: Dict[str, Any],
    config: Dict[str, Any],
    debug: bool = False,
    use_custom_engine: bool = False,
    use_speed_perturbation: bool = False,
) -> ReturnnConfig:
    """
    Returns the RETURNN training config serialized with get_pytorch_serializer_v3

    :param training_datasets: datasets for training
    :param network_module: path to the pytorch config file containing the Model
    :param net_args: extra arguments for constructing the model
    :param config: additional RETURNN config entries, merged over the base config
    :param debug: run training in debug mode (linking from recipe instead of copy)
    :param use_custom_engine: let the serializer include a custom engine from the network module
    :param use_speed_perturbation: apply legacy speed perturbation to the training audio
    :return: RETURNN training config
    """

    # changing these does not change the hash
    post_config = {
        "cleanup_old_models": True,
        "stop_on_nonfinite_train_score": True,  # this might break now with True
        "num_workers_per_gpu": 2,
    }

    base_config = {
        #############
        "train": copy.deepcopy(training_datasets.train.as_returnn_opts()),
        "dev": training_datasets.cv.as_returnn_opts(),
        "eval_datasets": {"devtrain": training_datasets.devtrain.as_returnn_opts()},
    }
    config = {**base_config, **copy.deepcopy(config)}
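    # in the merge above, user-supplied config entries override base_config
    # keys, since the later ** unpacking wins on duplicates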
post_config["backend"] = "torch"

serializer = get_pytorch_serializer_v3(
network_module=network_module, net_args=net_args, debug=debug, use_custom_engine=use_custom_engine
)
python_prolog = None

# TODO: maybe make nice
if use_speed_perturbation:
prolog_serializer = TorchCollection(
serializer_objects=[
Import(
code_object_path=PACKAGE + ".dataset_code.speed_perturbation.legacy_speed_perturbation",
unhashed_package_root=PACKAGE,
)
]
)
python_prolog = [prolog_serializer]
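        # CodeWrapper writes the name unquoted into the generated config, so
        # it resolves to the function imported via the python_prolog above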
config["train"]["datasets"]["zip_dataset"]["audio"]["pre_process"] = CodeWrapper("legacy_speed_perturbation")

returnn_config = ReturnnConfig(
config=config, post_config=post_config, python_prolog=python_prolog, python_epilog=[serializer]
)
return returnn_config
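
# A minimal usage sketch (illustrative only, not part of this commit; the
# module path and argument values below are hypothetical placeholders):
#
# train_config = get_training_config(
#     training_datasets=training_datasets,  # a TrainingDatasets instance
#     network_module="pytorch_networks.example_ctc_model",
#     net_args={"model_config_dict": {}},
#     config={"batch_size": 300 * 16000, "learning_rates": [1e-3] * 100},
#     use_speed_perturbation=True,
# )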


def get_prior_config(
    training_datasets: TrainingDatasets,
    network_module: str,
    net_args: Dict[str, Any],
    config: Dict[str, Any],
    debug: bool = False,
    use_custom_engine: bool = False,
    **kwargs,
) -> ReturnnConfig:
    """
    Returns the RETURNN forward config for prior computation, serialized with get_pytorch_serializer_v3

    :param training_datasets: datasets providing the prior subset used for forwarding
    :param network_module: path to the pytorch config file containing the Model
    :param net_args: extra arguments for constructing the model
    :param config: additional RETURNN config entries, merged over the base config
    :param debug: run in debug mode (linking from recipe instead of copy)
    :param use_custom_engine: let the serializer include a custom engine from the network module
    :param kwargs: unused, accepted for call-site compatibility
    :return: RETURNN forward config
    """

    # changing these does not change the hash
    post_config = {}

    base_config = {
        #############
        "batch_size": 500 * 16000,  # 500s of audio per batch, assuming raw 16 kHz samples
        "max_seqs": 60,
        #############
        "forward": training_datasets.prior.as_returnn_opts(),
    }
    config = {**base_config, **copy.deepcopy(config)}
    post_config["backend"] = "torch"

    serializer = get_pytorch_serializer_v3(
        network_module=network_module,
        net_args=net_args,
        debug=debug,
        use_custom_engine=use_custom_engine,
        prior=True,
    )
    returnn_config = ReturnnConfig(config=config, post_config=post_config, python_epilog=[serializer])
    return returnn_config
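
# A minimal usage sketch (hypothetical values, as above):
#
# prior_config = get_prior_config(
#     training_datasets=training_datasets,
#     network_module="pytorch_networks.example_ctc_model",
#     net_args={"model_config_dict": {}},
#     config={},
# )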


def get_search_config(
    network_module: str,
    net_args: Dict[str, Any],
    decoder: str,
    decoder_args: Dict[str, Any],
    config: Dict[str, Any],
    debug: bool = False,
    use_custom_engine: bool = False,
    **kwargs,
) -> ReturnnConfig:
    """
    Returns the RETURNN search config, serialized with get_pytorch_serializer_v3

    :param network_module: path to the pytorch config file containing the Model
    :param net_args: extra arguments for constructing the model
    :param decoder: path to the decoder module to serialize
    :param decoder_args: extra arguments passed to the decoder
    :param config: additional RETURNN config entries, merged over the base config
    :param debug: run in debug mode (linking from recipe instead of copy)
    :param use_custom_engine: let the serializer include a custom engine from the network module
    :param kwargs: unused, accepted for call-site compatibility
    :return: RETURNN search config
    """

    # changing these does not change the hash
    post_config = {}

    base_config = {
        #############
        "batch_size": 240 * 16000,  # 240s of audio per batch, assuming raw 16 kHz samples
        "max_seqs": 60,
        #############
        # dataset is added later in the pipeline during search_single
    }
    config = {**base_config, **copy.deepcopy(config)}
    post_config["backend"] = "torch"

    serializer = get_pytorch_serializer_v3(
        network_module=network_module,
        net_args=net_args,
        debug=debug,
        use_custom_engine=use_custom_engine,
        decoder=decoder,
        decoder_args=decoder_args,
    )
    returnn_config = ReturnnConfig(config=config, post_config=post_config, python_epilog=[serializer])
    return returnn_config
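
# A minimal usage sketch (hypothetical module and decoder paths):
#
# search_config = get_search_config(
#     network_module="pytorch_networks.example_ctc_model",
#     net_args={"model_config_dict": {}},
#     decoder="pytorch_networks.example_ctc_decoder",
#     decoder_args={"beam_size": 12},
#     config={},
# )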
Empty file.

0 comments on commit 8b11e09
