commit 937c9dcea62540cd184fbae0f2773c29c6b90a30
parent 00cf58292862e3028972e5a314b452ee7a106d15
Author: Mike Oliphant <oliphant@nostatic.org>
Date: Sun, 7 May 2023 12:06:17 -0700
Add LSTM to easy colab (#185)
* try switching to LSTM
* remove extra bracket
* try some different layer numbers/sizes
* add model_type
* try to support both LSTM and WaveNet
* fix train call
* fix Python syntax
* add default model_type to train()
Diffstat:
2 files changed, 62 insertions(+), 11 deletions(-)
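
With this change, the easy colab can train either net from the same entry point. A minimal sketch of the intended call, assuming the notebook has already put the input/output captures where run() expects them (the epoch count here is illustrative):

    from nam.train.colab import run

    # Default behavior is unchanged (WaveNet); pass model_type="LSTM" to use
    # the new recurrent model. Any value other than "WaveNet" currently
    # selects the LSTM branch.
    run(epochs=100, model_type="LSTM", architecture="standard")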
diff --git a/nam/train/colab.py b/nam/train/colab.py
@@ -69,6 +69,7 @@ def _get_valid_export_directory():
def run(
    epochs: int = 100,
    delay: Optional[int] = None,
+    model_type: str = "WaveNet",
    architecture: str = "standard",
    lr: float = 0.004,
    lr_decay: float = 0.007,
@@ -95,6 +96,7 @@ def run(
        input_version=input_version,
        epochs=epochs,
        delay=delay,
+        model_type=model_type,
        architecture=architecture,
        lr=lr,
        lr_decay=lr_decay,
diff --git a/nam/train/core.py b/nam/train/core.py
@@ -250,6 +250,27 @@ def _calibrate_delay(
    plot(delay, input_path, output_path)
    return delay

+def _get_lstm_config(architecture):
+    return {
+        Architecture.STANDARD: {
+            "num_layers": 3,
+            "hidden_size": 24,
+            "train_burn_in": 4096,
+            "train_truncate": 512,
+        },
+        Architecture.LITE: {
+            "num_layers": 2,
+            "hidden_size": 16,
+            "train_burn_in": 4096,
+            "train_truncate": 512,
+        },
+        Architecture.FEATHER: {
+            "num_layers": 1,
+            "hidden_size": 12,
+            "train_burn_in": 4096,
+            "train_truncate": 512,
+        },
+    }[architecture]

def _check_v1(*args, **kwargs):
    return True
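
The new _get_lstm_config helper parallels the existing _get_wavenet_config: it maps each Architecture to a set of LSTM hyperparameters. For example:

    >>> _get_lstm_config(Architecture.FEATHER)
    {'num_layers': 1, 'hidden_size': 12, 'train_burn_in': 4096, 'train_truncate': 512}

All three sizes share the 4096-sample burn-in and 512-sample truncation; only the LSTM's depth and width vary. An unknown architecture raises KeyError, since the lookup indexes the dict directly.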
@@ -407,6 +428,7 @@ def _get_configs(
    output_basename: str,
    delay: int,
    epochs: int,
+    model_type: str,
    architecture: Architecture,
    ny: int,
    lr: float,
@@ -442,17 +464,42 @@ def _get_configs(
"delay": delay,
},
}
- model_config = {
- "net": {
- "name": "WaveNet",
- # This should do decently. If you really want a nice model, try turning up
- # "channels" in the first block and "input_size" in the second from 12 to 16.
- "config": _get_wavenet_config(architecture),
- },
- "loss": {"val_loss": "esr"},
- "optimizer": {"lr": lr},
- "lr_scheduler": {"class": "ExponentialLR", "kwargs": {"gamma": 1.0 - lr_decay}},
- }
+
+ if model_type == "WaveNet":
+ model_config = {
+ "net": {
+ "name": "WaveNet",
+ # This should do decently. If you really want a nice model, try turning up
+ # "channels" in the first block and "input_size" in the second from 12 to 16.
+ "config": _get_wavenet_config(architecture),
+ },
+ "loss": {"val_loss": "esr"},
+ "optimizer": {"lr": lr},
+ "lr_scheduler": {"class": "ExponentialLR", "kwargs": {"gamma": 1.0 - lr_decay}},
+ }
+ else:
+ model_config = {
+ "net": {
+ "name": "LSTM",
+ "config": _get_lstm_config(architecture),
+ },
+ "loss": {
+ "val_loss": "mse",
+ "mask_first": 4096,
+ "pre_emph_weight": 1.0,
+ "pre_emph_coef": 0.85
+ },
+ "optimizer": {
+ "lr": 0.01
+ },
+ "lr_scheduler": {
+ "class": "ExponentialLR",
+ "kwargs": {
+ "gamma": 0.995
+ }
+ }
+ }
+
if torch.cuda.is_available():
device_config = {"accelerator": "gpu", "devices": 1}
elif torch.backends.mps.is_available():
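
For reference, with Architecture.STANDARD the LSTM branch above assembles this model_config (written out by hand from the code; no new values):

    model_config = {
        "net": {
            "name": "LSTM",
            "config": {  # from _get_lstm_config(Architecture.STANDARD)
                "num_layers": 3,
                "hidden_size": 24,
                "train_burn_in": 4096,
                "train_truncate": 512,
            },
        },
        "loss": {
            "val_loss": "mse",
            "mask_first": 4096,     # matches train_burn_in
            "pre_emph_weight": 1.0,
            "pre_emph_coef": 0.85,
        },
        "optimizer": {"lr": 0.01},
        "lr_scheduler": {"class": "ExponentialLR", "kwargs": {"gamma": 0.995}},
    }

Two things worth noting: any model_type other than "WaveNet" falls into this branch, and the LSTM path pins its own learning rate and decay (0.01, gamma 0.995) rather than using the lr/lr_decay arguments that the WaveNet path honors.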
@@ -531,6 +578,7 @@ def train(
    input_version: Optional[Version] = None,
    epochs=100,
    delay=None,
+    model_type: str = "WaveNet",
    architecture: Union[Architecture, str] = Architecture.STANDARD,
    batch_size: int = 16,
    ny: int = 8192,
@@ -563,6 +611,7 @@ def train(
        output_path,
        delay,
        epochs,
+        model_type,
        Architecture(architecture),
        ny,
        lr,
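
End to end, model_type threads from the colab's run() through train() into _get_configs(). A minimal sketch of calling train() directly, assuming (as elsewhere in core.py, though not shown in these hunks) that its three leading positional arguments are the input capture, the output capture, and the training directory; the paths are illustrative:

    from nam.train.core import train

    model = train(
        "input.wav",         # reamp input capture (illustrative path)
        "output.wav",        # amp/pedal output capture (illustrative path)
        "./train_outputs",   # training directory (illustrative path)
        model_type="LSTM",   # new in this commit; default remains "WaveNet"
        epochs=100,
    )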