From 13208e23d71baa5e5024fb817a34a4dd89ce79a8 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jo=C3=A3o=20Felipe=20Santos?= Date: Tue, 20 Jan 2026 12:16:33 -0800 Subject: [PATCH 1/6] Updated how activations are initialized from config. Passing an object instead of a string is now supported. --- NAM/activations.cpp | 53 ++++++++++++ NAM/activations.h | 33 ++++--- NAM/convnet.cpp | 12 +-- NAM/convnet.h | 4 +- NAM/wavenet.cpp | 10 +-- NAM/wavenet.h | 12 +-- build/.gitignore | 4 - tools/run_tests.cpp | 9 ++ tools/test/test_activations.cpp | 114 +++++++++++++++++++++++++ tools/test/test_blending_detailed.cpp | 2 +- tools/test/test_gating_activations.cpp | 2 +- 11 files changed, 220 insertions(+), 35 deletions(-) delete mode 100644 build/.gitignore diff --git a/NAM/activations.cpp b/NAM/activations.cpp index 3db6024b..cc15c423 100644 --- a/NAM/activations.cpp +++ b/NAM/activations.cpp @@ -31,6 +31,59 @@ nam::activations::Activation* nam::activations::Activation::get_activation(const return _activations[name]; } +nam::activations::Activation* nam::activations::Activation::get_activation(const nlohmann::json& activation_config) +{ + // If it's a string, use the existing string-based lookup + if (activation_config.is_string()) + { + std::string name = activation_config.get(); + return get_activation(name); + } + + // If it's an object, parse the activation type and parameters + if (activation_config.is_object()) + { + std::string type = activation_config["type"].get(); + + // Handle different activation types with parameters + if (type == "PReLU") + { + if (activation_config.find("negative_slope") != activation_config.end()) + { + float negative_slope = activation_config["negative_slope"].get(); + return new ActivationPReLU(negative_slope); + } + else if (activation_config.find("negative_slopes") != activation_config.end()) + { + std::vector negative_slopes = activation_config["negative_slopes"].get>(); + return new ActivationPReLU(negative_slopes); + } + // If no parameters provided, use default + return new ActivationPReLU(0.01); + } + else if (type == "LeakyReLU") + { + float negative_slope = activation_config.value("negative_slope", 0.01f); + return new ActivationLeakyReLU(negative_slope); + } + else if (type == "LeakyHardTanh") + { + float min_val = activation_config.value("min_val", -1.0f); + float max_val = activation_config.value("max_val", 1.0f); + float min_slope = activation_config.value("min_slope", 0.01f); + float max_slope = activation_config.value("max_slope", 0.01f); + return new ActivationLeakyHardTanh(min_val, max_val, min_slope, max_slope); + } + else + { + // For other activation types without parameters, use the default string-based lookup + return get_activation(type); + } + } + + return nullptr; +} + void nam::activations::Activation::enable_fast_tanh() { nam::activations::Activation::using_fast_tanh = true; diff --git a/NAM/activations.h b/NAM/activations.h index 6b4b6a2d..5b239f12 100644 --- a/NAM/activations.h +++ b/NAM/activations.h @@ -6,6 +6,7 @@ #include #include #include +#include "json.hpp" namespace nam { @@ -102,6 +103,7 @@ class Activation virtual void apply(float* data, long size) {} static Activation* get_activation(const std::string name); + static Activation* get_activation(const nlohmann::json& activation_config); static void enable_fast_tanh(); static void disable_fast_tanh(); static bool using_fast_tanh; @@ -226,20 +228,31 @@ class ActivationPReLU : public Activation void apply(Eigen::MatrixXf& matrix) override { // Matrix is organized as (channels, time_steps) - 
int n_channels = negative_slopes.size(); - int actual_channels = matrix.rows(); - - // NOTE: check not done during runtime on release builds - // model loader should make sure dimensions match - assert(actual_channels == n_channels); - + unsigned long actual_channels = static_cast(matrix.rows()); + + // Prepare the slopes for the current matrix size + std::vector slopes_for_channels = negative_slopes; + + if (slopes_for_channels.size() == 1 && actual_channels > 1) + { + // Broadcast single slope to all channels + float slope = slopes_for_channels[0]; + slopes_for_channels.clear(); + slopes_for_channels.resize(actual_channels, slope); + } + else if (slopes_for_channels.size() != actual_channels) + { + // This should not happen in normal usage, but handle gracefully + slopes_for_channels.resize(actual_channels, 0.01f); // Default slope + } + // Apply each negative slope to its corresponding channel - for (int channel = 0; channel < std::min(n_channels, actual_channels); channel++) + for (unsigned long channel = 0; channel < actual_channels; channel++) { // Apply the negative slope to all time steps in this channel - for (int time_step = 0; time_step < matrix.rows(); time_step++) + for (int time_step = 0; time_step < matrix.cols(); time_step++) { - matrix(channel, time_step) = leaky_relu(matrix(channel, time_step), negative_slopes[channel]); + matrix(channel, time_step) = leaky_relu(matrix(channel, time_step), slopes_for_channels[channel]); } } } diff --git a/NAM/convnet.cpp b/NAM/convnet.cpp index 8bbcded2..a85e6c44 100644 --- a/NAM/convnet.cpp +++ b/NAM/convnet.cpp @@ -48,7 +48,7 @@ void nam::convnet::BatchNorm::process_(Eigen::MatrixXf& x, const long i_start, c } void nam::convnet::ConvNetBlock::set_weights_(const int in_channels, const int out_channels, const int _dilation, - const bool batchnorm, const std::string activation, const int groups, + const bool batchnorm, const nlohmann::json activation_config, const int groups, std::vector::iterator& weights) { this->_batchnorm = batchnorm; @@ -56,7 +56,7 @@ void nam::convnet::ConvNetBlock::set_weights_(const int in_channels, const int o this->conv.set_size_and_weights_(in_channels, out_channels, 2, _dilation, !batchnorm, groups, weights); if (this->_batchnorm) this->batchnorm = BatchNorm(out_channels, weights); - this->activation = activations::Activation::get_activation(activation); + this->activation = activations::Activation::get_activation(activation_config); } void nam::convnet::ConvNetBlock::SetMaxBufferSize(const int maxBufferSize) @@ -173,7 +173,7 @@ void nam::convnet::_Head::process_(const Eigen::MatrixXf& input, Eigen::MatrixXf } nam::convnet::ConvNet::ConvNet(const int in_channels, const int out_channels, const int channels, - const std::vector& dilations, const bool batchnorm, const std::string activation, + const std::vector& dilations, const bool batchnorm, const nlohmann::json activation_config, std::vector& weights, const double expected_sample_rate, const int groups) : Buffer(in_channels, out_channels, *std::max_element(dilations.begin(), dilations.end()), expected_sample_rate) { @@ -183,7 +183,7 @@ nam::convnet::ConvNet::ConvNet(const int in_channels, const int out_channels, co // First block takes in_channels input, subsequent blocks take channels input for (size_t i = 0; i < dilations.size(); i++) this->_blocks[i].set_weights_( - i == 0 ? in_channels : channels, channels, dilations[i], batchnorm, activation, groups, it); + i == 0 ? 
in_channels : channels, channels, dilations[i], batchnorm, activation_config, groups, it); // Only need _block_vals for the head (one entry) // Conv1D layers manage their own buffers now this->_block_vals.resize(1); @@ -327,13 +327,13 @@ std::unique_ptr nam::convnet::Factory(const nlohmann::json& config, st const int channels = config["channels"]; const std::vector dilations = config["dilations"]; const bool batchnorm = config["batchnorm"]; - const std::string activation = config["activation"]; + const nlohmann::json activation_config = config["activation"]; const int groups = config.value("groups", 1); // defaults to 1 // Default to 1 channel in/out for backward compatibility const int in_channels = config.value("in_channels", 1); const int out_channels = config.value("out_channels", 1); return std::make_unique( - in_channels, out_channels, channels, dilations, batchnorm, activation, weights, expectedSampleRate, groups); + in_channels, out_channels, channels, dilations, batchnorm, activation_config, weights, expectedSampleRate, groups); } namespace diff --git a/NAM/convnet.h b/NAM/convnet.h index d1e846c3..c4b28d81 100644 --- a/NAM/convnet.h +++ b/NAM/convnet.h @@ -44,7 +44,7 @@ class ConvNetBlock public: ConvNetBlock() {}; void set_weights_(const int in_channels, const int out_channels, const int _dilation, const bool batchnorm, - const std::string activation, const int groups, std::vector::iterator& weights); + const nlohmann::json activation_config, const int groups, std::vector::iterator& weights); void SetMaxBufferSize(const int maxBufferSize); // Process input matrix directly (new API, similar to WaveNet) void Process(const Eigen::MatrixXf& input, const int num_frames); @@ -78,7 +78,7 @@ class ConvNet : public Buffer { public: ConvNet(const int in_channels, const int out_channels, const int channels, const std::vector& dilations, - const bool batchnorm, const std::string activation, std::vector& weights, + const bool batchnorm, const nlohmann::json activation_config, std::vector& weights, const double expected_sample_rate = -1.0, const int groups = 1); ~ConvNet() = default; diff --git a/NAM/wavenet.cpp b/NAM/wavenet.cpp index 2cb749e4..121a5572 100644 --- a/NAM/wavenet.cpp +++ b/NAM/wavenet.cpp @@ -113,7 +113,7 @@ void nam::wavenet::_Layer::Process(const Eigen::MatrixXf& input, const Eigen::Ma nam::wavenet::_LayerArray::_LayerArray(const int input_size, const int condition_size, const int head_size, const int channels, const int bottleneck, const int kernel_size, - const std::vector& dilations, const std::string activation, + const std::vector& dilations, const nlohmann::json activation_config, const GatingMode gating_mode, const bool head_bias, const int groups_input, const int groups_1x1, const Head1x1Params& head1x1_params, const std::string& secondary_activation) @@ -122,7 +122,7 @@ nam::wavenet::_LayerArray::_LayerArray(const int input_size, const int condition , _bottleneck(bottleneck) { for (size_t i = 0; i < dilations.size(); i++) - this->_layers.push_back(_Layer(condition_size, channels, bottleneck, kernel_size, dilations[i], activation, + this->_layers.push_back(_Layer(condition_size, channels, bottleneck, kernel_size, dilations[i], activation_config, gating_mode, groups_input, groups_1x1, head1x1_params, secondary_activation)); } @@ -273,7 +273,7 @@ nam::wavenet::WaveNet::WaveNet(const int in_channels, this->_layer_arrays.push_back(nam::wavenet::_LayerArray( layer_array_params[i].input_size, layer_array_params[i].condition_size, layer_array_params[i].head_size, 
layer_array_params[i].channels, layer_array_params[i].bottleneck, layer_array_params[i].kernel_size, - layer_array_params[i].dilations, layer_array_params[i].activation, layer_array_params[i].gating_mode, + layer_array_params[i].dilations, layer_array_params[i].activation_config, layer_array_params[i].gating_mode, layer_array_params[i].head_bias, layer_array_params[i].groups_input, layer_array_params[i].groups_1x1, layer_array_params[i].head1x1_params, layer_array_params[i].secondary_activation)); if (i > 0) @@ -477,7 +477,7 @@ std::unique_ptr nam::wavenet::Factory(const nlohmann::json& config, st const int head_size = layer_config["head_size"]; const int kernel_size = layer_config["kernel_size"]; const auto dilations = layer_config["dilations"]; - const std::string activation = layer_config["activation"].get(); + const nlohmann::json activation_config = layer_config["activation"]; // Parse gating mode - support both old "gated" boolean and new "gating_mode" string GatingMode gating_mode = GatingMode::NONE; std::string secondary_activation; @@ -531,7 +531,7 @@ std::unique_ptr nam::wavenet::Factory(const nlohmann::json& config, st nam::wavenet::Head1x1Params head1x1_params(head1x1_active, head1x1_out_channels, head1x1_groups); layer_array_params.push_back(nam::wavenet::LayerArrayParams( - input_size, condition_size, head_size, channels, bottleneck, kernel_size, dilations, activation, gating_mode, + input_size, condition_size, head_size, channels, bottleneck, kernel_size, dilations, activation_config, gating_mode, head_bias, groups, groups_1x1, head1x1_params, secondary_activation)); } const bool with_head = !config["head"].is_null(); diff --git a/NAM/wavenet.h b/NAM/wavenet.h index e4113858..e559b223 100644 --- a/NAM/wavenet.h +++ b/NAM/wavenet.h @@ -50,12 +50,12 @@ class _Layer public: // New constructor with GatingMode enum and configurable activations _Layer(const int condition_size, const int channels, const int bottleneck, const int kernel_size, const int dilation, - const std::string activation, const GatingMode gating_mode, const int groups_input, const int groups_1x1, + const nlohmann::json activation_config, const GatingMode gating_mode, const int groups_input, const int groups_1x1, const Head1x1Params& head1x1_params, const std::string& secondary_activation) : _conv(channels, (gating_mode != GatingMode::NONE) ? 2 * bottleneck : bottleneck, kernel_size, true, dilation) , _input_mixin(condition_size, (gating_mode != GatingMode::NONE) ? 
2 * bottleneck : bottleneck, false) , _1x1(bottleneck, channels, groups_1x1) - , _activation(activations::Activation::get_activation(activation)) // needs to support activations with parameters + , _activation(activations::Activation::get_activation(activation_config)) // now supports activations with parameters , _gating_mode(gating_mode) , _bottleneck(bottleneck) { @@ -148,7 +148,7 @@ class LayerArrayParams public: LayerArrayParams(const int input_size_, const int condition_size_, const int head_size_, const int channels_, const int bottleneck_, const int kernel_size_, const std::vector&& dilations_, - const std::string activation_, const GatingMode gating_mode_, const bool head_bias_, + const nlohmann::json activation_, const GatingMode gating_mode_, const bool head_bias_, const int groups_input, const int groups_1x1_, const Head1x1Params& head1x1_params_, const std::string& secondary_activation_) : input_size(input_size_) @@ -158,7 +158,7 @@ class LayerArrayParams , bottleneck(bottleneck_) , kernel_size(kernel_size_) , dilations(std::move(dilations_)) - , activation(activation_) + , activation_config(activation_) , gating_mode(gating_mode_) , head_bias(head_bias_) , groups_input(groups_input) @@ -175,7 +175,7 @@ class LayerArrayParams const int bottleneck; const int kernel_size; std::vector dilations; - const std::string activation; + const nlohmann::json activation_config; const GatingMode gating_mode; const bool head_bias; const int groups_input; @@ -191,7 +191,7 @@ class _LayerArray // New constructor with GatingMode enum and configurable activations _LayerArray(const int input_size, const int condition_size, const int head_size, const int channels, const int bottleneck, const int kernel_size, const std::vector& dilations, - const std::string activation, const GatingMode gating_mode, const bool head_bias, const int groups_input, + const nlohmann::json activation_config, const GatingMode gating_mode, const bool head_bias, const int groups_input, const int groups_1x1, const Head1x1Params& head1x1_params, const std::string& secondary_activation); void SetMaxBufferSize(const int maxBufferSize); diff --git a/build/.gitignore b/build/.gitignore deleted file mode 100644 index 86d0cb27..00000000 --- a/build/.gitignore +++ /dev/null @@ -1,4 +0,0 @@ -# Ignore everything in this directory -* -# Except this file -!.gitignore \ No newline at end of file diff --git a/tools/run_tests.cpp b/tools/run_tests.cpp index de3a2e20..860709da 100644 --- a/tools/run_tests.cpp +++ b/tools/run_tests.cpp @@ -44,6 +44,15 @@ int main() // This is enforced by an assert so it doesn't need to be tested // test_activations::TestPReLU::test_wrong_number_of_channels(); + // JSON activation parsing tests + test_activations::TestJSONActivationParsing::test_string_activation(); + test_activations::TestJSONActivationParsing::test_json_prelu_single_slope(); + test_activations::TestJSONActivationParsing::test_json_prelu_multi_slope(); + test_activations::TestJSONActivationParsing::test_json_leaky_relu(); + test_activations::TestJSONActivationParsing::test_json_leaky_hardtanh(); + test_activations::TestJSONActivationParsing::test_json_unknown_activation(); + test_activations::TestJSONActivationParsing::test_functional_verification(); + test_dsp::test_construct(); test_dsp::test_get_input_level(); test_dsp::test_get_output_level(); diff --git a/tools/test/test_activations.cpp b/tools/test/test_activations.cpp index e9f7a86c..8f8b82ed 100644 --- a/tools/test/test_activations.cpp +++ b/tools/test/test_activations.cpp @@ -195,4 
+195,118 @@ class TestPReLU } }; +class TestJSONActivationParsing +{ +public: + static void test_string_activation() + { + nlohmann::json str_activation = "ReLU"; + auto act = nam::activations::Activation::get_activation(str_activation); + assert(act != nullptr); + // Don't delete global activation objects + } + + static void test_json_prelu_single_slope() + { + nlohmann::json prelu_single = { + {"type", "PReLU"}, + {"negative_slope", 0.25f} + }; + auto act = nam::activations::Activation::get_activation(prelu_single); + assert(act != nullptr); + delete act; // Delete dynamically allocated object + } + + static void test_json_prelu_multi_slope() + { + nlohmann::json prelu_multi = { + {"type", "PReLU"}, + {"negative_slopes", {0.1f, 0.2f, 0.3f, 0.4f}} + }; + auto act = nam::activations::Activation::get_activation(prelu_multi); + assert(act != nullptr); + delete act; // Delete dynamically allocated object + } + + static void test_json_leaky_relu() + { + nlohmann::json leaky_relu = { + {"type", "LeakyReLU"}, + {"negative_slope", 0.15f} + }; + auto act = nam::activations::Activation::get_activation(leaky_relu); + assert(act != nullptr); + delete act; // Delete dynamically allocated object + } + + static void test_json_leaky_hardtanh() + { + nlohmann::json leaky_hardtanh = { + {"type", "LeakyHardTanh"}, + {"min_val", -2.0f}, + {"max_val", 2.0f}, + {"min_slope", 0.1f}, + {"max_slope", 0.1f} + }; + auto act = nam::activations::Activation::get_activation(leaky_hardtanh); + assert(act != nullptr); + delete act; // Delete dynamically allocated object + } + + static void test_json_unknown_activation() + { + nlohmann::json unknown_activation = { + {"type", "UnknownActivation"} + }; + auto act = nam::activations::Activation::get_activation(unknown_activation); + assert(act == nullptr); // Should fail for unknown activation type + } + + static void test_functional_verification() + { + // Create test data with 4 channels and 3 time steps + Eigen::MatrixXf test_data(4, 3); + test_data << + -1.0, -0.5, 0.0, + -2.0, 0.0, 1.0, + -0.5, 0.5, 1.5, + -1.5, -1.0, 0.5; + + // Test PReLU with multiple slopes + nlohmann::json functional_prelu = { + {"type", "PReLU"}, + {"negative_slopes", {0.1f, 0.2f, 0.3f, 0.4f}} + }; + auto functional_act = nam::activations::Activation::get_activation(functional_prelu); + assert(functional_act != nullptr); + + Eigen::MatrixXf result = test_data; + functional_act->apply(result); + + // Verify specific values + // Channel 0, slope 0.1: -1.0 * 0.1 = -0.1 + assert(fabs(result(0, 0) - (-0.1f)) < 1e-6); + + // Channel 1, slope 0.2: -2.0 * 0.2 = -0.4 + assert(fabs(result(1, 0) - (-0.4f)) < 1e-6); + + // Channel 2, slope 0.3: -0.5 * 0.3 = -0.15 + assert(fabs(result(2, 0) - (-0.15f)) < 1e-6); + + // Channel 3, slope 0.4: -1.5 * 0.4 = -0.6 + assert(fabs(result(3, 0) - (-0.6f)) < 1e-6); + + // Positive values should be unchanged + for (int i = 0; i < result.rows(); i++) { + for (int j = 0; j < result.cols(); j++) { + if (test_data(i, j) >= 0) { + assert(fabs(result(i, j) - test_data(i, j)) < 1e-6); + } + } + } + + delete functional_act; + } +}; + }; // namespace test_activations diff --git a/tools/test/test_blending_detailed.cpp b/tools/test/test_blending_detailed.cpp index 7b774f5a..f8da255d 100644 --- a/tools/test/test_blending_detailed.cpp +++ b/tools/test/test_blending_detailed.cpp @@ -42,7 +42,7 @@ class TestBlendingDetailed assert(fabs(output(1, 1) - 4.0f) < 1e-6); // Test with sigmoid blending activation - nam::activations::Activation* sigmoid_act = 
nam::activations::Activation::get_activation("Sigmoid"); + nam::activations::Activation* sigmoid_act = nam::activations::Activation::get_activation(std::string("Sigmoid")); nam::gating_activations::BlendingActivation blending_act_sigmoid(&identity_act, sigmoid_act, 2); Eigen::MatrixXf output_sigmoid(2, 2); diff --git a/tools/test/test_gating_activations.cpp b/tools/test/test_gating_activations.cpp index a67b872c..3f681cb6 100644 --- a/tools/test/test_gating_activations.cpp +++ b/tools/test/test_gating_activations.cpp @@ -118,7 +118,7 @@ class TestBlendingActivation assert(fabs(output(0, 1) - (-1.0f)) < 1e-6); // Test with sigmoid blending activation - nam::activations::Activation* sigmoid_act = nam::activations::Activation::get_activation("Sigmoid"); + nam::activations::Activation* sigmoid_act = nam::activations::Activation::get_activation(std::string("Sigmoid")); nam::gating_activations::BlendingActivation blending_act2(&identity_act, sigmoid_act, 1); blending_act2.apply(input, output); From 52023ef3b0662ed37fa6373f3e0b993769223bff Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jo=C3=A3o=20Felipe=20Santos?= Date: Tue, 20 Jan 2026 12:28:11 -0800 Subject: [PATCH 2/6] Removed broadcasting from PReLU --- NAM/activations.h | 16 +++------------- 1 file changed, 3 insertions(+), 13 deletions(-) diff --git a/NAM/activations.h b/NAM/activations.h index 5b239f12..21bfb6e3 100644 --- a/NAM/activations.h +++ b/NAM/activations.h @@ -232,19 +232,9 @@ class ActivationPReLU : public Activation // Prepare the slopes for the current matrix size std::vector slopes_for_channels = negative_slopes; - - if (slopes_for_channels.size() == 1 && actual_channels > 1) - { - // Broadcast single slope to all channels - float slope = slopes_for_channels[0]; - slopes_for_channels.clear(); - slopes_for_channels.resize(actual_channels, slope); - } - else if (slopes_for_channels.size() != actual_channels) - { - // This should not happen in normal usage, but handle gracefully - slopes_for_channels.resize(actual_channels, 0.01f); // Default slope - } + + // Fail loudly if input has more channels than activation + assert(actual_channels == negative_slopes.size()); // Apply each negative slope to its corresponding channel for (unsigned long channel = 0; channel < actual_channels; channel++) From 273d53fadc7d7b59272b23b328ed819ec21983cf Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jo=C3=A3o=20Felipe=20Santos?= Date: Tue, 20 Jan 2026 14:42:48 -0800 Subject: [PATCH 3/6] Restored build/.gitignore --- build/.gitignore | 4 ++++ 1 file changed, 4 insertions(+) create mode 100644 build/.gitignore diff --git a/build/.gitignore b/build/.gitignore new file mode 100644 index 00000000..86d0cb27 --- /dev/null +++ b/build/.gitignore @@ -0,0 +1,4 @@ +# Ignore everything in this directory +* +# Except this file +!.gitignore \ No newline at end of file From ed9569bcd1413c2ec9eaea6c8281f6f6e0d4d485 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jo=C3=A3o=20Felipe=20Santos?= Date: Tue, 20 Jan 2026 16:03:48 -0800 Subject: [PATCH 4/6] Converted the output type of get_activation to a shared_ptr so callers do not have to manage memory allocated by it. 
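
For illustration only (hypothetical caller code, not part of this diff): the
returned Activation::Ptr owns any parameterized activation created on the
heap, while the built-in singletons are handed out through a non-owning
pointer with a no-op deleter, so callers never call delete either way:

    #include "NAM/activations.h"

    void apply_relu(Eigen::MatrixXf& x)
    {
      // Look up by name; parameterized configs go through the JSON overload.
      nam::activations::Activation::Ptr act =
        nam::activations::Activation::get_activation(std::string("ReLU"));
      if (act != nullptr)
        act->apply(x); // no delete; memory is released with the last reference
    }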
--- NAM/activations.cpp | 74 +++++++++++-------- NAM/activations.h | 10 ++- NAM/convnet.h | 2 +- NAM/gating_activations.h | 12 +-- NAM/wavenet.h | 2 +- tools/test/test_activations.cpp | 19 +++-- tools/test/test_blending_detailed.cpp | 16 +++- tools/test/test_gating_activations.cpp | 26 ++++--- tools/test/test_input_buffer_verification.cpp | 12 ++- .../test_wavenet_gating_compatibility.cpp | 16 +++- 10 files changed, 119 insertions(+), 70 deletions(-) diff --git a/NAM/activations.cpp b/NAM/activations.cpp index cc15c423..b084c554 100644 --- a/NAM/activations.cpp +++ b/NAM/activations.cpp @@ -1,29 +1,43 @@ #include "activations.h" -nam::activations::ActivationTanh _TANH = nam::activations::ActivationTanh(); -nam::activations::ActivationFastTanh _FAST_TANH = nam::activations::ActivationFastTanh(); -nam::activations::ActivationHardTanh _HARD_TANH = nam::activations::ActivationHardTanh(); -nam::activations::ActivationReLU _RELU = nam::activations::ActivationReLU(); -nam::activations::ActivationLeakyReLU _LEAKY_RELU = - nam::activations::ActivationLeakyReLU(0.01); // FIXME does not parameterize LeakyReLU -nam::activations::ActivationPReLU _PRELU = nam::activations::ActivationPReLU(0.01); // Same as leaky ReLU by default -nam::activations::ActivationSigmoid _SIGMOID = nam::activations::ActivationSigmoid(); -nam::activations::ActivationSwish _SWISH = nam::activations::ActivationSwish(); -nam::activations::ActivationHardSwish _HARD_SWISH = nam::activations::ActivationHardSwish(); -nam::activations::ActivationLeakyHardTanh _LEAKY_HARD_TANH = nam::activations::ActivationLeakyHardTanh(); +// Global singleton instances (statically allocated, never deleted) +static nam::activations::ActivationTanh _TANH; +static nam::activations::ActivationFastTanh _FAST_TANH; +static nam::activations::ActivationHardTanh _HARD_TANH; +static nam::activations::ActivationReLU _RELU; +static nam::activations::ActivationLeakyReLU _LEAKY_RELU(0.01); // FIXME does not parameterize LeakyReLU +static nam::activations::ActivationPReLU _PRELU(0.01); // Same as leaky ReLU by default +static nam::activations::ActivationSigmoid _SIGMOID; +static nam::activations::ActivationSwish _SWISH; +static nam::activations::ActivationHardSwish _HARD_SWISH; +static nam::activations::ActivationLeakyHardTanh _LEAKY_HARD_TANH; bool nam::activations::Activation::using_fast_tanh = false; -std::unordered_map nam::activations::Activation::_activations = { - {"Tanh", &_TANH}, {"Hardtanh", &_HARD_TANH}, {"Fasttanh", &_FAST_TANH}, - {"ReLU", &_RELU}, {"LeakyReLU", &_LEAKY_RELU}, {"Sigmoid", &_SIGMOID}, - {"SiLU", &_SWISH}, {"Hardswish", &_HARD_SWISH}, {"LeakyHardtanh", &_LEAKY_HARD_TANH}, - {"PReLU", &_PRELU}}; +// Helper to create a non-owning shared_ptr (no-op deleter) for singletons +template +nam::activations::Activation::Ptr make_singleton_ptr(T& singleton) +{ + return nam::activations::Activation::Ptr(&singleton, [](nam::activations::Activation*){}); +} + +std::unordered_map nam::activations::Activation::_activations = { + {"Tanh", make_singleton_ptr(_TANH)}, + {"Hardtanh", make_singleton_ptr(_HARD_TANH)}, + {"Fasttanh", make_singleton_ptr(_FAST_TANH)}, + {"ReLU", make_singleton_ptr(_RELU)}, + {"LeakyReLU", make_singleton_ptr(_LEAKY_RELU)}, + {"Sigmoid", make_singleton_ptr(_SIGMOID)}, + {"SiLU", make_singleton_ptr(_SWISH)}, + {"Hardswish", make_singleton_ptr(_HARD_SWISH)}, + {"LeakyHardtanh", make_singleton_ptr(_LEAKY_HARD_TANH)}, + {"PReLU", make_singleton_ptr(_PRELU)} +}; -nam::activations::Activation* tanh_bak = nullptr; 
-nam::activations::Activation* sigmoid_bak = nullptr; +nam::activations::Activation::Ptr tanh_bak = nullptr; +nam::activations::Activation::Ptr sigmoid_bak = nullptr; -nam::activations::Activation* nam::activations::Activation::get_activation(const std::string name) +nam::activations::Activation::Ptr nam::activations::Activation::get_activation(const std::string name) { if (_activations.find(name) == _activations.end()) return nullptr; @@ -31,7 +45,7 @@ nam::activations::Activation* nam::activations::Activation::get_activation(const return _activations[name]; } -nam::activations::Activation* nam::activations::Activation::get_activation(const nlohmann::json& activation_config) +nam::activations::Activation::Ptr nam::activations::Activation::get_activation(const nlohmann::json& activation_config) { // If it's a string, use the existing string-based lookup if (activation_config.is_string()) @@ -39,32 +53,33 @@ nam::activations::Activation* nam::activations::Activation::get_activation(const std::string name = activation_config.get(); return get_activation(name); } - + // If it's an object, parse the activation type and parameters if (activation_config.is_object()) { std::string type = activation_config["type"].get(); - + // Handle different activation types with parameters + // These return owning shared_ptr (will be deleted when last reference goes out of scope) if (type == "PReLU") { if (activation_config.find("negative_slope") != activation_config.end()) { float negative_slope = activation_config["negative_slope"].get(); - return new ActivationPReLU(negative_slope); + return std::make_shared(negative_slope); } else if (activation_config.find("negative_slopes") != activation_config.end()) { std::vector negative_slopes = activation_config["negative_slopes"].get>(); - return new ActivationPReLU(negative_slopes); + return std::make_shared(negative_slopes); } // If no parameters provided, use default - return new ActivationPReLU(0.01); + return std::make_shared(0.01f); } else if (type == "LeakyReLU") { float negative_slope = activation_config.value("negative_slope", 0.01f); - return new ActivationLeakyReLU(negative_slope); + return std::make_shared(negative_slope); } else if (type == "LeakyHardTanh") { @@ -72,7 +87,7 @@ nam::activations::Activation* nam::activations::Activation::get_activation(const float max_val = activation_config.value("max_val", 1.0f); float min_slope = activation_config.value("min_slope", 0.01f); float max_slope = activation_config.value("max_slope", 0.01f); - return new ActivationLeakyHardTanh(min_val, max_val, min_slope, max_slope); + return std::make_shared(min_val, max_val, min_slope, max_slope); } else { @@ -80,7 +95,7 @@ nam::activations::Activation* nam::activations::Activation::get_activation(const return get_activation(type); } } - + return nullptr; } @@ -122,8 +137,7 @@ void nam::activations::Activation::enable_lut(std::string function_name, float m { throw std::runtime_error("Tried to enable LUT for a function other than Tanh or Sigmoid"); } - FastLUTActivation lut_activation(min, max, n_points, fn); - _activations[function_name] = &lut_activation; + _activations[function_name] = std::make_shared(min, max, n_points, fn); } void nam::activations::Activation::disable_lut(std::string function_name) diff --git a/NAM/activations.h b/NAM/activations.h index 21bfb6e3..c077776c 100644 --- a/NAM/activations.h +++ b/NAM/activations.h @@ -3,6 +3,7 @@ #include #include #include // expf +#include #include #include #include @@ -92,6 +93,9 @@ inline float hardswish(float x) 
class Activation { public: + // Type alias for shared pointer to Activation + using Ptr = std::shared_ptr; + Activation() = default; virtual ~Activation() = default; virtual void apply(Eigen::MatrixXf& matrix) { apply(matrix.data(), matrix.rows() * matrix.cols()); } @@ -102,8 +106,8 @@ class Activation } virtual void apply(float* data, long size) {} - static Activation* get_activation(const std::string name); - static Activation* get_activation(const nlohmann::json& activation_config); + static Ptr get_activation(const std::string name); + static Ptr get_activation(const nlohmann::json& activation_config); static void enable_fast_tanh(); static void disable_fast_tanh(); static bool using_fast_tanh; @@ -111,7 +115,7 @@ class Activation static void disable_lut(std::string function_name); protected: - static std::unordered_map _activations; + static std::unordered_map _activations; }; // identity function activation diff --git a/NAM/convnet.h b/NAM/convnet.h index c4b28d81..b675a436 100644 --- a/NAM/convnet.h +++ b/NAM/convnet.h @@ -58,7 +58,7 @@ class ConvNetBlock private: BatchNorm batchnorm; bool _batchnorm = false; - activations::Activation* activation = nullptr; + activations::Activation::Ptr activation; Eigen::MatrixXf _output; // Output buffer owned by the block }; diff --git a/NAM/gating_activations.h b/NAM/gating_activations.h index dbe5b034..ad49fb8b 100644 --- a/NAM/gating_activations.h +++ b/NAM/gating_activations.h @@ -32,7 +32,7 @@ class GatingActivation * @param input_channels Number of input channels (default: 1) * @param gating_channels Number of gating channels (default: 1) */ - GatingActivation(activations::Activation* input_act, activations::Activation* gating_act, int input_channels = 1) + GatingActivation(activations::Activation::Ptr input_act, activations::Activation::Ptr gating_act, int input_channels = 1) : input_activation(input_act) , gating_activation(gating_act) , num_channels(input_channels) @@ -94,8 +94,8 @@ class GatingActivation int get_output_channels() const { return num_channels; } private: - activations::Activation* input_activation; - activations::Activation* gating_activation; + activations::Activation::Ptr input_activation; + activations::Activation::Ptr gating_activation; int num_channels; Eigen::MatrixXf input_buffer; }; @@ -109,7 +109,7 @@ class BlendingActivation * @param blend_act Activation function for blending channels * @param input_channels Number of input channels */ - BlendingActivation(activations::Activation* input_act, activations::Activation* blend_act, int input_channels = 1) + BlendingActivation(activations::Activation::Ptr input_act, activations::Activation::Ptr blend_act, int input_channels = 1) : input_activation(input_act) , blending_activation(blend_act) , num_channels(input_channels) @@ -169,8 +169,8 @@ class BlendingActivation int get_output_channels() const { return num_channels; } private: - activations::Activation* input_activation; - activations::Activation* blending_activation; + activations::Activation::Ptr input_activation; + activations::Activation::Ptr blending_activation; int num_channels; Eigen::MatrixXf input_buffer; }; diff --git a/NAM/wavenet.h b/NAM/wavenet.h index e559b223..65a7dee5 100644 --- a/NAM/wavenet.h +++ b/NAM/wavenet.h @@ -134,7 +134,7 @@ class _Layer // Output to head (skip connection: activated conv output) Eigen::MatrixXf _output_head; - activations::Activation* _activation; + activations::Activation::Ptr _activation; const GatingMode _gating_mode; const int _bottleneck; // Internal channel count 
(not doubled when gated) diff --git a/tools/test/test_activations.cpp b/tools/test/test_activations.cpp index 8f8b82ed..85fe15f4 100644 --- a/tools/test/test_activations.cpp +++ b/tools/test/test_activations.cpp @@ -41,7 +41,7 @@ class TestFastTanh { const std::string name = "Fasttanh"; auto a = nam::activations::Activation::get_activation(name); - _test_class(a); + _test_class(a.get()); } private: @@ -94,7 +94,7 @@ class TestLeakyReLU { const std::string name = "LeakyReLU"; auto a = nam::activations::Activation::get_activation(name); - _test_class(a); + _test_class(a.get()); } private: @@ -203,7 +203,7 @@ class TestJSONActivationParsing nlohmann::json str_activation = "ReLU"; auto act = nam::activations::Activation::get_activation(str_activation); assert(act != nullptr); - // Don't delete global activation objects + // shared_ptr handles memory management automatically } static void test_json_prelu_single_slope() @@ -214,7 +214,7 @@ class TestJSONActivationParsing }; auto act = nam::activations::Activation::get_activation(prelu_single); assert(act != nullptr); - delete act; // Delete dynamically allocated object + // shared_ptr handles memory management automatically } static void test_json_prelu_multi_slope() @@ -225,7 +225,7 @@ class TestJSONActivationParsing }; auto act = nam::activations::Activation::get_activation(prelu_multi); assert(act != nullptr); - delete act; // Delete dynamically allocated object + // shared_ptr handles memory management automatically } static void test_json_leaky_relu() @@ -236,7 +236,7 @@ class TestJSONActivationParsing }; auto act = nam::activations::Activation::get_activation(leaky_relu); assert(act != nullptr); - delete act; // Delete dynamically allocated object + // shared_ptr handles memory management automatically } static void test_json_leaky_hardtanh() @@ -250,7 +250,7 @@ class TestJSONActivationParsing }; auto act = nam::activations::Activation::get_activation(leaky_hardtanh); assert(act != nullptr); - delete act; // Delete dynamically allocated object + // shared_ptr handles memory management automatically } static void test_json_unknown_activation() @@ -266,7 +266,7 @@ class TestJSONActivationParsing { // Create test data with 4 channels and 3 time steps Eigen::MatrixXf test_data(4, 3); - test_data << + test_data << -1.0, -0.5, 0.0, -2.0, 0.0, 1.0, -0.5, 0.5, 1.5, @@ -304,8 +304,7 @@ class TestJSONActivationParsing } } } - - delete functional_act; + // shared_ptr handles memory management automatically } }; diff --git a/tools/test/test_blending_detailed.cpp b/tools/test/test_blending_detailed.cpp index f8da255d..b5c38db4 100644 --- a/tools/test/test_blending_detailed.cpp +++ b/tools/test/test_blending_detailed.cpp @@ -5,6 +5,7 @@ #include #include #include +#include #include "NAM/gating_activations.h" #include "NAM/activations.h" @@ -12,6 +13,13 @@ namespace test_blending_detailed { +// Helper to create a non-owning shared_ptr for stack-allocated activations in tests +template +nam::activations::Activation::Ptr make_test_ptr(T& activation) +{ + return nam::activations::Activation::Ptr(&activation, [](nam::activations::Activation*){}); +} + class TestBlendingDetailed { public: @@ -29,7 +37,7 @@ class TestBlendingDetailed // Test with default (linear) activations nam::activations::ActivationIdentity identity_act; nam::activations::ActivationIdentity identity_blend_act; - nam::gating_activations::BlendingActivation blending_act(&identity_act, &identity_blend_act, 2); + nam::gating_activations::BlendingActivation 
blending_act(make_test_ptr(identity_act), make_test_ptr(identity_blend_act), 2); blending_act.apply(input, output); // With linear activations: @@ -42,8 +50,8 @@ class TestBlendingDetailed assert(fabs(output(1, 1) - 4.0f) < 1e-6); // Test with sigmoid blending activation - nam::activations::Activation* sigmoid_act = nam::activations::Activation::get_activation(std::string("Sigmoid")); - nam::gating_activations::BlendingActivation blending_act_sigmoid(&identity_act, sigmoid_act, 2); + auto sigmoid_act = nam::activations::Activation::get_activation(std::string("Sigmoid")); + nam::gating_activations::BlendingActivation blending_act_sigmoid(make_test_ptr(identity_act), sigmoid_act, 2); Eigen::MatrixXf output_sigmoid(2, 2); blending_act_sigmoid.apply(input, output_sigmoid); @@ -80,7 +88,7 @@ class TestBlendingDetailed // Test with ReLU activation on input (which will change values < 0 to 0) nam::activations::ActivationReLU relu_act; nam::activations::ActivationIdentity identity_act; - nam::gating_activations::BlendingActivation blending_act(&relu_act, &identity_act, 1); + nam::gating_activations::BlendingActivation blending_act(make_test_ptr(relu_act), make_test_ptr(identity_act), 1); blending_act.apply(input, output); diff --git a/tools/test/test_gating_activations.cpp b/tools/test/test_gating_activations.cpp index 3f681cb6..90fd21a7 100644 --- a/tools/test/test_gating_activations.cpp +++ b/tools/test/test_gating_activations.cpp @@ -5,6 +5,7 @@ #include #include #include +#include #include "NAM/gating_activations.h" #include "NAM/activations.h" @@ -12,6 +13,13 @@ namespace test_gating_activations { +// Helper to create a non-owning shared_ptr for stack-allocated activations in tests +template +nam::activations::Activation::Ptr make_test_ptr(T& activation) +{ + return nam::activations::Activation::Ptr(&activation, [](nam::activations::Activation*){}); +} + class TestGatingActivation { public: @@ -26,7 +34,7 @@ class TestGatingActivation // Create gating activation with default activations (1 input channel, 1 gating channel) nam::activations::ActivationIdentity identity_act; nam::activations::ActivationSigmoid sigmoid_act; - nam::gating_activations::GatingActivation gating_act(&identity_act, &sigmoid_act, 1); + nam::gating_activations::GatingActivation gating_act(make_test_ptr(identity_act), make_test_ptr(sigmoid_act), 1); // Apply the activation gating_act.apply(input, output); @@ -52,7 +60,7 @@ class TestGatingActivation Eigen::MatrixXf output(1, 2); // Create gating activation with custom activations - nam::gating_activations::GatingActivation gating_act(&leaky_relu, &leaky_relu2, 1); + nam::gating_activations::GatingActivation gating_act(make_test_ptr(leaky_relu), make_test_ptr(leaky_relu2), 1); // Apply the activation gating_act.apply(input, output); @@ -85,7 +93,7 @@ class TestBlendingActivation // Create blending activation (1 input channel) nam::activations::ActivationIdentity identity_act; nam::activations::ActivationIdentity identity_blend_act; - nam::gating_activations::BlendingActivation blending_act(&identity_act, &identity_blend_act, 1); + nam::gating_activations::BlendingActivation blending_act(make_test_ptr(identity_act), make_test_ptr(identity_blend_act), 1); // Apply the activation blending_act.apply(input, output); @@ -107,7 +115,7 @@ class TestBlendingActivation // Test with default (linear) activations nam::activations::ActivationIdentity identity_act; nam::activations::ActivationIdentity identity_blend_act; - nam::gating_activations::BlendingActivation 
blending_act(&identity_act, &identity_blend_act, 1); + nam::gating_activations::BlendingActivation blending_act(make_test_ptr(identity_act), make_test_ptr(identity_blend_act), 1); blending_act.apply(input, output); // With linear activations, blending should be: @@ -118,8 +126,8 @@ class TestBlendingActivation assert(fabs(output(0, 1) - (-1.0f)) < 1e-6); // Test with sigmoid blending activation - nam::activations::Activation* sigmoid_act = nam::activations::Activation::get_activation(std::string("Sigmoid")); - nam::gating_activations::BlendingActivation blending_act2(&identity_act, sigmoid_act, 1); + auto sigmoid_act = nam::activations::Activation::get_activation(std::string("Sigmoid")); + nam::gating_activations::BlendingActivation blending_act2(make_test_ptr(identity_act), sigmoid_act, 1); blending_act2.apply(input, output); // With sigmoid blending, alpha values should be between 0 and 1 @@ -149,7 +157,7 @@ class TestBlendingActivation Eigen::MatrixXf output(1, 2); // Create blending activation with custom activations - nam::gating_activations::BlendingActivation blending_act(&leaky_relu, &leaky_relu2, 1); + nam::gating_activations::BlendingActivation blending_act(make_test_ptr(leaky_relu), make_test_ptr(leaky_relu2), 1); // Apply the activation blending_act.apply(input, output); @@ -167,7 +175,7 @@ class TestBlendingActivation nam::activations::ActivationIdentity identity_act; nam::activations::ActivationIdentity identity_blend_act; - nam::gating_activations::BlendingActivation blending_act(&identity_act, &identity_blend_act, 1); + nam::gating_activations::BlendingActivation blending_act(make_test_ptr(identity_act), make_test_ptr(identity_blend_act), 1); // This should trigger an assert and terminate the program // We can't easily test asserts in a unit test framework without special handling @@ -188,7 +196,7 @@ class TestBlendingActivation nam::activations::ActivationIdentity identity_act; nam::activations::ActivationIdentity identity_blend_act; - nam::gating_activations::BlendingActivation blending_act(&identity_act, &identity_blend_act, 1); + nam::gating_activations::BlendingActivation blending_act(make_test_ptr(identity_act), make_test_ptr(identity_blend_act), 1); blending_act.apply(input, output); assert(fabs(output(0, 0) - 0.0f) < 1e-6); diff --git a/tools/test/test_input_buffer_verification.cpp b/tools/test/test_input_buffer_verification.cpp index 01aa9e27..2f895652 100644 --- a/tools/test/test_input_buffer_verification.cpp +++ b/tools/test/test_input_buffer_verification.cpp @@ -5,6 +5,7 @@ #include #include #include +#include #include "NAM/gating_activations.h" #include "NAM/activations.h" @@ -12,6 +13,13 @@ namespace test_input_buffer_verification { +// Helper to create a non-owning shared_ptr for stack-allocated activations in tests +template +nam::activations::Activation::Ptr make_test_ptr(T& activation) +{ + return nam::activations::Activation::Ptr(&activation, [](nam::activations::Activation*){}); +} + class TestInputBufferVerification { public: @@ -26,7 +34,7 @@ class TestInputBufferVerification // Use ReLU activation which will set negative values to 0 nam::activations::ActivationReLU relu_act; nam::activations::ActivationIdentity identity_act; - nam::gating_activations::BlendingActivation blending_act(&relu_act, &identity_act, 1); + nam::gating_activations::BlendingActivation blending_act(make_test_ptr(relu_act), make_test_ptr(identity_act), 1); // Apply the activation blending_act.apply(input, output); @@ -53,7 +61,7 @@ class TestInputBufferVerification // Use 
LeakyReLU with slope 0.1 nam::activations::ActivationLeakyReLU leaky_relu(0.1f); nam::activations::ActivationIdentity identity_act; - nam::gating_activations::BlendingActivation blending_act(&leaky_relu, &identity_act, 1); + nam::gating_activations::BlendingActivation blending_act(make_test_ptr(leaky_relu), make_test_ptr(identity_act), 1); blending_act.apply(input, output); diff --git a/tools/test/test_wavenet_gating_compatibility.cpp b/tools/test/test_wavenet_gating_compatibility.cpp index f3ad8e65..6e443bb7 100644 --- a/tools/test/test_wavenet_gating_compatibility.cpp +++ b/tools/test/test_wavenet_gating_compatibility.cpp @@ -5,6 +5,7 @@ #include #include #include +#include #include "NAM/gating_activations.h" #include "NAM/activations.h" @@ -12,6 +13,13 @@ namespace test_wavenet_gating_compatibility { +// Helper to create a non-owning shared_ptr for stack-allocated activations in tests +template +nam::activations::Activation::Ptr make_test_ptr(T& activation) +{ + return nam::activations::Activation::Ptr(&activation, [](nam::activations::Activation*){}); +} + class TestWavenetGatingCompatibility { public: @@ -35,7 +43,7 @@ class TestWavenetGatingCompatibility // Wavenet uses: input activation (default/linear) and sigmoid for gating nam::activations::ActivationIdentity identity_act; nam::activations::ActivationSigmoid sigmoid_act; - nam::gating_activations::GatingActivation gating_act(&identity_act, &sigmoid_act, channels); + nam::gating_activations::GatingActivation gating_act(make_test_ptr(identity_act), make_test_ptr(sigmoid_act), channels); // Apply the activation gating_act.apply(input, output); @@ -84,7 +92,7 @@ class TestWavenetGatingCompatibility nam::activations::ActivationIdentity identity_act; nam::activations::ActivationSigmoid sigmoid_act; - nam::gating_activations::GatingActivation gating_act(&identity_act, &sigmoid_act, channels); + nam::gating_activations::GatingActivation gating_act(make_test_ptr(identity_act), make_test_ptr(sigmoid_act), channels); gating_act.apply(input, output); // Verify each column was processed independently @@ -120,7 +128,7 @@ class TestWavenetGatingCompatibility nam::activations::ActivationIdentity identity_act; nam::activations::ActivationSigmoid sigmoid_act; - nam::gating_activations::GatingActivation gating_act(&identity_act, &sigmoid_act, channels); + nam::gating_activations::GatingActivation gating_act(make_test_ptr(identity_act), make_test_ptr(sigmoid_act), channels); // This should not crash or produce incorrect results due to memory contiguity issues gating_act.apply(input, output); @@ -155,7 +163,7 @@ class TestWavenetGatingCompatibility nam::activations::ActivationIdentity identity_act; nam::activations::ActivationSigmoid sigmoid_act; - nam::gating_activations::GatingActivation gating_act(&identity_act, &sigmoid_act, channels); + nam::gating_activations::GatingActivation gating_act(make_test_ptr(identity_act), make_test_ptr(sigmoid_act), channels); gating_act.apply(input, output); // Verify dimensions From 9c64e51f26e82fb3d95cf737518899d2f5b4b00e Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jo=C3=A3o=20Felipe=20Santos?= Date: Tue, 20 Jan 2026 16:18:59 -0800 Subject: [PATCH 5/6] Updated get_activation to take an ActivationConfig instead of a JSON, and created a method to convert from string or JSON to ActivationConfig so parsing happens sooner. 
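
For illustration only (hypothetical caller code, not part of this diff): the
JSON is converted to a typed ActivationConfig once, at the model-loading
boundary, and only the typed config is passed further down:

    #include "NAM/activations.h"

    nam::activations::Activation::Ptr make_prelu()
    {
      // Example config; the plain string forms are also accepted by from_json.
      nlohmann::json j = {{"type", "PReLU"}, {"negative_slopes", {0.1f, 0.2f}}};
      nam::activations::ActivationConfig cfg =
        nam::activations::ActivationConfig::from_json(j);
      return nam::activations::Activation::get_activation(cfg);
    }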
--- NAM/activations.cpp | 138 +++++++++++++---- NAM/activations.h | 45 +++++- NAM/convnet.cpp | 12 +- NAM/convnet.h | 7 +- NAM/wavenet.cpp | 7 +- NAM/wavenet.h | 28 ++-- tools/run_tests.cpp | 12 ++ tools/test/test_activations.cpp | 146 ++++++++++++++++++ tools/test/test_convnet.cpp | 14 +- .../test_condition_processing.cpp | 2 +- tools/test/test_wavenet/test_full.cpp | 10 +- tools/test/test_wavenet/test_head1x1.cpp | 10 +- tools/test/test_wavenet/test_layer.cpp | 15 +- tools/test/test_wavenet/test_layer_array.cpp | 6 +- .../test/test_wavenet/test_real_time_safe.cpp | 12 +- .../test/test_wavenet_configurable_gating.cpp | 10 +- 16 files changed, 378 insertions(+), 96 deletions(-) diff --git a/NAM/activations.cpp b/NAM/activations.cpp index b084c554..c9eeb958 100644 --- a/NAM/activations.cpp +++ b/NAM/activations.cpp @@ -45,58 +45,128 @@ nam::activations::Activation::Ptr nam::activations::Activation::get_activation(c return _activations[name]; } -nam::activations::Activation::Ptr nam::activations::Activation::get_activation(const nlohmann::json& activation_config) +// ActivationConfig implementation +nam::activations::ActivationConfig nam::activations::ActivationConfig::simple(ActivationType t) { - // If it's a string, use the existing string-based lookup - if (activation_config.is_string()) + ActivationConfig config; + config.type = t; + return config; +} + +nam::activations::ActivationConfig nam::activations::ActivationConfig::from_json(const nlohmann::json& j) +{ + ActivationConfig config; + + // Map from string to ActivationType + static const std::unordered_map type_map = { + {"Tanh", ActivationType::Tanh}, + {"Hardtanh", ActivationType::Hardtanh}, + {"Fasttanh", ActivationType::Fasttanh}, + {"ReLU", ActivationType::ReLU}, + {"LeakyReLU", ActivationType::LeakyReLU}, + {"PReLU", ActivationType::PReLU}, + {"Sigmoid", ActivationType::Sigmoid}, + {"SiLU", ActivationType::SiLU}, + {"Hardswish", ActivationType::Hardswish}, + {"LeakyHardtanh", ActivationType::LeakyHardtanh}, + {"LeakyHardTanh", ActivationType::LeakyHardtanh} // Support both casings + }; + + // If it's a string, simple lookup + if (j.is_string()) { - std::string name = activation_config.get(); - return get_activation(name); + std::string name = j.get(); + auto it = type_map.find(name); + if (it == type_map.end()) + { + throw std::runtime_error("Unknown activation type: " + name); + } + config.type = it->second; + return config; } - // If it's an object, parse the activation type and parameters - if (activation_config.is_object()) + // If it's an object, parse type and parameters + if (j.is_object()) { - std::string type = activation_config["type"].get(); + std::string type_str = j["type"].get(); + auto it = type_map.find(type_str); + if (it == type_map.end()) + { + throw std::runtime_error("Unknown activation type: " + type_str); + } + config.type = it->second; - // Handle different activation types with parameters - // These return owning shared_ptr (will be deleted when last reference goes out of scope) - if (type == "PReLU") + // Parse optional parameters based on activation type + if (config.type == ActivationType::PReLU) { - if (activation_config.find("negative_slope") != activation_config.end()) + if (j.find("negative_slope") != j.end()) { - float negative_slope = activation_config["negative_slope"].get(); - return std::make_shared(negative_slope); + config.negative_slope = j["negative_slope"].get(); } - else if (activation_config.find("negative_slopes") != activation_config.end()) + else if (j.find("negative_slopes") != 
j.end()) { - std::vector negative_slopes = activation_config["negative_slopes"].get>(); - return std::make_shared(negative_slopes); + config.negative_slopes = j["negative_slopes"].get>(); } - // If no parameters provided, use default - return std::make_shared(0.01f); - } - else if (type == "LeakyReLU") - { - float negative_slope = activation_config.value("negative_slope", 0.01f); - return std::make_shared(negative_slope); } - else if (type == "LeakyHardTanh") + else if (config.type == ActivationType::LeakyReLU) { - float min_val = activation_config.value("min_val", -1.0f); - float max_val = activation_config.value("max_val", 1.0f); - float min_slope = activation_config.value("min_slope", 0.01f); - float max_slope = activation_config.value("max_slope", 0.01f); - return std::make_shared(min_val, max_val, min_slope, max_slope); + config.negative_slope = j.value("negative_slope", 0.01f); } - else + else if (config.type == ActivationType::LeakyHardtanh) { - // For other activation types without parameters, use the default string-based lookup - return get_activation(type); + config.min_val = j.value("min_val", -1.0f); + config.max_val = j.value("max_val", 1.0f); + config.min_slope = j.value("min_slope", 0.01f); + config.max_slope = j.value("max_slope", 0.01f); } + + return config; } - return nullptr; + throw std::runtime_error("Invalid activation config: expected string or object"); +} + +nam::activations::Activation::Ptr nam::activations::Activation::get_activation(const ActivationConfig& config) +{ + switch (config.type) + { + case ActivationType::Tanh: + return _activations["Tanh"]; + case ActivationType::Hardtanh: + return _activations["Hardtanh"]; + case ActivationType::Fasttanh: + return _activations["Fasttanh"]; + case ActivationType::ReLU: + return _activations["ReLU"]; + case ActivationType::Sigmoid: + return _activations["Sigmoid"]; + case ActivationType::SiLU: + return _activations["SiLU"]; + case ActivationType::Hardswish: + return _activations["Hardswish"]; + case ActivationType::LeakyReLU: + if (config.negative_slope.has_value()) + { + return std::make_shared(config.negative_slope.value()); + } + return _activations["LeakyReLU"]; + case ActivationType::PReLU: + if (config.negative_slopes.has_value()) + { + return std::make_shared(config.negative_slopes.value()); + } + else if (config.negative_slope.has_value()) + { + return std::make_shared(config.negative_slope.value()); + } + return std::make_shared(0.01f); + case ActivationType::LeakyHardtanh: + return std::make_shared( + config.min_val.value_or(-1.0f), config.max_val.value_or(1.0f), config.min_slope.value_or(0.01f), + config.max_slope.value_or(0.01f)); + default: + return nullptr; + } } void nam::activations::Activation::enable_fast_tanh() diff --git a/NAM/activations.h b/NAM/activations.h index c077776c..977b4586 100644 --- a/NAM/activations.h +++ b/NAM/activations.h @@ -1,18 +1,58 @@ #pragma once #include -#include #include // expf +#include #include +#include +#include #include +#include + #include -#include + #include "json.hpp" namespace nam { namespace activations { + +// Forward declaration +class Activation; + +// Strongly-typed activation type enum +enum class ActivationType +{ + Tanh, + Hardtanh, + Fasttanh, + ReLU, + LeakyReLU, + PReLU, + Sigmoid, + SiLU, // aka Swish + Hardswish, + LeakyHardtanh +}; + +// Strongly-typed activation configuration +struct ActivationConfig +{ + ActivationType type; + + // Optional parameters (used by specific activation types) + std::optional negative_slope; // LeakyReLU, PReLU (single) 
+ std::optional> negative_slopes; // PReLU (per-channel) + std::optional min_val; // LeakyHardtanh + std::optional max_val; // LeakyHardtanh + std::optional min_slope; // LeakyHardtanh + std::optional max_slope; // LeakyHardtanh + + // Convenience constructors + static ActivationConfig simple(ActivationType t); + static ActivationConfig from_json(const nlohmann::json& j); +}; inline float relu(float x) { return x > 0.0f ? x : 0.0f; @@ -107,6 +147,7 @@ class Activation virtual void apply(float* data, long size) {} static Ptr get_activation(const std::string name); + static Ptr get_activation(const ActivationConfig& config); static Ptr get_activation(const nlohmann::json& activation_config); static void enable_fast_tanh(); static void disable_fast_tanh(); diff --git a/NAM/convnet.cpp b/NAM/convnet.cpp index a85e6c44..fc7c151f 100644 --- a/NAM/convnet.cpp +++ b/NAM/convnet.cpp @@ -48,7 +48,8 @@ void nam::convnet::BatchNorm::process_(Eigen::MatrixXf& x, const long i_start, c } void nam::convnet::ConvNetBlock::set_weights_(const int in_channels, const int out_channels, const int _dilation, - const bool batchnorm, const nlohmann::json activation_config, const int groups, + const bool batchnorm, + const activations::ActivationConfig& activation_config, const int groups, std::vector::iterator& weights) { this->_batchnorm = batchnorm; @@ -173,8 +174,9 @@ void nam::convnet::_Head::process_(const Eigen::MatrixXf& input, Eigen::MatrixXf } nam::convnet::ConvNet::ConvNet(const int in_channels, const int out_channels, const int channels, - const std::vector& dilations, const bool batchnorm, const nlohmann::json activation_config, - std::vector& weights, const double expected_sample_rate, const int groups) + const std::vector& dilations, const bool batchnorm, + const activations::ActivationConfig& activation_config, std::vector& weights, + const double expected_sample_rate, const int groups) : Buffer(in_channels, out_channels, *std::max_element(dilations.begin(), dilations.end()), expected_sample_rate) { this->_verify_weights(channels, dilations, batchnorm, weights.size()); @@ -327,7 +329,9 @@ std::unique_ptr nam::convnet::Factory(const nlohmann::json& config, st const int channels = config["channels"]; const std::vector dilations = config["dilations"]; const bool batchnorm = config["batchnorm"]; - const nlohmann::json activation_config = config["activation"]; + // Parse JSON into typed ActivationConfig at model loading boundary + const activations::ActivationConfig activation_config = + activations::ActivationConfig::from_json(config["activation"]); const int groups = config.value("groups", 1); // defaults to 1 // Default to 1 channel in/out for backward compatibility const int in_channels = config.value("in_channels", 1); diff --git a/NAM/convnet.h b/NAM/convnet.h index b675a436..1765311b 100644 --- a/NAM/convnet.h +++ b/NAM/convnet.h @@ -9,8 +9,10 @@ #include +#include "activations.h" #include "conv1d.h" #include "dsp.h" +#include "json.hpp" namespace nam { @@ -44,7 +46,8 @@ class ConvNetBlock public: ConvNetBlock() {}; void set_weights_(const int in_channels, const int out_channels, const int _dilation, const bool batchnorm, - const nlohmann::json activation_config, const int groups, std::vector::iterator& weights); + const activations::ActivationConfig& activation_config, const int groups, + std::vector::iterator& weights); void SetMaxBufferSize(const int maxBufferSize); // Process input matrix directly (new API, similar to WaveNet) void Process(const Eigen::MatrixXf& input, const int num_frames); @@ 
-78,7 +81,7 @@ class ConvNet : public Buffer { public: ConvNet(const int in_channels, const int out_channels, const int channels, const std::vector& dilations, - const bool batchnorm, const nlohmann::json activation_config, std::vector& weights, + const bool batchnorm, const activations::ActivationConfig& activation_config, std::vector& weights, const double expected_sample_rate = -1.0, const int groups = 1); ~ConvNet() = default; diff --git a/NAM/wavenet.cpp b/NAM/wavenet.cpp index 121a5572..58887dd2 100644 --- a/NAM/wavenet.cpp +++ b/NAM/wavenet.cpp @@ -113,7 +113,8 @@ void nam::wavenet::_Layer::Process(const Eigen::MatrixXf& input, const Eigen::Ma nam::wavenet::_LayerArray::_LayerArray(const int input_size, const int condition_size, const int head_size, const int channels, const int bottleneck, const int kernel_size, - const std::vector& dilations, const nlohmann::json activation_config, + const std::vector& dilations, + const activations::ActivationConfig& activation_config, const GatingMode gating_mode, const bool head_bias, const int groups_input, const int groups_1x1, const Head1x1Params& head1x1_params, const std::string& secondary_activation) @@ -477,7 +478,9 @@ std::unique_ptr nam::wavenet::Factory(const nlohmann::json& config, st const int head_size = layer_config["head_size"]; const int kernel_size = layer_config["kernel_size"]; const auto dilations = layer_config["dilations"]; - const nlohmann::json activation_config = layer_config["activation"]; + // Parse JSON into typed ActivationConfig at model loading boundary + const activations::ActivationConfig activation_config = + activations::ActivationConfig::from_json(layer_config["activation"]); // Parse gating mode - support both old "gated" boolean and new "gating_mode" string GatingMode gating_mode = GatingMode::NONE; std::string secondary_activation; diff --git a/NAM/wavenet.h b/NAM/wavenet.h index 65a7dee5..93403d79 100644 --- a/NAM/wavenet.h +++ b/NAM/wavenet.h @@ -1,16 +1,17 @@ #pragma once -#include -#include #include #include +#include +#include -#include "json.hpp" #include -#include "dsp.h" +#include "activations.h" #include "conv1d.h" +#include "dsp.h" #include "gating_activations.h" +#include "json.hpp" namespace nam { @@ -48,14 +49,14 @@ struct Head1x1Params class _Layer { public: - // New constructor with GatingMode enum and configurable activations + // Constructor with GatingMode enum and typed ActivationConfig _Layer(const int condition_size, const int channels, const int bottleneck, const int kernel_size, const int dilation, - const nlohmann::json activation_config, const GatingMode gating_mode, const int groups_input, const int groups_1x1, - const Head1x1Params& head1x1_params, const std::string& secondary_activation) + const activations::ActivationConfig& activation_config, const GatingMode gating_mode, const int groups_input, + const int groups_1x1, const Head1x1Params& head1x1_params, const std::string& secondary_activation) : _conv(channels, (gating_mode != GatingMode::NONE) ? 2 * bottleneck : bottleneck, kernel_size, true, dilation) , _input_mixin(condition_size, (gating_mode != GatingMode::NONE) ? 
2 * bottleneck : bottleneck, false) , _1x1(bottleneck, channels, groups_1x1) - , _activation(activations::Activation::get_activation(activation_config)) // now supports activations with parameters + , _activation(activations::Activation::get_activation(activation_config)) , _gating_mode(gating_mode) , _bottleneck(bottleneck) { @@ -148,7 +149,7 @@ class LayerArrayParams public: LayerArrayParams(const int input_size_, const int condition_size_, const int head_size_, const int channels_, const int bottleneck_, const int kernel_size_, const std::vector&& dilations_, - const nlohmann::json activation_, const GatingMode gating_mode_, const bool head_bias_, + const activations::ActivationConfig& activation_, const GatingMode gating_mode_, const bool head_bias_, const int groups_input, const int groups_1x1_, const Head1x1Params& head1x1_params_, const std::string& secondary_activation_) : input_size(input_size_) @@ -175,7 +176,7 @@ class LayerArrayParams const int bottleneck; const int kernel_size; std::vector dilations; - const nlohmann::json activation_config; + const activations::ActivationConfig activation_config; const GatingMode gating_mode; const bool head_bias; const int groups_input; @@ -188,11 +189,12 @@ class LayerArrayParams class _LayerArray { public: - // New constructor with GatingMode enum and configurable activations + // Constructor with GatingMode enum and typed ActivationConfig _LayerArray(const int input_size, const int condition_size, const int head_size, const int channels, const int bottleneck, const int kernel_size, const std::vector& dilations, - const nlohmann::json activation_config, const GatingMode gating_mode, const bool head_bias, const int groups_input, - const int groups_1x1, const Head1x1Params& head1x1_params, const std::string& secondary_activation); + const activations::ActivationConfig& activation_config, const GatingMode gating_mode, const bool head_bias, + const int groups_input, const int groups_1x1, const Head1x1Params& head1x1_params, + const std::string& secondary_activation); void SetMaxBufferSize(const int maxBufferSize); diff --git a/tools/run_tests.cpp b/tools/run_tests.cpp index 860709da..f3d2bb42 100644 --- a/tools/run_tests.cpp +++ b/tools/run_tests.cpp @@ -53,6 +53,18 @@ int main() test_activations::TestJSONActivationParsing::test_json_unknown_activation(); test_activations::TestJSONActivationParsing::test_functional_verification(); + // Typed ActivationConfig tests + test_activations::TestTypedActivationConfig::test_simple_config(); + test_activations::TestTypedActivationConfig::test_all_simple_types(); + test_activations::TestTypedActivationConfig::test_leaky_relu_config(); + test_activations::TestTypedActivationConfig::test_prelu_single_slope_config(); + test_activations::TestTypedActivationConfig::test_prelu_multi_slope_config(); + test_activations::TestTypedActivationConfig::test_leaky_hardtanh_config(); + test_activations::TestTypedActivationConfig::test_from_json_string(); + test_activations::TestTypedActivationConfig::test_from_json_object(); + test_activations::TestTypedActivationConfig::test_from_json_prelu_multi(); + test_activations::TestTypedActivationConfig::test_unknown_activation_throws(); + test_dsp::test_construct(); test_dsp::test_get_input_level(); test_dsp::test_get_output_level(); diff --git a/tools/test/test_activations.cpp b/tools/test/test_activations.cpp index 85fe15f4..4d607e02 100644 --- a/tools/test/test_activations.cpp +++ b/tools/test/test_activations.cpp @@ -308,4 +308,150 @@ class TestJSONActivationParsing } }; 
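For orientation before the new test class below: a minimal sketch of how the two accepted shapes of a model's "activation" field travel through the typed path added in this series. The JSON literals, the function name, and the include paths here are illustrative only; the sketch assumes NAM's activations.h and the bundled json.hpp are reachable on the include path.

#include "NAM/activations.h"
#include "json.hpp"

void sketch_typed_activation_lookup()
{
  // String form, e.g. "activation": "ReLU" in the model config
  nlohmann::json as_string = "ReLU";
  auto relu_cfg = nam::activations::ActivationConfig::from_json(as_string);
  auto relu = nam::activations::Activation::get_activation(relu_cfg);

  // Object form with parameters, e.g. "activation": {"type": "LeakyReLU", "negative_slope": 0.2}
  nlohmann::json as_object = {{"type", "LeakyReLU"}, {"negative_slope", 0.2f}};
  auto leaky_cfg = nam::activations::ActivationConfig::from_json(as_object);
  auto leaky = nam::activations::Activation::get_activation(leaky_cfg);
}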
+class TestTypedActivationConfig
+{
+public:
+  static void test_simple_config()
+  {
+    // Test simple() factory method
+    auto config = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU);
+    assert(config.type == nam::activations::ActivationType::ReLU);
+    assert(!config.negative_slope.has_value());
+    assert(!config.negative_slopes.has_value());
+
+    auto act = nam::activations::Activation::get_activation(config);
+    assert(act != nullptr);
+  }
+
+  static void test_all_simple_types()
+  {
+    // Test that all simple activation types work
+    std::vector<nam::activations::ActivationType> types = {
+      nam::activations::ActivationType::Tanh,     nam::activations::ActivationType::Hardtanh,
+      nam::activations::ActivationType::Fasttanh, nam::activations::ActivationType::ReLU,
+      nam::activations::ActivationType::Sigmoid,  nam::activations::ActivationType::SiLU,
+      nam::activations::ActivationType::Hardswish};
+
+    for (auto type : types)
+    {
+      auto config = nam::activations::ActivationConfig::simple(type);
+      auto act = nam::activations::Activation::get_activation(config);
+      assert(act != nullptr);
+    }
+  }
+
+  static void test_leaky_relu_config()
+  {
+    // Test LeakyReLU with custom negative slope
+    nam::activations::ActivationConfig config;
+    config.type = nam::activations::ActivationType::LeakyReLU;
+    config.negative_slope = 0.2f;
+
+    auto act = nam::activations::Activation::get_activation(config);
+    assert(act != nullptr);
+
+    // Verify the behavior
+    std::vector<float> data = {-1.0f, 0.0f, 1.0f};
+    act->apply(data.data(), (long)data.size());
+    assert(fabs(data[0] - (-0.2f)) < 1e-6); // -1.0 * 0.2 = -0.2
+    assert(fabs(data[1] - 0.0f) < 1e-6);
+    assert(fabs(data[2] - 1.0f) < 1e-6);
+  }
+
+  static void test_prelu_single_slope_config()
+  {
+    // Test PReLU with single slope
+    nam::activations::ActivationConfig config;
+    config.type = nam::activations::ActivationType::PReLU;
+    config.negative_slope = 0.25f;
+
+    auto act = nam::activations::Activation::get_activation(config);
+    assert(act != nullptr);
+  }
+
+  static void test_prelu_multi_slope_config()
+  {
+    // Test PReLU with multiple slopes (per-channel)
+    nam::activations::ActivationConfig config;
+    config.type = nam::activations::ActivationType::PReLU;
+    config.negative_slopes = std::vector<float>{0.1f, 0.2f, 0.3f};
+
+    auto act = nam::activations::Activation::get_activation(config);
+    assert(act != nullptr);
+
+    // Verify per-channel behavior
+    Eigen::MatrixXf data(3, 2);
+    data << -1.0f, 1.0f, -1.0f, 1.0f, -1.0f, 1.0f;
+
+    act->apply(data);
+
+    // Channel 0 (slope 0.1): -1.0 * 0.1 = -0.1
+    assert(fabs(data(0, 0) - (-0.1f)) < 1e-6);
+    // Channel 1 (slope 0.2): -1.0 * 0.2 = -0.2
+    assert(fabs(data(1, 0) - (-0.2f)) < 1e-6);
+    // Channel 2 (slope 0.3): -1.0 * 0.3 = -0.3
+    assert(fabs(data(2, 0) - (-0.3f)) < 1e-6);
+    // Positive values unchanged
+    assert(fabs(data(0, 1) - 1.0f) < 1e-6);
+  }
+
+  static void test_leaky_hardtanh_config()
+  {
+    // Test LeakyHardtanh with custom parameters
+    nam::activations::ActivationConfig config;
+    config.type = nam::activations::ActivationType::LeakyHardtanh;
+    config.min_val = -2.0f;
+    config.max_val = 2.0f;
+    config.min_slope = 0.1f;
+    config.max_slope = 0.1f;
+
+    auto act = nam::activations::Activation::get_activation(config);
+    assert(act != nullptr);
+  }
+
+  static void test_from_json_string()
+  {
+    // Test from_json with string input
+    nlohmann::json j = "ReLU";
+    auto config = nam::activations::ActivationConfig::from_json(j);
+    assert(config.type == nam::activations::ActivationType::ReLU);
+  }
+
+  static void test_from_json_object()
+  {
+    //
Test from_json with object input + nlohmann::json j = {{"type", "LeakyReLU"}, {"negative_slope", 0.15f}}; + auto config = nam::activations::ActivationConfig::from_json(j); + assert(config.type == nam::activations::ActivationType::LeakyReLU); + assert(config.negative_slope.has_value()); + assert(fabs(config.negative_slope.value() - 0.15f) < 1e-6); + } + + static void test_from_json_prelu_multi() + { + // Test from_json with PReLU multi-slope + nlohmann::json j = {{"type", "PReLU"}, {"negative_slopes", {0.1f, 0.2f, 0.3f, 0.4f}}}; + auto config = nam::activations::ActivationConfig::from_json(j); + assert(config.type == nam::activations::ActivationType::PReLU); + assert(config.negative_slopes.has_value()); + assert(config.negative_slopes.value().size() == 4); + } + + static void test_unknown_activation_throws() + { + // Test that unknown activation type throws + nlohmann::json j = "UnknownActivation"; + bool threw = false; + try + { + nam::activations::ActivationConfig::from_json(j); + } + catch (const std::runtime_error& e) + { + threw = true; + } + assert(threw); + } +}; + }; // namespace test_activations diff --git a/tools/test/test_convnet.cpp b/tools/test/test_convnet.cpp index 56bd5ec0..0f554824 100644 --- a/tools/test/test_convnet.cpp +++ b/tools/test/test_convnet.cpp @@ -18,7 +18,7 @@ void test_convnet_basic() const int channels = 2; const std::vector dilations{1, 2}; const bool batchnorm = false; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const double expected_sample_rate = 48000.0; // Calculate weights needed: @@ -65,7 +65,7 @@ void test_convnet_batchnorm() const int channels = 1; const std::vector dilations{1}; const bool batchnorm = true; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const double expected_sample_rate = 48000.0; // Calculate weights needed: @@ -110,7 +110,7 @@ void test_convnet_multiple_blocks() const int channels = 2; const std::vector dilations{1, 2, 4}; const bool batchnorm = false; - const std::string activation = "Tanh"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::Tanh); const double expected_sample_rate = 48000.0; // Calculate weights needed: @@ -158,7 +158,7 @@ void test_convnet_zero_input() const int channels = 1; const std::vector dilations{1}; const bool batchnorm = false; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const double expected_sample_rate = 48000.0; std::vector weights; @@ -195,7 +195,7 @@ void test_convnet_different_buffer_sizes() const int channels = 1; const std::vector dilations{1}; const bool batchnorm = false; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const double expected_sample_rate = 48000.0; std::vector weights; @@ -235,7 +235,7 @@ void test_convnet_prewarm() const int channels = 2; const std::vector dilations{1, 2, 4}; const bool batchnorm = false; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const double expected_sample_rate = 48000.0; std::vector weights; @@ -278,7 +278,7 @@ void test_convnet_multiple_calls() const int channels = 1; const std::vector 
dilations{1}; const bool batchnorm = false; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const double expected_sample_rate = 48000.0; std::vector weights; diff --git a/tools/test/test_wavenet/test_condition_processing.cpp b/tools/test/test_wavenet/test_condition_processing.cpp index c4b5b1af..4a4c9027 100644 --- a/tools/test/test_wavenet/test_condition_processing.cpp +++ b/tools/test/test_wavenet/test_condition_processing.cpp @@ -27,7 +27,7 @@ std::unique_ptr create_simple_wavenet( const int bottleneck = channels; const int kernel_size = 1; std::vector dilations{1}; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const bool head_bias = false; const bool with_head = false; diff --git a/tools/test/test_wavenet/test_full.cpp b/tools/test/test_wavenet/test_full.cpp index ee498c18..6be8787c 100644 --- a/tools/test/test_wavenet/test_full.cpp +++ b/tools/test/test_wavenet/test_full.cpp @@ -22,7 +22,7 @@ void test_wavenet_model() const int bottleneck = channels; const int kernel_size = 1; std::vector dilations{1}; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const bool head_bias = false; const float head_scale = 1.0f; @@ -83,7 +83,7 @@ void test_wavenet_multiple_arrays() const int channels = 1; const int kernel_size = 1; std::vector dilations{1}; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const bool head_bias = false; const float head_scale = 0.5f; @@ -146,7 +146,7 @@ void test_wavenet_zero_input() const int bottleneck = channels; const int kernel_size = 1; std::vector dilations{1}; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const bool head_bias = false; const float head_scale = 1.0f; @@ -195,7 +195,7 @@ void test_wavenet_different_buffer_sizes() const int bottleneck = channels; const int kernel_size = 1; std::vector dilations{1}; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const bool head_bias = false; const float head_scale = 1.0f; @@ -247,7 +247,7 @@ void test_wavenet_prewarm() const int bottleneck = channels; const int kernel_size = 3; std::vector dilations{1, 2, 4}; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const bool head_bias = false; const float head_scale = 1.0f; diff --git a/tools/test/test_wavenet/test_head1x1.cpp b/tools/test/test_wavenet/test_head1x1.cpp index 18ff70b1..5714a6b1 100644 --- a/tools/test/test_wavenet/test_head1x1.cpp +++ b/tools/test/test_wavenet/test_head1x1.cpp @@ -21,7 +21,7 @@ 
void test_head1x1_inactive() const int bottleneck = channels; const int kernelSize = 1; const int dilation = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const int groups_input = 1; const int groups_1x1 = 1; @@ -87,7 +87,7 @@ void test_head1x1_active() const int bottleneck = channels; const int kernelSize = 1; const int dilation = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const int groups_input = 1; const int groups_1x1 = 1; @@ -160,7 +160,7 @@ void test_head1x1_gated() const int bottleneck = channels; const int kernelSize = 1; const int dilation = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::GATED; const int groups_input = 1; const int groups_1x1 = 1; @@ -250,7 +250,7 @@ void test_head1x1_groups() const int bottleneck = channels; const int kernelSize = 1; const int dilation = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const int groups_input = 1; const int groups_1x1 = 1; @@ -330,7 +330,7 @@ void test_head1x1_different_out_channels() const int bottleneck = channels; const int kernelSize = 1; const int dilation = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const int groups_input = 1; const int groups_1x1 = 1; diff --git a/tools/test/test_wavenet/test_layer.cpp b/tools/test/test_wavenet/test_layer.cpp index ae432748..e3494011 100644 --- a/tools/test/test_wavenet/test_layer.cpp +++ b/tools/test/test_wavenet/test_layer.cpp @@ -21,7 +21,7 @@ void test_gated() const int bottleneck = channels; const int kernelSize = 1; const int dilation = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::GATED; const int groups_input = 1; const int groups_1x1 = 1; @@ -97,7 +97,7 @@ void test_layer_getters() const int bottleneck = channels; const int kernelSize = 3; const int dilation = 2; - const std::string activation = "Tanh"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::Tanh); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const int groups_input = 1; const int groups_1x1 = 1; @@ -119,7 +119,7 @@ void test_non_gated_layer() const int bottleneck = channels; const int kernelSize = 1; const int dilation = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const int groups_input = 1; const int groups_1x1 = 1; @@ -193,7 +193,8 @@ void test_layer_activations() const int 
groups_input = 1; const int groups_1x1 = 1; nam::wavenet::Head1x1Params head1x1_params(false, channels, 1); - auto layer = nam::wavenet::_Layer(conditionSize, channels, bottleneck, kernelSize, dilation, "Tanh", gating_mode, + auto tanh_config = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::Tanh); + auto layer = nam::wavenet::_Layer(conditionSize, channels, bottleneck, kernelSize, dilation, tanh_config, gating_mode, groups_input, groups_1x1, head1x1_params, ""); std::vector weights{1.0f, 0.0f, 1.0f, 1.0f, 0.0f}; auto it = weights.begin(); @@ -224,7 +225,7 @@ void test_layer_multichannel() const int bottleneck = channels; const int kernelSize = 1; const int dilation = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const int groups_input = 1; const int groups_1x1 = 1; @@ -294,7 +295,7 @@ void test_layer_bottleneck() const int bottleneck = 2; // bottleneck < channels const int kernelSize = 1; const int dilation = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const int groups_input = 1; const int groups_1x1 = 1; @@ -371,7 +372,7 @@ void test_layer_bottleneck_gated() const int bottleneck = 2; // bottleneck < channels const int kernelSize = 1; const int dilation = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::GATED; // gated doubles the internal bottleneck channels const int groups_input = 1; diff --git a/tools/test/test_wavenet/test_layer_array.cpp b/tools/test/test_wavenet/test_layer_array.cpp index d5916a2f..ba7cb391 100644 --- a/tools/test/test_wavenet/test_layer_array.cpp +++ b/tools/test/test_wavenet/test_layer_array.cpp @@ -22,7 +22,7 @@ void test_layer_array_basic() const int bottleneck = channels; const int kernel_size = 1; std::vector dilations{1, 2}; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const bool head_bias = false; const int groups = 1; @@ -81,7 +81,7 @@ void test_layer_array_receptive_field() const int bottleneck = channels; const int kernel_size = 3; std::vector dilations{1, 2, 4}; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const bool head_bias = false; const int groups = 1; @@ -112,7 +112,7 @@ void test_layer_array_with_head_input() const int bottleneck = channels; const int kernel_size = 1; std::vector dilations{1}; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const bool head_bias = false; const int groups = 1; diff --git a/tools/test/test_wavenet/test_real_time_safe.cpp b/tools/test/test_wavenet/test_real_time_safe.cpp index cc04150d..b89e9dd4 100644 --- 
a/tools/test/test_wavenet/test_real_time_safe.cpp +++ b/tools/test/test_wavenet/test_real_time_safe.cpp @@ -432,7 +432,7 @@ void test_layer_process_realtime_safe() const int bottleneck = channels; const int kernel_size = 1; const int dilation = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const int groups_input = 1; const int groups_1x1 = 1; @@ -488,7 +488,7 @@ void test_layer_bottleneck_process_realtime_safe() const int bottleneck = 2; // bottleneck < channels const int kernel_size = 1; const int dilation = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const int groups_input = 1; const int groups_1x1 = 1; @@ -574,7 +574,7 @@ void test_layer_grouped_process_realtime_safe() const int bottleneck = channels; const int kernel_size = 2; const int dilation = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const int groups_input = 2; // groups_input > 1 const int groups_1x1 = 2; // 1x1 is also grouped @@ -685,7 +685,7 @@ void test_layer_array_process_realtime_safe() const int bottleneck = channels; const int kernel_size = 1; std::vector dilations{1}; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const bool head_bias = false; const int groups = 1; @@ -749,7 +749,7 @@ void test_process_realtime_safe() const int channels = 1; const int kernel_size = 1; std::vector dilations{1}; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const bool head_bias = false; const float head_scale = 1.0f; @@ -827,7 +827,7 @@ void test_process_3in_2out_realtime_safe() const int channels = 4; // internal channels const int bottleneck = 2; // bottleneck (will be used for head) const int kernel_size = 1; - const std::string activation = "ReLU"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::ReLU); const nam::wavenet::GatingMode gating_mode = nam::wavenet::GatingMode::NONE; const bool head_bias = false; const float head_scale = 1.0f; diff --git a/tools/test/test_wavenet_configurable_gating.cpp b/tools/test/test_wavenet_configurable_gating.cpp index a98326c3..2c0d13b4 100644 --- a/tools/test/test_wavenet_configurable_gating.cpp +++ b/tools/test/test_wavenet_configurable_gating.cpp @@ -21,7 +21,7 @@ class TestConfigurableGating const int bottleneck = 2; const int kernelSize = 3; const int dilation = 1; - const std::string activation = "Tanh"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::Tanh); const int groups_input = 1; const int groups_1x1 = 1; nam::wavenet::Head1x1Params head1x1_params(false, channels, 1); @@ -48,7 +48,7 @@ class TestConfigurableGating const int bottleneck = 2; const int kernelSize = 3; const int 
dilation = 1; - const std::string activation = "Tanh"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::Tanh); const int groups_input = 1; const int groups_1x1 = 1; nam::wavenet::Head1x1Params head1x1_params(false, channels, 1); @@ -78,7 +78,7 @@ class TestConfigurableGating const int bottleneck = 2; const int kernel_size = 3; const std::vector dilations = {1, 2}; - const std::string activation = "Tanh"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::Tanh); const bool head_bias = false; const int groups_input = 1; const int groups_1x1 = 1; @@ -111,7 +111,7 @@ class TestConfigurableGating const int bottleneck = 2; const int kernel_size = 3; const std::vector dilations = {1}; - const std::string activation = "Tanh"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::Tanh); const bool head_bias = false; const int groups_input = 1; const int groups_1x1 = 1; @@ -174,7 +174,7 @@ class TestConfigurableGating const int bottleneck = 2; const int kernelSize = 3; const int dilation = 1; - const std::string activation = "Tanh"; + const auto activation = nam::activations::ActivationConfig::simple(nam::activations::ActivationType::Tanh); const int groups_input = 1; const int groups_1x1 = 1; nam::wavenet::Head1x1Params head1x1_params(false, channels, 1); From 87ea5760fd2b16ed06b57c7fc2161d1e66ccec4c Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jo=C3=A3o=20Felipe=20Santos?= Date: Tue, 20 Jan 2026 16:23:40 -0800 Subject: [PATCH 6/6] Deleted tests for a function that was removed from the codebase --- tools/run_tests.cpp | 9 --- tools/test/test_activations.cpp | 113 -------------------------------- 2 files changed, 122 deletions(-) diff --git a/tools/run_tests.cpp b/tools/run_tests.cpp index f3d2bb42..879417a9 100644 --- a/tools/run_tests.cpp +++ b/tools/run_tests.cpp @@ -44,15 +44,6 @@ int main() // This is enforced by an assert so it doesn't need to be tested // test_activations::TestPReLU::test_wrong_number_of_channels(); - // JSON activation parsing tests - test_activations::TestJSONActivationParsing::test_string_activation(); - test_activations::TestJSONActivationParsing::test_json_prelu_single_slope(); - test_activations::TestJSONActivationParsing::test_json_prelu_multi_slope(); - test_activations::TestJSONActivationParsing::test_json_leaky_relu(); - test_activations::TestJSONActivationParsing::test_json_leaky_hardtanh(); - test_activations::TestJSONActivationParsing::test_json_unknown_activation(); - test_activations::TestJSONActivationParsing::test_functional_verification(); - // Typed ActivationConfig tests test_activations::TestTypedActivationConfig::test_simple_config(); test_activations::TestTypedActivationConfig::test_all_simple_types(); diff --git a/tools/test/test_activations.cpp b/tools/test/test_activations.cpp index 4d607e02..abbdd23c 100644 --- a/tools/test/test_activations.cpp +++ b/tools/test/test_activations.cpp @@ -195,119 +195,6 @@ class TestPReLU } }; -class TestJSONActivationParsing -{ -public: - static void test_string_activation() - { - nlohmann::json str_activation = "ReLU"; - auto act = nam::activations::Activation::get_activation(str_activation); - assert(act != nullptr); - // shared_ptr handles memory management automatically - } - - static void test_json_prelu_single_slope() - { - nlohmann::json prelu_single = { - {"type", "PReLU"}, - {"negative_slope", 0.25f} - }; - auto act = 
nam::activations::Activation::get_activation(prelu_single); - assert(act != nullptr); - // shared_ptr handles memory management automatically - } - - static void test_json_prelu_multi_slope() - { - nlohmann::json prelu_multi = { - {"type", "PReLU"}, - {"negative_slopes", {0.1f, 0.2f, 0.3f, 0.4f}} - }; - auto act = nam::activations::Activation::get_activation(prelu_multi); - assert(act != nullptr); - // shared_ptr handles memory management automatically - } - - static void test_json_leaky_relu() - { - nlohmann::json leaky_relu = { - {"type", "LeakyReLU"}, - {"negative_slope", 0.15f} - }; - auto act = nam::activations::Activation::get_activation(leaky_relu); - assert(act != nullptr); - // shared_ptr handles memory management automatically - } - - static void test_json_leaky_hardtanh() - { - nlohmann::json leaky_hardtanh = { - {"type", "LeakyHardTanh"}, - {"min_val", -2.0f}, - {"max_val", 2.0f}, - {"min_slope", 0.1f}, - {"max_slope", 0.1f} - }; - auto act = nam::activations::Activation::get_activation(leaky_hardtanh); - assert(act != nullptr); - // shared_ptr handles memory management automatically - } - - static void test_json_unknown_activation() - { - nlohmann::json unknown_activation = { - {"type", "UnknownActivation"} - }; - auto act = nam::activations::Activation::get_activation(unknown_activation); - assert(act == nullptr); // Should fail for unknown activation type - } - - static void test_functional_verification() - { - // Create test data with 4 channels and 3 time steps - Eigen::MatrixXf test_data(4, 3); - test_data << - -1.0, -0.5, 0.0, - -2.0, 0.0, 1.0, - -0.5, 0.5, 1.5, - -1.5, -1.0, 0.5; - - // Test PReLU with multiple slopes - nlohmann::json functional_prelu = { - {"type", "PReLU"}, - {"negative_slopes", {0.1f, 0.2f, 0.3f, 0.4f}} - }; - auto functional_act = nam::activations::Activation::get_activation(functional_prelu); - assert(functional_act != nullptr); - - Eigen::MatrixXf result = test_data; - functional_act->apply(result); - - // Verify specific values - // Channel 0, slope 0.1: -1.0 * 0.1 = -0.1 - assert(fabs(result(0, 0) - (-0.1f)) < 1e-6); - - // Channel 1, slope 0.2: -2.0 * 0.2 = -0.4 - assert(fabs(result(1, 0) - (-0.4f)) < 1e-6); - - // Channel 2, slope 0.3: -0.5 * 0.3 = -0.15 - assert(fabs(result(2, 0) - (-0.15f)) < 1e-6); - - // Channel 3, slope 0.4: -1.5 * 0.4 = -0.6 - assert(fabs(result(3, 0) - (-0.6f)) < 1e-6); - - // Positive values should be unchanged - for (int i = 0; i < result.rows(); i++) { - for (int j = 0; j < result.cols(); j++) { - if (test_data(i, j) >= 0) { - assert(fabs(result(i, j) - test_data(i, j)) < 1e-6); - } - } - } - // shared_ptr handles memory management automatically - } -}; - class TestTypedActivationConfig { public:
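The functional coverage that the deleted TestJSONActivationParsing class provided is preserved by the typed tests retained above; for reference, the per-channel PReLU case reduces to roughly the following under the new API (a sketch only — the slope values and include paths are illustrative, not taken from the patch):

#include <Eigen/Dense>
#include "NAM/activations.h"
#include "json.hpp"

void sketch_prelu_per_channel()
{
  nlohmann::json j = {{"type", "PReLU"}, {"negative_slopes", {0.1f, 0.2f, 0.3f, 0.4f}}};
  auto cfg = nam::activations::ActivationConfig::from_json(j);
  auto act = nam::activations::Activation::get_activation(cfg);

  // Matrix is organized as (channels, time_steps): row i is scaled by
  // negative_slopes[i] wherever the input is negative.
  Eigen::MatrixXf x(4, 1);
  x << -1.0f, -2.0f, -0.5f, -1.5f;
  act->apply(x); // expected: -0.1, -0.4, -0.15, -0.6
}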