fastmachinelearning · vloncar · Sep 11, 2024 · Aug 28, 2024 · Aug 28, 2024 · Sep 11, 2024
diff --git a/hls4ml/converters/pytorch/core.py b/hls4ml/converters/pytorch/core.py
@@ -41,7 +41,6 @@ def parse_linear_layer(operation, layer_name, input_names, input_shapes, node, c
 @pytorch_handler(*activation_layers)
 def parse_activation_layer(operation, layer_name, input_names, input_shapes, node, class_object, data_reader, config):
     layer = {}
-
     layer['class_name'] = operation
     layer['activation'] = layer['class_name']
     layer['name'] = layer_name
@@ -50,7 +49,9 @@ def parse_activation_layer(operation, layer_name, input_names, input_shapes, nod
     # if layer['class_name'] != 'Activation':
     #    layer['activation'] = layer['class_name']
     if node.op == 'call_module':
-        if layer['class_name'] == 'ReLU' or layer['class_name'] == 'Sigmoid':
+        if layer['class_name'] in ['ReLU', 'Sigmoid', 'Tanh']:
+            if layer['class_name'] == 'Tanh':
+                layer['activation'] = 'tanh'
             layer['class_name'] = 'Activation'
         if layer['class_name'] == 'LeakyReLU':
             layer['activ_param'] = class_object.negative_slope
@@ -68,7 +69,9 @@ def parse_activation_layer(operation, layer_name, input_names, input_shapes, nod
         if hasattr(node, 'dim'):
             layer['axis'] = class_object.dim
     else:
-        if layer['class_name'] == 'ReLU' or layer['class_name'] == 'Sigmoid':
+        if layer['class_name'] in ['ReLU', 'Sigmoid', 'Tanh']:
+            if layer['class_name'] == 'Tanh':
+                layer['activation'] = 'tanh'
             layer['class_name'] = 'Activation'
         if layer['class_name'] == 'LeakyReLU':
             layer['activ_param'] = node.kwargs['negative_slope']

diff --git a/hls4ml/converters/pytorch_to_hls.py b/hls4ml/converters/pytorch_to_hls.py
@@ -84,6 +84,7 @@ def decorator(function):
 # map names of operations between toch.nn and torch.nn.functionals
 layer_name_map = {
     'relu': 'ReLU',
+    'tanh': 'Tanh',
     'leaky_relu': 'LeakyReLU',
     'elu': 'ELU',
     'prelu': 'PReLU',

diff --git a/test/pytest/test_pytorch_api.py b/test/pytest/test_pytorch_api.py
@@ -64,6 +64,7 @@ def test_linear(backend, io_type):
     "activation_function",
     [
         nn.ReLU(),
+        nn.Tanh(),
         nn.LeakyReLU(negative_slope=1.0),
         nn.ELU(alpha=1.0),
         nn.PReLU(init=0.25),
@@ -102,7 +103,7 @@ def test_activations(activation_function, backend, io_type):
 
     assert nNodes - 1 == len(hls_model.get_layers())
 
-    if activation_function.__class__.__name__ == 'ReLU' or activation_function.__class__.__name__ == 'Sigmoid':
+    if activation_function.__class__.__name__ in ['ReLU', 'Sigmoid', 'Tanh']:
         assert list(hls_model.get_layers())[2].attributes['class_name'] == 'Activation'
     elif activation_function.__class__.__name__ == 'Threshold':
         assert list(hls_model.get_layers())[2].attributes['class_name'] == 'ThresholdedReLU'
@@ -118,6 +119,14 @@ def forward(self, x):
         return nn.functional.relu(x)
 
 
+class TanHModel(nn.Module):  # test fixture: applies tanh via nn.functional rather than an nn.Tanh module
+    def __init__(self):
+        super().__init__()  # only runs the base nn.Module initializer; nothing else is set up here
+
+    def forward(self, x):
+        return nn.functional.tanh(x)  # functional-API call on the input; result is returned unchanged
+
+
 class LeakyReLuModel(nn.Module):
     def __init__(self):
         super().__init__()
@@ -154,6 +163,7 @@ def forward(self, x):
     "activation_function",
     [
         ReLuModel(),
+        TanHModel(),
         LeakyReLuModel(),
         EluModel(),
         SigmoidModel(),
@@ -172,7 +182,7 @@ def test_activation_functionals(activation_function, backend, io_type):
 
     config = config_from_pytorch_model(model, (1,))
     fn_name = activation_function.__class__.__name__
-    output_dir = str(test_root_path / f'hls4mlprj_pytorch_api_activations_functional_relu_{backend}_{io_type}_{fn_name}')
+    output_dir = str(test_root_path / f'hls4mlprj_pytorch_api_activations_functional_{fn_name}_{backend}_{io_type}')
     hls_model = convert_from_pytorch_model(model, hls_config=config, output_dir=output_dir, backend=backend, io_type=io_type)
     hls_model.compile()