From 53e9ece80e38ff44f0cfc235dd219c7f30ae87b0 Mon Sep 17 00:00:00 2001 From: Nemer Chiedde Date: Mon, 27 Jun 2022 14:16:03 +0200 Subject: [PATCH 1/3] Softsign LUT optimization --- .../firmware/nnet_utils/nnet_activation.h | 23 +++++++++++++++---- hls4ml/writer/quartus_writer.py | 9 +++++--- 2 files changed, 24 insertions(+), 8 deletions(-) diff --git a/hls4ml/templates/quartus/firmware/nnet_utils/nnet_activation.h b/hls4ml/templates/quartus/firmware/nnet_utils/nnet_activation.h index 1eb9524fe4..9d6ff81ff3 100755 --- a/hls4ml/templates/quartus/firmware/nnet_utils/nnet_activation.h +++ b/hls4ml/templates/quartus/firmware/nnet_utils/nnet_activation.h @@ -271,17 +271,30 @@ void softplus(data_T data[CONFIG_T::n_in], res_T res[CONFIG_T::n_in]) template void softsign(data_T data[CONFIG_T::n_in], res_T res[CONFIG_T::n_in]) { + static const int MAX_VALUE=8; // Initialize the lookup table #include "activation_tables/softsign_table.tb" // Index into the lookup table based on data #pragma unroll for (int ii=0; ii data_round = (data[ii]*CONFIG_T::table_size/16).to_int(); - ac_int<16> index = data_round + 8*CONFIG_T::table_size/16; - if (index < 0) index = 0; - if (index > CONFIG_T::table_size-1) index = CONFIG_T::table_size-1; - res[ii] = (res_T) softsign_table[index]; + data_T temp hls_register; + res_T temp2 hls_register; + if(data[ii] < 0 ){ + temp = -data[ii]; + } + else{ + temp = data[ii]; + } + ac_int<16> index = (temp*CONFIG_T::table_size/MAX_VALUE).to_int(); + if (temp > MAX_VALUE) index = CONFIG_T::table_size-1; + temp2 = (res_T) softsign_table[index]; + if(data[ii] < 0 ){ + res[ii] = -temp2; + } + else{ + res[ii] = temp2; + } } } diff --git a/hls4ml/writer/quartus_writer.py b/hls4ml/writer/quartus_writer.py index 9a49422885..9a66092737 100644 --- a/hls4ml/writer/quartus_writer.py +++ b/hls4ml/writer/quartus_writer.py @@ -555,6 +555,8 @@ def __write_softplus_table(self, model, path): h_file.close() def __write_softsign_table(self, model, path): + MAX_VALUE = 8 + 
MIN_VALUE = 0 table_name = 'softsign_table' table_size = self.__get_table_size(model, 'softsign') @@ -563,10 +565,11 @@ def __write_softsign_table(self, model, path): sep = '' for i in range(table_size): - in_val = 2*8.0*(i-float(table_size)/2.0)/float(table_size) + in_val = i * (MAX_VALUE-MIN_VALUE)/float(table_size) + (MAX_VALUE-MIN_VALUE)/(float(table_size)*2) + MIN_VALUE real_val = in_val / (np.fabs(in_val) + 1.) - h_file.write(sep + str(real_val)) - sep = ", " + if(real_val >= 0): + h_file.write(sep + str(real_val)) + sep = ", " h_file.write('};\n') h_file.write('\n#endif\n') From 49c3864d5cdb7ce85e82e212451a31db5740ecfb Mon Sep 17 00:00:00 2001 From: Nemer Chiedde Date: Thu, 7 Jul 2022 15:13:49 +0200 Subject: [PATCH 2/3] Test file: Activation softsign --- test/pytest/test_softsign.py | 58 ++++++++++++++++++++++++++++++++++++ 1 file changed, 58 insertions(+) create mode 100644 test/pytest/test_softsign.py diff --git a/test/pytest/test_softsign.py b/test/pytest/test_softsign.py new file mode 100644 index 0000000000..783a1eb339 --- /dev/null +++ b/test/pytest/test_softsign.py @@ -0,0 +1,58 @@ +import hls4ml +import tensorflow as tf +import numpy as np +import pytest +from sklearn.metrics import accuracy_score +from pathlib import Path + +test_root_path = Path(__file__).parent + +def flat_distribution(shape): + return np.random.rand(*shape) + + +def high_accuracy_distribution(shape): + '''Start with a flat distribution, then pick a random member of each row to amplify''' + x = np.random.rand(*shape) + imax = np.random.randint(0, shape[1], size=shape[0]) + x[:, imax] *= 10 + return x + + +@pytest.fixture() +def generate_data(function, input_shape): + return function((1000, *input_shape)) + + +# TODO: include latency strategy with flat_distribution when it can be made to pass +@pytest.mark.parametrize('backend,strategy,function,input_shape,io_type', [ + ('Quartus', 'resource', flat_distribution, (8,), 'io_parallel'), + ('Quartus', 'resource', 
high_accuracy_distribution, (8,), 'io_parallel') ]) def test_softsign(backend, strategy, generate_data, input_shape, io_type): X = generate_data model = tf.keras.models.Sequential() model.add(tf.keras.layers.Activation(input_shape=input_shape, activation='softsign', name='softsign')) model.compile() f_type = 'ac_fixed<18,8,true,AC_RND,AC_SAT>' if backend == 'Quartus' else 'ap_fixed<18,8,AP_RND,AP_SAT>' cfg = hls4ml.utils.config_from_keras_model(model, granularity='name') cfg['LayerName']['softsign']['Strategy'] = strategy cfg['LayerName']['softsign']['inv_table_t'] = f_type cfg['LayerName']['softsign']['exp_table_t'] = f_type odir = str(test_root_path / 'hls4mlprj_softsign_{}'.format(strategy)) hls_model = hls4ml.converters.convert_from_keras_model(model, hls_config=cfg, io_type=io_type, output_dir=odir, backend=backend) hls_model.compile() y_keras = model.predict(X) y_hls4ml = hls_model.predict(X).reshape(y_keras.shape) acc_hls4ml = accuracy_score(np.argmax(y_keras, axis=-1).ravel(), np.argmax(y_hls4ml, axis=-1).ravel()) print('Accuracy hls4ml relative to keras: {}'.format(acc_hls4ml)) assert acc_hls4ml >= 0.7 From 37696fa447bc8716921c17165cc00bc6e3b440e5 Mon Sep 17 00:00:00 2001 From: Nemer Chiedde Date: Tue, 16 Aug 2022 11:20:54 +0200 Subject: [PATCH 3/3] Changing minimal accuracy to 0.98 and adding new tests using Vivado and Quartus --- test/pytest/test_softsign.py | 18 +++++++----------- 1 file changed, 7 insertions(+), 11 deletions(-) diff --git a/test/pytest/test_softsign.py b/test/pytest/test_softsign.py index 783a1eb339..3444f0b4a1 100644 --- a/test/pytest/test_softsign.py +++ b/test/pytest/test_softsign.py @@ -11,14 +11,6 @@ def flat_distribution(shape): return np.random.rand(*shape) -def high_accuracy_distribution(shape): - '''Start with a flat distribution, then pick a random member of each row to amplify''' - x = np.random.rand(*shape) - imax = np.random.randint(0, shape[1], size=shape[0]) - x[:, 
imax] *= 10 - return x - - @pytest.fixture() def generate_data(function, input_shape): return function((1000, *input_shape)) @@ -26,8 +18,12 @@ def generate_data(function, input_shape): # TODO: include latency strategy with flat_distribution when it can be made to pass @pytest.mark.parametrize('backend,strategy,function,input_shape,io_type', [ - ('Quartus', 'resource', flat_distribution, (8,), 'io_parallel'), - ('Quartus', 'resource', high_accuracy_distribution, (8,), 'io_parallel') + ('Vivado', 'stable', flat_distribution, (4,), 'io_parallel'), + ('Quartus', 'stable', flat_distribution, (4,), 'io_parallel'), + + # io_stream available only for the Vivado backend + ('Vivado', 'stable', flat_distribution, (4,), 'io_stream'), + ('Vivado', 'stable', flat_distribution, (4, 4, 3), 'io_stream') ]) def test_softsign(backend, strategy, generate_data, input_shape, io_type): X = generate_data @@ -53,6 +49,6 @@ def test_softsign(backend, strategy, generate_data, input_shape, io_type): print('Accuracy hls4ml relative to keras: {}'.format(acc_hls4ml)) - assert acc_hls4ml >= 0.7 + assert acc_hls4ml >= 0.98