From f34238d92d85a392924488b5449f54d17c9d6396 Mon Sep 17 00:00:00 2001
From: Nick Fraser
Date: Mon, 10 May 2021 15:09:58 +0100
Subject: [PATCH 01/64] [nn] Added ability to gather activation statistics
 during LUT inference.

---
 src/logicnets/nn.py | 49 ++++++++++++++++++++++++++++++++++++++++-----
 1 file changed, 44 insertions(+), 5 deletions(-)

diff --git a/src/logicnets/nn.py b/src/logicnets/nn.py
index 6effa5cc9..6eb8ab2f9 100644
--- a/src/logicnets/nn.py
+++ b/src/logicnets/nn.py
@@ -44,10 +44,34 @@ def generate_truth_tables(model: nn.Module, verbose: bool = False) -> None:
     model.training = training
 
 # TODO: Create a container module which performs this function.
-def lut_inference(model: nn.Module) -> None:
+def lut_inference(model: nn.Module, track_used_luts: bool = False) -> None:
     for name, module in model.named_modules():
         if type(module) == SparseLinearNeq:
-            module.lut_inference()
+            module.lut_inference(track_used_luts=track_used_luts)
+
+# TODO: Create a container module which performs this function.
+def save_luts(model: nn.Module, path: str) -> None:
+    lut_dict = {}
+    for name, module in model.named_modules():
+        if type(module) == SparseLinearNeq:
+            luts = module.neuron_truth_tables
+            indices = list(map(lambda x: x[0], luts))
+            tt_inputs = list(map(lambda x: x[1], luts))
+            tt_input_bin_str = list(map(lambda x: list(map(lambda y: list(map(lambda z: module.input_quant.get_bin_str(z), y)), x)), tt_inputs))
+            tt_float_outputs = list(map(lambda x: x[2], luts))
+            tt_bin_outputs = list(map(lambda x: x[3], luts))
+            tt_outputs_bin_str = list(map(lambda x: list(map(lambda y: module.output_quant.get_bin_str(y), x)), tt_bin_outputs))
+            histogram = module.used_luts_histogram
+            lut_dict[name] = {
+                'indices': indices,
+                'input_state_space': tt_inputs,
+                'input_state_space_bin_str': tt_input_bin_str,
+                'output_state_space_float': tt_float_outputs,
+                'output_state_space_bin': tt_bin_outputs,
+                'output_state_space_bin_str': tt_outputs_bin_str,
+                'histogram': histogram,
+            }
+    torch.save(lut_dict, path)
 
 # TODO: Create a container module which performs this function.
 def neq_inference(model: nn.Module) -> None:
@@ -111,6 +135,8 @@ def __init__(self, in_features: int, out_features: int, input_quant, output_quan
         self.neuron_truth_tables = None
         self.apply_input_quant = apply_input_quant
         self.apply_output_quant = apply_output_quant
+        self.track_used_luts = False
+        self.used_luts_histogram = None
 
     # TODO: Move the verilog string templates to elsewhere
     # TODO: Move this to another class
@@ -158,8 +184,9 @@ def gen_neuron_verilog(self, index, module_name):
             lut_string += f"\t\t\t{int(cat_input_bitwidth)}'b{entry_str}: M1r = {int(output_bitwidth)}'b{res_str};\n"
         return generate_lut_verilog(module_name, int(cat_input_bitwidth), int(output_bitwidth), lut_string)
 
-    def lut_inference(self):
+    def lut_inference(self, track_used_luts=False):
         self.is_lut_inference = True
+        self.track_used_luts = track_used_luts
         self.input_quant.bin_output()
         self.output_quant.bin_output()
 
@@ -169,7 +196,7 @@ def neq_inference(self):
         self.output_quant.float_output()
 
     # TODO: This function might be a useful utility outside of this class..
- def table_lookup(self, connected_input: Tensor, input_perm_matrix: Tensor, bin_output_states: Tensor) -> Tensor: + def table_lookup(self, connected_input: Tensor, input_perm_matrix: Tensor, bin_output_states: Tensor, neuron_lut_histogram=None) -> Tensor: fan_in_size = connected_input.shape[1] ci_bcast = connected_input.unsqueeze(2) # Reshape to B x Fan-in x 1 pm_bcast = input_perm_matrix.t().unsqueeze(0) # Reshape to 1 x Fan-in x InputStates @@ -178,17 +205,29 @@ def table_lookup(self, connected_input: Tensor, input_perm_matrix: Tensor, bin_o if not (matches == torch.ones_like(matches,dtype=matches.dtype)).all(): raise Exception(f"One or more vectors in the input is not in the possible input state space") indices = torch.argmax(eq.type(torch.int64),dim=1) + if self.track_used_luts: + # TODO: vectorize this loop + for i in indices: + neuron_lut_histogram[i] += 1 return bin_output_states[indices] def lut_forward(self, x: Tensor) -> Tensor: if self.apply_input_quant: x = self.input_quant(x) # Use this to fetch the bin output of the input, if the input isn't already in binary format + # TODO: Put this in a child class(?) + # TODO: Add support for non-uniform fan-in + if self.track_used_luts: + if self.used_luts_histogram is None: + self.used_luts_histogram = self.out_features * [None] + for i in range(self.out_features): + self.used_luts_histogram[i] = torch.zeros(size=(len(self.neuron_truth_tables[i][2]),), dtype=torch.int64) y = torch.zeros((x.shape[0],self.out_features)) # Perform table lookup for each neuron output for i in range(self.out_features): indices, input_perm_matrix, float_output_states, bin_output_states = self.neuron_truth_tables[i] + neuron_lut_histogram = self.used_luts_histogram[i] if self.track_used_luts else None connected_input = x[:,indices] - y[:,i] = self.table_lookup(connected_input, input_perm_matrix, bin_output_states) + y[:,i] = self.table_lookup(connected_input, input_perm_matrix, bin_output_states, neuron_lut_histogram=neuron_lut_histogram) return y def forward(self, x: Tensor) -> Tensor: From aa622a4bde728f5c0407f031cdff5a3334e1dfc8 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Mon, 10 May 2021 18:05:33 +0100 Subject: [PATCH 02/64] [jsc] Added script to save LUTs and activation statistics. --- examples/jet_substructure/dump_luts.py | 122 +++++++++++++++++++++++++ 1 file changed, 122 insertions(+) create mode 100644 examples/jet_substructure/dump_luts.py diff --git a/examples/jet_substructure/dump_luts.py b/examples/jet_substructure/dump_luts.py new file mode 100644 index 000000000..c244ee1ba --- /dev/null +++ b/examples/jet_substructure/dump_luts.py @@ -0,0 +1,122 @@ +# Copyright (C) 2021 Xilinx, Inc +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+
+import os
+from argparse import ArgumentParser
+
+import torch
+from torch.utils.data import DataLoader
+
+from logicnets.nn import generate_truth_tables, \
+                         lut_inference, \
+                         save_luts, \
+                         module_list_to_verilog_module
+
+from train import configs, model_config, dataset_config, other_options, test
+from dataset import JetSubstructureDataset
+from models import JetSubstructureNeqModel, JetSubstructureLutModel
+from logicnets.synthesis import synthesize_and_get_resource_counts
+
+if __name__ == "__main__":
+    parser = ArgumentParser(description="Synthesize convert a PyTorch trained model into verilog")
+    parser.add_argument('--arch', type=str, choices=configs.keys(), default="jsc-s",
+        help="Specify the neural network model to use (default: %(default)s)")
+    parser.add_argument('--batch-size', type=int, default=None, metavar='N',
+        help="Batch size for evaluation (default: %(default)s)")
+    parser.add_argument('--input-bitwidth', type=int, default=None,
+        help="Bitwidth to use at the input (default: %(default)s)")
+    parser.add_argument('--hidden-bitwidth', type=int, default=None,
+        help="Bitwidth to use for activations in hidden layers (default: %(default)s)")
+    parser.add_argument('--output-bitwidth', type=int, default=None,
+        help="Bitwidth to use at the output (default: %(default)s)")
+    parser.add_argument('--input-fanin', type=int, default=None,
+        help="Fanin to use at the input (default: %(default)s)")
+    parser.add_argument('--hidden-fanin', type=int, default=None,
+        help="Fanin to use for the hidden layers (default: %(default)s)")
+    parser.add_argument('--output-fanin', type=int, default=None,
+        help="Fanin to use at the output (default: %(default)s)")
+    parser.add_argument('--hidden-layers', nargs='+', type=int, default=None,
+        help="A list of hidden layer neuron sizes (default: %(default)s)")
+    parser.add_argument('--dataset-file', type=str, default='data/processed-pythia82-lhc13-all-pt1-50k-r1_h022_e0175_t220_nonu_truth.z',
+        help="The file to use as the dataset input (default: %(default)s)")
+    parser.add_argument('--dataset-config', type=str, default='config/yaml_IP_OP_config.yml',
+        help="The file to use to configure the input dataset (default: %(default)s)")
+    parser.add_argument('--log-dir', type=str, default='./log',
+        help="A location to store the log output of the training run and the output model (default: %(default)s)")
+    parser.add_argument('--checkpoint', type=str, required=True,
+        help="The checkpoint file which contains the model weights")
+    args = parser.parse_args()
+    defaults = configs[args.arch]
+    options = vars(args)
+    del options['arch']
+    config = {}
+    for k in options.keys():
+        config[k] = options[k] if options[k] is not None else defaults[k] # Override defaults, if specified.
+
+    if not os.path.exists(config['log_dir']):
+        os.makedirs(config['log_dir'])
+
+    # Split up configuration options to be more understandable
+    model_cfg = {}
+    for k in model_config.keys():
+        model_cfg[k] = config[k]
+    dataset_cfg = {}
+    for k in dataset_config.keys():
+        dataset_cfg[k] = config[k]
+    options_cfg = {}
+    for k in other_options.keys():
+        if k == 'cuda':
+            continue
+        options_cfg[k] = config[k]
+
+    # Fetch the test set
+    dataset = {}
+    dataset['train'] = JetSubstructureDataset(dataset_cfg['dataset_file'], dataset_cfg['dataset_config'], split="train")
+    train_loader = DataLoader(dataset["train"], batch_size=config['batch_size'], shuffle=False)
+
+    # Instantiate the PyTorch model
+    x, y = dataset['train'][0]
+    dataset_length = len(dataset['train'])
+    model_cfg['input_length'] = len(x)
+    model_cfg['output_length'] = len(y)
+    model = JetSubstructureNeqModel(model_cfg)
+
+    # Load the model weights
+    checkpoint = torch.load(options_cfg['checkpoint'], map_location='cpu')
+    model.load_state_dict(checkpoint['model_dict'])
+
+    # Test the PyTorch model
+    print("Running inference of baseline model on training set (%d examples)..." % (dataset_length))
+    model.eval()
+    baseline_accuracy = test(model, train_loader, cuda=False)
+    print("Baseline accuracy: %f" % (baseline_accuracy))
+
+    # Instantiate LUT-based model
+    lut_model = JetSubstructureLutModel(model_cfg)
+    lut_model.load_state_dict(checkpoint['model_dict'])
+
+    # Generate the truth tables in the LUT module
+    print("Converting NEQs to LUTs...")
+    generate_truth_tables(lut_model, verbose=True)
+
+    # Test the LUT-based model
+    print("Running inference of LUT-based model on training set (%d examples)..." % (dataset_length))
+    lut_inference(lut_model, track_used_luts=True)
+    lut_model.eval()
+    lut_accuracy = test(lut_model, train_loader, cuda=False)
+    print("LUT-Based Model accuracy: %f" % (lut_accuracy))
+    print("Saving LUTs to %s... " % (options_cfg["log_dir"] + "/luts.pth"))
+    save_luts(lut_model, options_cfg["log_dir"] + "/luts.pth")
+    print("Done!")
+

From 4d75911d263fda879c98587779f1cb3925e07965 Mon Sep 17 00:00:00 2001
From: Nick Fraser
Date: Tue, 18 May 2021 10:43:32 +0100
Subject: [PATCH 03/64] [nn] Added extra parameter to specify a cutoff for
 whether a TT entry should be included in the output verilog.

---
 src/logicnets/nn.py | 19 +++++++++++++------
 1 file changed, 13 insertions(+), 6 deletions(-)

diff --git a/src/logicnets/nn.py b/src/logicnets/nn.py
index 6eb8ab2f9..27529e11a 100644
--- a/src/logicnets/nn.py
+++ b/src/logicnets/nn.py
@@ -73,6 +73,12 @@ def save_luts(model: nn.Module, path: str) -> None:
             }
     torch.save(lut_dict, path)
 
+# TODO: Create a container module which performs this function.
+def load_histograms(model: nn.Module, lut_dict: dict) -> None:
+    for name, module in model.named_modules():
+        if name in lut_dict.keys():
+            module.used_luts_histogram = lut_dict[name]['histogram']
+
 # TODO: Create a container module which performs this function.
 def neq_inference(model: nn.Module) -> None:
     for name, module in model.named_modules():
         if type(module) == SparseLinearNeq:
             module.neq_inference()
 
 # TODO: Should this go in with the other verilog functions?
# TODO: Support non-linear topologies -def module_list_to_verilog_module(module_list: nn.ModuleList, module_name: str, output_directory: str): +def module_list_to_verilog_module(module_list: nn.ModuleList, module_name: str, output_directory: str, freq_thresh=None): input_bitwidth = None output_bitwidth = None module_contents = "" @@ -89,7 +95,7 @@ def module_list_to_verilog_module(module_list: nn.ModuleList, module_name: str, m = module_list[i] if type(m) == SparseLinearNeq: module_prefix = f"layer{i}" - module_input_bits, module_output_bits = m.gen_layer_verilog(module_prefix, output_directory) + module_input_bits, module_output_bits = m.gen_layer_verilog(module_prefix, output_directory, freq_thresh=freq_thresh) if i == 0: input_bitwidth = module_input_bits elif i == len(module_list)-1: @@ -141,7 +147,7 @@ def __init__(self, in_features: int, out_features: int, input_quant, output_quan # TODO: Move the verilog string templates to elsewhere # TODO: Move this to another class # TODO: Update this code to support custom bitwidths per input/output - def gen_layer_verilog(self, module_prefix, directory): + def gen_layer_verilog(self, module_prefix, directory, freq_thresh=None): _, input_bitwidth = self.input_quant.get_scale_factor_bits() _, output_bitwidth = self.output_quant.get_scale_factor_bits() input_bitwidth, output_bitwidth = int(input_bitwidth), int(output_bitwidth) @@ -152,7 +158,7 @@ def gen_layer_verilog(self, module_prefix, directory): for index in range(self.out_features): module_name = f"{module_prefix}_N{index}" indices, _, _, _ = self.neuron_truth_tables[index] - neuron_verilog = self.gen_neuron_verilog(index, module_name) # Generate the contents of the neuron verilog + neuron_verilog = self.gen_neuron_verilog(index, module_name, freq_thresh=freq_thresh) # Generate the contents of the neuron verilog with open(f"{directory}/{module_name}.v", "w") as f: f.write(neuron_verilog) connection_string = generate_neuron_connection_verilog(indices, input_bitwidth) # Generate the string which connects the synapses to this neuron @@ -168,7 +174,7 @@ def gen_layer_verilog(self, module_prefix, directory): # TODO: Move the verilog string templates to elsewhere # TODO: Move this to another class - def gen_neuron_verilog(self, index, module_name): + def gen_neuron_verilog(self, index, module_name, freq_thresh=None): indices, input_perm_matrix, float_output_states, bin_output_states = self.neuron_truth_tables[index] _, input_bitwidth = self.input_quant.get_scale_factor_bits() _, output_bitwidth = self.output_quant.get_scale_factor_bits() @@ -181,7 +187,8 @@ def gen_neuron_verilog(self, index, module_name): val = input_perm_matrix[i,idx] entry_str += self.input_quant.get_bin_str(val) res_str = self.output_quant.get_bin_str(bin_output_states[i]) - lut_string += f"\t\t\t{int(cat_input_bitwidth)}'b{entry_str}: M1r = {int(output_bitwidth)}'b{res_str};\n" + if (freq_thresh is None) or (self.used_luts_histogram[index][i] >= freq_thresh): + lut_string += f"\t\t\t{int(cat_input_bitwidth)}'b{entry_str}: M1r = {int(output_bitwidth)}'b{res_str};\n" return generate_lut_verilog(module_name, int(cat_input_bitwidth), int(output_bitwidth), lut_string) def lut_inference(self, track_used_luts=False): From 538281538cd43d0e040c67f10b0aeb7ef68d51ec Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 18 May 2021 10:52:07 +0100 Subject: [PATCH 04/64] [jsc] Made verification of verilog simulation optional with a flag. 
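
Verification compares each Verilog output vector against the PyTorch
forward pass. Once truth-table entries can be pruned from the generated
verilog, a mismatch is expected rather than fatal, so the assertion now
needs to be optional. A minimal usage sketch (assuming a lut_model built
as in neq2lut.py; the log directory is a placeholder):

    # Previous behaviour: assert Verilog == PyTorch for every sample
    lut_model.verilog_inference("./log", "logicnet.v", verify=True)
    # New: skip the assertion, e.g. when TT entries have been dropped
    lut_model.verilog_inference("./log", "logicnet.v", verify=False)
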
--- examples/jet_substructure/models.py | 15 +++++++++------ 1 file changed, 9 insertions(+), 6 deletions(-) diff --git a/examples/jet_substructure/models.py b/examples/jet_substructure/models.py index 7c0fba9f9..be6891bff 100644 --- a/examples/jet_substructure/models.py +++ b/examples/jet_substructure/models.py @@ -64,12 +64,14 @@ def __init__(self, model_config): self.verilog_dir = None self.top_module_filename = None self.dut = None + self.verify = True - def verilog_inference(self, verilog_dir, top_module_filename): + def verilog_inference(self, verilog_dir, top_module_filename, verify=True): self.verilog_dir = realpath(verilog_dir) self.top_module_filename = top_module_filename self.dut = PyVerilator.build(f"{self.verilog_dir}/{self.top_module_filename}", verilog_path=[self.verilog_dir], build_dir=f"{self.verilog_dir}/verilator") self.is_verilog_inference = True + self.verify = verify def pytorch_inference(self): self.is_verilog_inference = False @@ -92,11 +94,8 @@ def verilog_forward(self, x): self.dut.io.clk = 0 for i in range(x.shape[0]): x_i = x[i,:] - y_i = self.pytorch_forward(x[i:i+1,:])[0] xv_i = list(map(lambda z: input_quant.get_bin_str(z), x_i)) - ys_i = list(map(lambda z: output_quant.get_bin_str(z), y_i)) xvc_i = reduce(lambda a,b: a+b, xv_i[::-1]) - ysc_i = reduce(lambda a,b: a+b, ys_i[::-1]) self.dut["M0"] = int(xvc_i, 2) for j in range(self.latency + 1): #print(self.dut.io.M5) @@ -104,9 +103,13 @@ def verilog_forward(self, x): result = f"{res:0{int(total_output_bits)}b}" self.dut.io.clk = 1 self.dut.io.clk = 0 - expected = f"{int(ysc_i,2):0{int(total_output_bits)}b}" result = f"{res:0{int(total_output_bits)}b}" - assert(expected == result) + if self.verify: + y_i = self.pytorch_forward(x[i:i+1,:])[0] + ys_i = list(map(lambda z: output_quant.get_bin_str(z), y_i)) + ysc_i = reduce(lambda a,b: a+b, ys_i[::-1]) + expected = f"{int(ysc_i,2):0{int(total_output_bits)}b}" + assert(expected == result) res_split = [result[i:i+output_bitwidth] for i in range(0, len(result), output_bitwidth)][::-1] yv_i = torch.Tensor(list(map(lambda z: int(z, 2), res_split))) y[i,:] = yv_i From 45d7955eae74d3ca4af3f7752f7446c305c3a9f0 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 18 May 2021 10:53:03 +0100 Subject: [PATCH 05/64] [jsc] Added loading of calculated histograms and specifying a TT frequency threshold. 
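
The intended flow, sketched below with placeholder paths and an
illustrative threshold, is to first collect per-neuron usage histograms
with dump_luts.py and then feed them back in when generating verilog:

    # Histograms saved by save_luts() in dump_luts.py
    luts = torch.load("./log/luts.pth")
    load_histograms(lut_model, luts)
    # Drop truth-table entries activated fewer than 5 times on the
    # training set (the value 5 is illustrative only)
    module_list_to_verilog_module(lut_model.module_list, "logicnet",
                                  "./log", freq_thresh=5)

Note that simulation verification is only enabled when --freq-thresh is
0, since a pruned netlist is not expected to match the PyTorch model
exactly.
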
--- examples/jet_substructure/neq2lut.py | 13 ++++++++++--- 1 file changed, 10 insertions(+), 3 deletions(-) diff --git a/examples/jet_substructure/neq2lut.py b/examples/jet_substructure/neq2lut.py index 15b6d2b80..c106128aa 100644 --- a/examples/jet_substructure/neq2lut.py +++ b/examples/jet_substructure/neq2lut.py @@ -20,7 +20,8 @@ from logicnets.nn import generate_truth_tables, \ lut_inference, \ - module_list_to_verilog_module + module_list_to_verilog_module, \ + load_histograms from train import configs, model_config, dataset_config, other_options, test from dataset import JetSubstructureDataset @@ -55,6 +56,10 @@ help="A location to store the log output of the training run and the output model (default: %(default)s)") parser.add_argument('--checkpoint', type=str, required=True, help="The checkpoint file which contains the model weights") + parser.add_argument('--histograms', type=str, required=True, + help="The checkpoint histograms of LUT usage") + parser.add_argument('--freq-thresh', type=int, default=0, + help="Threshold to use to include this truth table into the model (default: %(default)s)") args = parser.parse_args() defaults = configs[args.arch] options = vars(args) @@ -118,13 +123,15 @@ 'test_accuracy': lut_accuracy} torch.save(modelSave, options_cfg["log_dir"] + "/lut_based_model.pth") + luts = torch.load(args.histograms) + load_histograms(lut_model, luts) print("Generating verilog in %s..." % (options_cfg["log_dir"])) - module_list_to_verilog_module(lut_model.module_list, "logicnet", options_cfg["log_dir"]) + module_list_to_verilog_module(lut_model.module_list, "logicnet", options_cfg["log_dir"], freq_thresh=args.freq_thresh) print("Top level entity stored at: %s/logicnet.v ..." % (options_cfg["log_dir"])) print("Running inference simulation of Verilog-based model...") - lut_model.verilog_inference(options_cfg["log_dir"], "logicnet.v") + lut_model.verilog_inference(options_cfg["log_dir"], "logicnet.v", verify=args.freq_thresh == 0) verilog_accuracy = test(lut_model, test_loader, cuda=False) print("Verilog-Based Model accuracy: %f" % (verilog_accuracy)) From dc302d1f8344c02bcbf312aecdeb88ab052723b4 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Wed, 19 May 2021 15:52:34 +0100 Subject: [PATCH 06/64] [nn] Added a default case to verilog LUT generation. 
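
With frequency-based pruning the generated case statement no longer
enumerates every input pattern, so each neuron LUT now ends with a
"don't care" default arm. A sketch of how the arm is built (the 2-bit
width is illustrative only):

    output_bitwidth = 2
    default_string = output_bitwidth * 'x'   # -> "xx"
    lut_string = f"\t\t\tdefault: M1r = {output_bitwidth}'b{default_string};\n"
    # emitted verilog arm: default: M1r = 2'bxx;

PyVerilator is also built with --x-assign 0 so that the x assignments
resolve deterministically (to zeros) during simulation.
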
--- examples/jet_substructure/models.py | 2 +- src/logicnets/nn.py | 3 +++ 2 files changed, 4 insertions(+), 1 deletion(-) diff --git a/examples/jet_substructure/models.py b/examples/jet_substructure/models.py index be6891bff..e8c99a612 100644 --- a/examples/jet_substructure/models.py +++ b/examples/jet_substructure/models.py @@ -69,7 +69,7 @@ def __init__(self, model_config): def verilog_inference(self, verilog_dir, top_module_filename, verify=True): self.verilog_dir = realpath(verilog_dir) self.top_module_filename = top_module_filename - self.dut = PyVerilator.build(f"{self.verilog_dir}/{self.top_module_filename}", verilog_path=[self.verilog_dir], build_dir=f"{self.verilog_dir}/verilator") + self.dut = PyVerilator.build(f"{self.verilog_dir}/{self.top_module_filename}", verilog_path=[self.verilog_dir], build_dir=f"{self.verilog_dir}/verilator", command_args=("--x-assign","0",)) self.is_verilog_inference = True self.verify = verify diff --git a/src/logicnets/nn.py b/src/logicnets/nn.py index 27529e11a..39af6a959 100644 --- a/src/logicnets/nn.py +++ b/src/logicnets/nn.py @@ -189,6 +189,9 @@ def gen_neuron_verilog(self, index, module_name, freq_thresh=None): res_str = self.output_quant.get_bin_str(bin_output_states[i]) if (freq_thresh is None) or (self.used_luts_histogram[index][i] >= freq_thresh): lut_string += f"\t\t\t{int(cat_input_bitwidth)}'b{entry_str}: M1r = {int(output_bitwidth)}'b{res_str};\n" + # Add a default "don't care" statement + default_string = int(output_bitwidth) * 'x' + lut_string += f"\t\t\tdefault: M1r = {int(output_bitwidth)}'b{default_string};\n" return generate_lut_verilog(module_name, int(cat_input_bitwidth), int(output_bitwidth), lut_string) def lut_inference(self, track_used_luts=False): From 536271bf27b9ae490153ce3434c161eed1072edc Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Thu, 20 May 2021 16:15:21 +0100 Subject: [PATCH 07/64] [nn/jsc] Made registers optional in verilog generation. Default is no registers. 
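
layer_connection_verilog() now takes a register flag. Without it the
layers are chained combinationally through a wire/assign pair, and the
latency used by verilog simulation drops to a single cycle. A hedged
sketch of both modes (identifier names follow the templates in
verilog.py; the bit widths are placeholders):

    # New default: no pipeline register between layers
    s = layer_connection_verilog("layer1", input_string="M1", input_bits=8,
                                 output_string="M2", output_bits=4,
                                 output_wire=True, register=False)
    # Opt-in: instantiate a myreg stage on the layer input instead
    s = layer_connection_verilog("layer1", input_string="M1", input_bits=8,
                                 output_string="M2", output_bits=4,
                                 output_wire=True, register=True)
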
--- examples/jet_substructure/models.py | 2 +- src/logicnets/verilog.py | 12 +++++++----- 2 files changed, 8 insertions(+), 6 deletions(-) diff --git a/examples/jet_substructure/models.py b/examples/jet_substructure/models.py index e8c99a612..49fec0e1b 100644 --- a/examples/jet_substructure/models.py +++ b/examples/jet_substructure/models.py @@ -60,7 +60,7 @@ def __init__(self, model_config): layer_list.append(layer) self.module_list = nn.ModuleList(layer_list) self.is_verilog_inference = False - self.latency = len(self.num_neurons) + self.latency = 1 self.verilog_dir = None self.top_module_filename = None self.dut = None diff --git a/src/logicnets/verilog.py b/src/logicnets/verilog.py index df33fa701..f073a4692 100644 --- a/src/logicnets/verilog.py +++ b/src/logicnets/verilog.py @@ -45,13 +45,15 @@ def generate_logicnets_verilog(module_name: str, input_name: str, input_bits: in output_bits_1=output_bits-1, module_contents=module_contents) -def layer_connection_verilog(layer_string: str, input_string: str, input_bits: int, output_string: str, output_bits: int, output_wire=True): - layer_connection_template = """\ +def layer_connection_verilog(layer_string: str, input_string: str, input_bits: int, output_string: str, output_bits: int, output_wire=True, register=False): + if register: + layer_connection_template = """\ wire [{input_bits_1:d}:0] {input_string}w; myreg #(.DataWidth({input_bits})) {layer_string}_reg (.data_in({input_string}), .clk(clk), .rst(rst), .data_out({input_string}w));\n""" -# layer_connection_template = """\ -#wire [{input_bits_1:d}:0] {input_string}w; -#assign {input_string}w = {input_string};\n""" + else: + layer_connection_template = """\ +wire [{input_bits_1:d}:0] {input_string}w; +assign {input_string}w = {input_string};\n""" layer_connection_template += "wire [{output_bits_1:d}:0] {output_string};\n" if output_wire else "" layer_connection_template += "{layer_string} {layer_string}_inst (.M0({input_string}w), .M1({output_string}));\n" return layer_connection_template.format( layer_string=layer_string, From f4e7810bc482bbeab012f327f23e2e62c35dae77 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Wed, 26 May 2021 15:29:26 +0100 Subject: [PATCH 08/64] [verilog] Added 'parallel case' statement to generated verilog. --- src/logicnets/verilog.py | 1 + 1 file changed, 1 insertion(+) diff --git a/src/logicnets/verilog.py b/src/logicnets/verilog.py index f073a4692..742cb64f8 100644 --- a/src/logicnets/verilog.py +++ b/src/logicnets/verilog.py @@ -69,6 +69,7 @@ def generate_lut_verilog(module_name, input_fanin_bits, output_bits, lut_string) (*rom_style = "distributed" *) reg [{output_bits_1:d}:0] M1r; assign M1 = M1r; + (* parallel_case *) always @ (M0) begin case (M0) {lut_string} From 40d72e54102bd9ddb0a852b0662d11f0c9ec6445 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Mon, 31 May 2021 10:31:39 +0100 Subject: [PATCH 09/64] Revert "[verilog] Added 'parallel case' statement to generated verilog." This reverts commit f4e7810bc482bbeab012f327f23e2e62c35dae77. 
--- src/logicnets/verilog.py | 1 - 1 file changed, 1 deletion(-) diff --git a/src/logicnets/verilog.py b/src/logicnets/verilog.py index 742cb64f8..f073a4692 100644 --- a/src/logicnets/verilog.py +++ b/src/logicnets/verilog.py @@ -69,7 +69,6 @@ def generate_lut_verilog(module_name, input_fanin_bits, output_bits, lut_string) (*rom_style = "distributed" *) reg [{output_bits_1:d}:0] M1r; assign M1 = M1r; - (* parallel_case *) always @ (M0) begin case (M0) {lut_string} From 7970fce539a66ce90dd1412126cdaf43ad0c09b8 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Fri, 18 Jun 2021 15:19:58 +0100 Subject: [PATCH 10/64] [jsc] Bugfixes in setting histograms / frequency values --- examples/jet_substructure/neq2lut.py | 7 ++++--- examples/jet_substructure/train.py | 7 +++++++ 2 files changed, 11 insertions(+), 3 deletions(-) diff --git a/examples/jet_substructure/neq2lut.py b/examples/jet_substructure/neq2lut.py index e23a8d823..ac6c5ccc3 100644 --- a/examples/jet_substructure/neq2lut.py +++ b/examples/jet_substructure/neq2lut.py @@ -62,7 +62,7 @@ help="The checkpoint file which contains the model weights") parser.add_argument('--histograms', type=str, default=None, help="The checkpoint histograms of LUT usage (default: %(default)s)") - parser.add_argument('--freq-thresh', type=int, default=0, + parser.add_argument('--freq-thresh', type=int, default=None, help="Threshold to use to include this truth table into the model (default: %(default)s)") parser.add_argument('--generate-bench', action='store_true', default=False, help="Generate the truth table in BENCH format as well as verilog (default: %(default)s)") @@ -131,8 +131,9 @@ 'test_accuracy': lut_accuracy} torch.save(modelSave, options_cfg["log_dir"] + "/lut_based_model.pth") - luts = torch.load(args.histograms) - load_histograms(lut_model, luts) + if options_cfg["histograms"] is not None: + luts = torch.load(options_cfg["histograms"]) + load_histograms(lut_model, luts) print("Generating verilog in %s..." % (options_cfg["log_dir"])) module_list_to_verilog_module(lut_model.module_list, "logicnet", options_cfg["log_dir"], freq_thresh=options_cfg["freq_thresh"], generate_bench=options_cfg["generate_bench"]) diff --git a/examples/jet_substructure/train.py b/examples/jet_substructure/train.py index 840fd4f18..be90902b6 100644 --- a/examples/jet_substructure/train.py +++ b/examples/jet_substructure/train.py @@ -44,6 +44,8 @@ "learning_rate": 1e-3, "seed": 2, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "jsc-m": { "hidden_layers": [64, 32, 32, 32], @@ -59,6 +61,8 @@ "learning_rate": 1e-3, "seed": 3, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "jsc-l": { "hidden_layers": [32, 64, 192, 192, 16], @@ -74,6 +78,8 @@ "learning_rate": 1e-3, "seed": 16, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, } @@ -107,6 +113,7 @@ "checkpoint": None, "generate_bench": None, "freq_thresh": None, + "histograms": None, } def train(model, datasets, train_cfg, options): From fbf8238eb2272afa34fb90288b1805bc852dd2e1 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Mon, 28 Jun 2021 16:12:23 +0100 Subject: [PATCH 11/64] [jsc] Updated default PCA to be 12 dimensions. 
---
 examples/jet_substructure/config/yaml_IP_OP_config.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/examples/jet_substructure/config/yaml_IP_OP_config.yml b/examples/jet_substructure/config/yaml_IP_OP_config.yml
index e238039bf..95befe1fe 100644
--- a/examples/jet_substructure/config/yaml_IP_OP_config.yml
+++ b/examples/jet_substructure/config/yaml_IP_OP_config.yml
@@ -45,5 +45,5 @@ L1Reg: 0.0001
 NormalizeInputs: 1
 InputType: Dense
 ApplyPca: false
-PcaDimensions: 10
+PcaDimensions: 12
 

From 01f8d43b21d958a71cfc2884f221ecb133a7994b Mon Sep 17 00:00:00 2001
From: Nick Fraser
Date: Tue, 31 Aug 2021 16:48:37 +0100
Subject: [PATCH 12/64] [jsc] Fixed description of commandline arguments

---
 examples/jet_substructure/dump_luts.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/examples/jet_substructure/dump_luts.py b/examples/jet_substructure/dump_luts.py
index c244ee1ba..05952268e 100644
--- a/examples/jet_substructure/dump_luts.py
+++ b/examples/jet_substructure/dump_luts.py
@@ -29,7 +29,7 @@
 from logicnets.synthesis import synthesize_and_get_resource_counts
 
 if __name__ == "__main__":
-    parser = ArgumentParser(description="Synthesize convert a PyTorch trained model into verilog")
+    parser = ArgumentParser(description="Generate histograms of states used throughout LogicNets")
     parser.add_argument('--arch', type=str, choices=configs.keys(), default="jsc-s",
         help="Specify the neural network model to use (default: %(default)s)")
@@ -53,7 +53,7 @@
     parser.add_argument('--dataset-config', type=str, default='config/yaml_IP_OP_config.yml',
         help="The file to use to configure the input dataset (default: %(default)s)")
     parser.add_argument('--log-dir', type=str, default='./log',
-        help="A location to store the log output of the training run and the output model (default: %(default)s)")
+        help="A location to store the calculated histograms (default: %(default)s)")
     parser.add_argument('--checkpoint', type=str, required=True,
         help="The checkpoint file which contains the model weights")

From 1ed85a561f0fb3e76ad057e8e980c0c0e4198af5 Mon Sep 17 00:00:00 2001
From: Nick Fraser
Date: Tue, 28 Sep 2021 20:19:21 +0100
Subject: [PATCH 13/64] [jsc] Initial basic code for abc integration.

---
 src/logicnets/abc.py       | 107 +++++++++++++++++++++++++++++++++++++
 src/logicnets/synthesis.py |  45 ++++++++++++++++
 2 files changed, 152 insertions(+)
 create mode 100644 src/logicnets/abc.py

diff --git a/src/logicnets/abc.py b/src/logicnets/abc.py
new file mode 100644
index 000000000..dee7fa68b
--- /dev/null
+++ b/src/logicnets/abc.py
@@ -0,0 +1,107 @@
+# Copyright (C) 2021 Xilinx, Inc
+# Copyright (C) 2021 Alan Mishchenko
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+def generate_prepare_script_string(num_layers, path):
+    prepare_script_template = """\
+# This script prepares experiments in ABC by deriving intermediate simulation patterns
+
+# Assuming that verilog/BENCH for each layer of the network are in files "ver/layer{{0,1,2,..}}.v"
+# and input/output patterns of the network are in files {{train,test}}_{{input,output}}.txt
+
+
+# ====================================================================================
+# Read the layers from Verilog/BENCH files
+{read_layers_string}
+
+# ====================================================================================
+# Convert input patterns into the internal binary representation
+&lnetread {path}/train_input.txt {path}/train.sim
+&lnetread {path}/test_input.txt {path}/test.sim
+
+
+# ====================================================================================
+# Generate training simulation info for the inputs of each layer
+{simulate_layers_string}
+
+# ====================================================================================
+# Combine all layers into one monolithic AIG for the whole network (layers.aig)
+{gen_monolithic_aig_string}
+"""
+    read_layer_template = "&lnetread {path}/ver/layer{i}.v; &ps; &w {path}/layer{i}.aig\n"
+    simulate_layer_template = "&r {path}/layer{i}.aig; &lnetsim {path}/train{it}.sim {path}/train{ip1}.sim\n"
+    gen_monolithic_aig_template = "putontop {layers_aig_string}; st; ps; write {path}/layers.aig\n"
+    read_layers_string = ""
+    simulate_layers_string = ""
+    layers_aig_string = ""
+    for i in range(num_layers):
+        read_layers_string += read_layer_template.format(i=i, path=path)
+        simulate_layers_string += simulate_layer_template.format(i=i, it="" if i == 0 else i, ip1=i+1, path=path)
+        layers_aig_string += "{path}/layer{i}.aig ".format(i=i, path=path)
+    gen_monolithic_aig_string = gen_monolithic_aig_template.format(layers_aig_string=layers_aig_string.strip(), path=path)
+    return prepare_script_template.format( path=path,
+                                           read_layers_string=read_layers_string,
+                                           simulate_layers_string=simulate_layers_string,
+                                           gen_monolithic_aig_string=gen_monolithic_aig_string)
+
+
+def generate_opt_script_string(model, path, num_registers, rarity=0):
+    opt_script_template = """\
+# Generating script with rarity = {rarity}.
+ +# ---- rarity = {rarity} ------------------------------------------------------------------------------------------------------- +{optimise_with_rarity_string} + +{gen_monolithic_aig_string} + +{technology_map_layers_string} + +{gen_monolithic_blif_string} + +read {path}/blif/layers_opt.blif; ps; pipe -L {num_registers}; ps; retime -M 4; ps; sweep; ps; write_verilog -fm {path}/ver/layers_opt_p{num_registers}.v + +&r {path}/aig/layers_opt.aig; &lnetsim {path}/train.sim {path}/train.simo +&r {path}/aig/layers_opt.aig; &lneteval -O 2 {path}/train.simo {path}/train_output.txt + +&r {path}/aig/layers_opt.aig; &lnetsim {path}/test.sim {path}/test.simo +&r {path}/aig/layers_opt.aig; &lneteval -O 2 {path}/test.simo {path}/test_output.txt + +""" + optimise_with_rarity_template = "&r {path}/layer{i}.aig; &ps; &lnetopt -I {fanin_bits} -O {fanout_bits} -R {rarity} {path}/train{it}.sim; &w {path}/aig/layer{i}_opt.aig; &ps; time\n" + technology_map_layer_template = "&r {path}/aig/layer{i}_opt.aig; &lnetmap -I {fanin_bits} -O {fanout_bits}; write {path}/blif/layer{i}_opt.blif; write_verilog -fm {path}/ver/layer{i}_opt.v\n" + gen_monolithic_aig_template = "putontop {aig_layers_string}; st; ps; write {path}/aig/layers_opt.aig\n" + gen_monolithic_blif_template = "putontop {blif_layers_string}; sw; ps; write {path}/blif/layers_opt.blif\n" + num_layers = 5 # TODO: fetch number of layers from the model + optimise_with_rarity_string = "" + technology_map_layers_string = "" + aig_layers_string = "" + blif_layers_string = "" + for i in range(num_layers): + fanin_bits = 6 # TODO: Read this from model + fanout_bits = 2 # TODO: Read this from model + optimise_with_rarity_string += optimise_with_rarity_template.format(fanin_bits=fanin_bits, fanout_bits=fanout_bits, it="" if i == 0 else i, i=i, path=path, rarity=rarity) + technology_map_layers_string += technology_map_layer_template.format(fanin_bits=fanin_bits, fanout_bits=fanout_bits, i=i, path=path) + aig_layers_string += "{path}/aig/layer{i}_opt.aig ".format(i=i, path=path) + blif_layers_string += "{path}/blif/layer{i}_opt.blif ".format(i=i, path=path) + gen_monolithic_aig_string = gen_monolithic_aig_template.format(aig_layers_string=aig_layers_string.strip(), path=path) + gen_monolithic_blif_string = gen_monolithic_blif_template.format(blif_layers_string=blif_layers_string.strip(), path=path) + return opt_script_template.format( rarity=rarity, + num_registers=num_registers, + path=path, + optimise_with_rarity_string=optimise_with_rarity_string, + gen_monolithic_aig_string=gen_monolithic_aig_string, + technology_map_layers_string=technology_map_layers_string, + gen_monolithic_blif_string=gen_monolithic_blif_string) + + diff --git a/src/logicnets/synthesis.py b/src/logicnets/synthesis.py index dc1551716..a95f2d2cb 100644 --- a/src/logicnets/synthesis.py +++ b/src/logicnets/synthesis.py @@ -14,10 +14,15 @@ import os import subprocess +import shutil from shutil import which +import glob + +from .abc import generate_prepare_script_string, generate_opt_script_string #xcvu9p-flgb2104-2-i # TODO: Add option to perform synthesis on a remote server +# Synthesise design with vivado and get resource counts def synthesize_and_get_resource_counts(verilog_dir, top_name, fpga_part = "xcku3p-ffva676-1-e", clk_name="clk", clk_period_ns=5.0): # old part : "xczu3eg-sbva484-1-i" @@ -56,3 +61,43 @@ def synthesize_and_get_resource_counts(verilog_dir, top_name, else: ret["fmax_mhz"] = 1000.0 / (clk_period_ns - ret["WNS"]) return ret + +# Optimize the design with ABC +def 
synthesize_and_get_resource_counts_with_abc(verilog_dir, model, pipeline_stages=0, freq_thresh=0): + if "ABC_ROOT" not in os.environ: + raise Exception("The environment variable ABC_ROOT is not defined.") + abc_path = os.environ["ABC_ROOT"] + + # Create directories and symlinks ready for processing with ABC + project_prefix = "logicnet" + abc_project_root = f"{verilog_dir}/{project_prefix}" + os.makedirs(f"{abc_project_root}/ver") + os.makedirs(f"{abc_project_root}/aig") + os.makedirs(f"{abc_project_root}/blif") + real_abc_project_root = os.path.realpath(abc_project_root) + project_symlink_path = f"{abc_path}/{project_prefix}" + os.symlink(real_abc_project_root, project_symlink_path) # Create a symlink to this folder in the ABC root. + # Fetch the right source files from the verilog directory + source_files = glob.glob(f"{verilog_dir}/*.v") + glob.glob(f"{verilog_dir}/*.bench") + for f in source_files: + shutil.copy(f, f"{abc_project_root}/ver") + # Fetch the I/O files + for f in glob.glob(f"{verilog_dir}/*.txt"): + shutil.copy(f, f"{abc_project_root}") + + # Create script files to pass to ABC + # TODO: Calculate number of layers from the model + with open(f"{abc_project_root}/prepare.script", "w") as f: + f.write(generate_prepare_script_string(num_layers=5, path=project_prefix)) + with open(f"{abc_project_root}/opt_all.script", "w") as f: + f.write(generate_opt_script_string(model=model, path=project_prefix, num_registers=pipeline_stages, rarity=freq_thresh)) + + #proc = subprocess.Popen(['./abc', '-c', '"x/jsc_s/prepare.script"', '-c', '"x/jsc_s/opt_all.script"'], cwd=abc_path, stdout=subprocess.PIPE, env=os.environ) + proc = subprocess.Popen(['./abc', '-c', f'"{project_prefix}/prepare.script"', '-c', f'"{project_prefix}/opt_all.script"'], cwd=abc_path, stdout=subprocess.PIPE, env=os.environ) + out, err = proc.communicate() + + with open(f"{abc_project_root}/abc.log", "w") as f: + f.write(out.decode("utf-8")) + + os.remove(project_symlink_path) + From 2857e710a10a37deadbed8ee46520f74dce54dd6 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 28 Sep 2021 22:10:32 +0100 Subject: [PATCH 14/64] [abc] Updated module to pull information from the input model. Created end-to-end example. --- examples/jet_substructure/neq2lut_abc.py | 154 +++++++++++++++++++++++ src/logicnets/abc.py | 16 ++- src/logicnets/synthesis.py | 20 +-- 3 files changed, 179 insertions(+), 11 deletions(-) create mode 100644 examples/jet_substructure/neq2lut_abc.py diff --git a/examples/jet_substructure/neq2lut_abc.py b/examples/jet_substructure/neq2lut_abc.py new file mode 100644 index 000000000..bdd431c2e --- /dev/null +++ b/examples/jet_substructure/neq2lut_abc.py @@ -0,0 +1,154 @@ +# Copyright (C) 2021 Xilinx, Inc +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+
+import os
+from argparse import ArgumentParser
+
+import torch
+from torch.utils.data import DataLoader
+
+from logicnets.nn import generate_truth_tables, \
+                         lut_inference, \
+                         module_list_to_verilog_module
+from logicnets.synthesis import synthesize_and_get_resource_counts_with_abc
+
+from train import configs, model_config, dataset_config, test
+from dataset import JetSubstructureDataset
+from models import JetSubstructureNeqModel, JetSubstructureLutModel
+from dataset_dump import dump_io
+
+other_options = {
+    "cuda": None,
+    "log_dir": None,
+    "checkpoint": None,
+}
+
+if __name__ == "__main__":
+    parser = ArgumentParser(description="Synthesize and convert a PyTorch trained model into verilog")
+    parser.add_argument('--arch', type=str, choices=configs.keys(), default="jsc-s",
+        help="Specify the neural network model to use (default: %(default)s)")
+    parser.add_argument('--batch-size', type=int, default=None, metavar='N',
+        help="Batch size for evaluation (default: %(default)s)")
+    parser.add_argument('--input-bitwidth', type=int, default=None,
+        help="Bitwidth to use at the input (default: %(default)s)")
+    parser.add_argument('--hidden-bitwidth', type=int, default=None,
+        help="Bitwidth to use for activations in hidden layers (default: %(default)s)")
+    parser.add_argument('--output-bitwidth', type=int, default=None,
+        help="Bitwidth to use at the output (default: %(default)s)")
+    parser.add_argument('--input-fanin', type=int, default=None,
+        help="Fanin to use at the input (default: %(default)s)")
+    parser.add_argument('--hidden-fanin', type=int, default=None,
+        help="Fanin to use for the hidden layers (default: %(default)s)")
+    parser.add_argument('--output-fanin', type=int, default=None,
+        help="Fanin to use at the output (default: %(default)s)")
+    parser.add_argument('--hidden-layers', nargs='+', type=int, default=None,
+        help="A list of hidden layer neuron sizes (default: %(default)s)")
+    parser.add_argument('--dataset-file', type=str, default='data/processed-pythia82-lhc13-all-pt1-50k-r1_h022_e0175_t220_nonu_truth.z',
+        help="The file to use as the dataset input (default: %(default)s)")
+    parser.add_argument('--clock-period', type=float, default=1.0,
+        help="Target clock period to use during Vivado synthesis (default: %(default)s)")
+    parser.add_argument('--dataset-config', type=str, default='config/yaml_IP_OP_config.yml',
+        help="The file to use to configure the input dataset (default: %(default)s)")
+    parser.add_argument('--dataset-split', type=str, default='test', choices=['train', 'test'],
+        help="Dataset to use for evaluation (default: %(default)s)")
+    parser.add_argument('--log-dir', type=str, default='./log',
+        help="A location to store the log output of the training run and the output model (default: %(default)s)")
+    parser.add_argument('--checkpoint', type=str, required=True,
+        help="The checkpoint file which contains the model weights")
+    parser.add_argument('--num-registers', type=int, default=0,
+        help="The number of registers to add to the generated verilog (default: %(default)s)")
+    args = parser.parse_args()
+    defaults = configs[args.arch]
+    options = vars(args)
+    del options['arch']
+    config = {}
+    for k in options.keys():
+        config[k] = options[k] if options[k] is not None else defaults[k] # Override defaults, if specified.
+
+    if not os.path.exists(config['log_dir']):
+        os.makedirs(config['log_dir'])
+
+    # Split up configuration options to be more understandable
+    model_cfg = {}
+    for k in model_config.keys():
+        model_cfg[k] = config[k]
+    dataset_cfg = {}
+    for k in dataset_config.keys():
+        dataset_cfg[k] = config[k]
+    options_cfg = {}
+    for k in other_options.keys():
+        if k == 'cuda':
+            continue
+        options_cfg[k] = config[k]
+
+    # Fetch the test set
+    dataset = {}
+    dataset["train"] = JetSubstructureDataset(dataset_cfg['dataset_file'], dataset_cfg['dataset_config'], split="train")
+    dataset["test"] = JetSubstructureDataset(dataset_cfg['dataset_file'], dataset_cfg['dataset_config'], split="test")
+    train_loader = DataLoader(dataset["train"], batch_size=config['batch_size'], shuffle=False)
+    test_loader = DataLoader(dataset["test"], batch_size=config['batch_size'], shuffle=False)
+
+    # Instantiate the PyTorch model
+    x, y = dataset[args.dataset_split][0]
+    model_cfg['input_length'] = len(x)
+    model_cfg['output_length'] = len(y)
+    model = JetSubstructureNeqModel(model_cfg)
+
+    # Load the model weights
+    checkpoint = torch.load(options_cfg['checkpoint'], map_location='cpu')
+    model.load_state_dict(checkpoint['model_dict'])
+
+    # Test the PyTorch model
+    print("Running inference on baseline model...")
+    model.eval()
+    baseline_accuracy = test(model, test_loader, cuda=False)
+    print("Baseline accuracy: %f" % (baseline_accuracy))
+
+    # Run preprocessing on training set.
+    #train_input_file = config['log_dir'] + "/train_input.txt"
+    #train_output_file = config['log_dir'] + "/train_output.txt"
+    #test_input_file = config['log_dir'] + "/test_input.txt"
+    #test_output_file = config['log_dir'] + "/test_output.txt"
+    #print(f"Dumping train I/O to {train_input_file} and {train_output_file}")
+    #dump_io(model, train_loader, train_input_file, train_output_file)
+    #print(f"Dumping test I/O to {test_input_file} and {test_output_file}")
+    #dump_io(model, test_loader, test_input_file, test_output_file)
+
+    # Instantiate LUT-based model
+    lut_model = JetSubstructureLutModel(model_cfg)
+    lut_model.load_state_dict(checkpoint['model_dict'])
+
+    # Generate the truth tables in the LUT module
+    print("Converting NEQs to LUTs...")
+    generate_truth_tables(lut_model, verbose=True)
+
+    # Test the LUT-based model
+    print("Running inference on LUT-based model...")
+    lut_inference(lut_model)
+    lut_model.eval()
+    lut_accuracy = test(lut_model, test_loader, cuda=False)
+    print("LUT-Based Model accuracy: %f" % (lut_accuracy))
+    modelSave = {   'model_dict': lut_model.state_dict(),
+                    'test_accuracy': lut_accuracy}
+
+    torch.save(modelSave, options_cfg["log_dir"] + "/lut_based_model.pth")
+
+    print("Generating verilog in %s..." % (options_cfg["log_dir"]))
+    module_list_to_verilog_module(lut_model.module_list, "logicnet", options_cfg["log_dir"], generate_bench=True, add_registers=False)
+    print("Top level entity stored at: %s/logicnet.v ..." % (options_cfg["log_dir"]))
+
+    print("Running synthesis and generating technology-mapped verilog in ABC")
+    synthesize_and_get_resource_counts_with_abc(options_cfg["log_dir"], lut_model.module_list, pipeline_stages=args.num_registers, freq_thresh=0)
+
diff --git a/src/logicnets/abc.py b/src/logicnets/abc.py
index dee7fa68b..c3b56e568 100644
--- a/src/logicnets/abc.py
+++ b/src/logicnets/abc.py
@@ -56,7 +56,7 @@ def generate_prepare_script_string(num_layers, path):
                                            gen_monolithic_aig_string=gen_monolithic_aig_string)
 
 
-def generate_opt_script_string(model, path, num_registers, rarity=0):
+def generate_opt_script_string(module_list, path, num_registers, rarity=0):
     opt_script_template = """\
 # Generating script with rarity = {rarity}.
 
@@ -82,14 +82,22 @@ def generate_opt_script_string(model, path, num_registers, rarity=0):
     technology_map_layer_template = "&r {path}/aig/layer{i}_opt.aig; &lnetmap -I {fanin_bits} -O {fanout_bits}; write {path}/blif/layer{i}_opt.blif; write_verilog -fm {path}/ver/layer{i}_opt.v\n"
     gen_monolithic_aig_template = "putontop {aig_layers_string}; st; ps; write {path}/aig/layers_opt.aig\n"
     gen_monolithic_blif_template = "putontop {blif_layers_string}; sw; ps; write {path}/blif/layers_opt.blif\n"
-    num_layers = 5 # TODO: fetch number of layers from the model
+    num_layers = len(module_list)
     optimise_with_rarity_string = ""
     technology_map_layers_string = ""
     aig_layers_string = ""
     blif_layers_string = ""
     for i in range(num_layers):
-        fanin_bits = 6 # TODO: Read this from model
-        fanout_bits = 2 # TODO: Read this from model
+        # Read in fanin/fanout bits
+        # Add assertion that the fanin/fanout bits of all neurons are the same
+        layer = module_list[i]
+        _, input_bitwidth = layer.input_quant.get_scale_factor_bits()
+        _, output_bitwidth = layer.output_quant.get_scale_factor_bits()
+        num_indices = len(layer.neuron_truth_tables[0][0])
+        fanin_bits = input_bitwidth*num_indices
+        fanout_bits = output_bitwidth
+
+        # Generate optimisation script.
optimise_with_rarity_string += optimise_with_rarity_template.format(fanin_bits=fanin_bits, fanout_bits=fanout_bits, it="" if i == 0 else i, i=i, path=path, rarity=rarity) technology_map_layers_string += technology_map_layer_template.format(fanin_bits=fanin_bits, fanout_bits=fanout_bits, i=i, path=path) aig_layers_string += "{path}/aig/layer{i}_opt.aig ".format(i=i, path=path) diff --git a/src/logicnets/synthesis.py b/src/logicnets/synthesis.py index a95f2d2cb..50a5b5b12 100644 --- a/src/logicnets/synthesis.py +++ b/src/logicnets/synthesis.py @@ -63,7 +63,7 @@ def synthesize_and_get_resource_counts(verilog_dir, top_name, return ret # Optimize the design with ABC -def synthesize_and_get_resource_counts_with_abc(verilog_dir, model, pipeline_stages=0, freq_thresh=0): +def synthesize_and_get_resource_counts_with_abc(verilog_dir, module_list, pipeline_stages=0, freq_thresh=0): if "ABC_ROOT" not in os.environ: raise Exception("The environment variable ABC_ROOT is not defined.") abc_path = os.environ["ABC_ROOT"] @@ -71,16 +71,22 @@ def synthesize_and_get_resource_counts_with_abc(verilog_dir, model, pipeline_sta # Create directories and symlinks ready for processing with ABC project_prefix = "logicnet" abc_project_root = f"{verilog_dir}/{project_prefix}" - os.makedirs(f"{abc_project_root}/ver") - os.makedirs(f"{abc_project_root}/aig") - os.makedirs(f"{abc_project_root}/blif") + verilog_bench_dir = f"{abc_project_root}/ver" + aig_dir = f"{abc_project_root}/aig" + blif_dir = f"{abc_project_root}/blif" + if not os.path.exists(verilog_bench_dir): + os.makedirs(verilog_bench_dir) + if not os.path.exists(aig_dir): + os.makedirs(aig_dir) + if not os.path.exists(blif_dir): + os.makedirs(blif_dir) real_abc_project_root = os.path.realpath(abc_project_root) project_symlink_path = f"{abc_path}/{project_prefix}" os.symlink(real_abc_project_root, project_symlink_path) # Create a symlink to this folder in the ABC root. # Fetch the right source files from the verilog directory source_files = glob.glob(f"{verilog_dir}/*.v") + glob.glob(f"{verilog_dir}/*.bench") for f in source_files: - shutil.copy(f, f"{abc_project_root}/ver") + shutil.copy(f, verilog_bench_dir) # Fetch the I/O files for f in glob.glob(f"{verilog_dir}/*.txt"): shutil.copy(f, f"{abc_project_root}") @@ -88,9 +94,9 @@ def synthesize_and_get_resource_counts_with_abc(verilog_dir, model, pipeline_sta # Create script files to pass to ABC # TODO: Calculate number of layers from the model with open(f"{abc_project_root}/prepare.script", "w") as f: - f.write(generate_prepare_script_string(num_layers=5, path=project_prefix)) + f.write(generate_prepare_script_string(num_layers=len(module_list), path=project_prefix)) with open(f"{abc_project_root}/opt_all.script", "w") as f: - f.write(generate_opt_script_string(model=model, path=project_prefix, num_registers=pipeline_stages, rarity=freq_thresh)) + f.write(generate_opt_script_string(module_list=module_list, path=project_prefix, num_registers=pipeline_stages, rarity=freq_thresh)) #proc = subprocess.Popen(['./abc', '-c', '"x/jsc_s/prepare.script"', '-c', '"x/jsc_s/opt_all.script"'], cwd=abc_path, stdout=subprocess.PIPE, env=os.environ) proc = subprocess.Popen(['./abc', '-c', f'"{project_prefix}/prepare.script"', '-c', f'"{project_prefix}/opt_all.script"'], cwd=abc_path, stdout=subprocess.PIPE, env=os.environ) From 52f8c6425d0aafd95ef92b5c4f709dbfe9930243 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 2 Nov 2021 12:17:19 +0000 Subject: [PATCH 15/64] Added AMC depencency to Dockerfile. 
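
The ABC flow in logicnets.synthesis locates the ABC build through the
ABC_ROOT environment variable and symlinks the project directory into
it. Outside of this image the same setup might look like the sketch
below (the path and lut_model are placeholders):

    import os
    os.environ["ABC_ROOT"] = "/workspace/abc"  # must contain the built ./abc binary
    synthesize_and_get_resource_counts_with_abc(
        "./log", lut_model.module_list, pipeline_stages=0, freq_thresh=0)
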
---
 docker/Dockerfile.cpu | 7 +++++++
 1 file changed, 7 insertions(+)

diff --git a/docker/Dockerfile.cpu b/docker/Dockerfile.cpu
index 3eaba4b33..6b63945c5 100644
--- a/docker/Dockerfile.cpu
+++ b/docker/Dockerfile.cpu
@@ -37,6 +37,13 @@ RUN apt-get -qq update && apt-get -qq -y install verilator build-essential libx1
 RUN git clone https://bitbucket.org/maltanar/oh-my-xilinx.git
 ENV OHMYXILINX=/workspace/oh-my-xilinx
 
+# Adding LogicNets dependency on ABC
+RUN git clone https://github.com/berkeley-abc/abc.git \
+    && cd abc \
+    && git checkout ecda331a2a921bcac30bf3210f56adf9152ca22f \
+    && make -j`nproc`
+ENV ABC_ROOT=/workspace/abc
+
 # Create the user account to run LogicNets
 RUN groupadd -g $GID $GNAME
 RUN useradd -m -u $UID $UNAME -g $GNAME

From fbf8238eb2272afa34fb90288b1805bc852dd2e1 Mon Sep 17 00:00:00 2001
From: Nick Fraser
Date: Thu, 18 Aug 2022 17:28:36 +0100
Subject: [PATCH 16/64] [nids] Initial version supporting histograms.

---
 examples/cybersecurity/dump_luts.py | 119 ++++++++++++++++++++++++++++
 examples/cybersecurity/models.py    |  17 ++--
 examples/cybersecurity/neq2lut.py   |  19 ++++-
 examples/cybersecurity/train.py     |  12 +++
 4 files changed, 156 insertions(+), 11 deletions(-)
 create mode 100644 examples/cybersecurity/dump_luts.py

diff --git a/examples/cybersecurity/dump_luts.py b/examples/cybersecurity/dump_luts.py
new file mode 100644
index 000000000..01a57663f
--- /dev/null
+++ b/examples/cybersecurity/dump_luts.py
@@ -0,0 +1,119 @@
+# Copyright (C) 2021 Xilinx, Inc
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import os
+from argparse import ArgumentParser
+
+import torch
+from torch.utils.data import DataLoader
+
+from logicnets.nn import generate_truth_tables, \
+                         lut_inference, \
+                         save_luts, \
+                         module_list_to_verilog_module
+
+from train import configs, model_config, dataset_config, other_options, test
+from dataset import get_preqnt_dataset
+from models import UnswNb15NeqModel, UnswNb15LutModel
+
+if __name__ == "__main__":
+    parser = ArgumentParser(description="Generate histograms of states used throughout LogicNets")
+    parser.add_argument('--arch', type=str, choices=configs.keys(), default="jsc-s",
+        help="Specify the neural network model to use (default: %(default)s)")
+    parser.add_argument('--batch-size', type=int, default=None, metavar='N',
+        help="Batch size for evaluation (default: %(default)s)")
+    parser.add_argument('--input-bitwidth', type=int, default=None,
+        help="Bitwidth to use at the input (default: %(default)s)")
+    parser.add_argument('--hidden-bitwidth', type=int, default=None,
+        help="Bitwidth to use for activations in hidden layers (default: %(default)s)")
+    parser.add_argument('--output-bitwidth', type=int, default=None,
+        help="Bitwidth to use at the output (default: %(default)s)")
+    parser.add_argument('--input-fanin', type=int, default=None,
+        help="Fanin to use at the input (default: %(default)s)")
+    parser.add_argument('--hidden-fanin', type=int, default=None,
+        help="Fanin to use for the hidden layers (default: %(default)s)")
+    parser.add_argument('--output-fanin', type=int, default=None,
+        help="Fanin to use at the output (default: %(default)s)")
+    parser.add_argument('--hidden-layers', nargs='+', type=int, default=None,
+        help="A list of hidden layer neuron sizes (default: %(default)s)")
+    parser.add_argument('--dataset-file', type=str, default='data/unsw_nb15_binarized.npz',
+        help="The file to use as the dataset input (default: %(default)s)")
+    parser.add_argument('--log-dir', type=str, default='./log',
+        help="A location to store the calculated histograms (default: %(default)s)")
+    parser.add_argument('--checkpoint', type=str, required=True,
+        help="The checkpoint file which contains the model weights")
+    args = parser.parse_args()
+    defaults = configs[args.arch]
+    options = vars(args)
+    del options['arch']
+    config = {}
+    for k in options.keys():
+        config[k] = options[k] if options[k] is not None else defaults[k] # Override defaults, if specified.
+
+    if not os.path.exists(config['log_dir']):
+        os.makedirs(config['log_dir'])
+
+    # Split up configuration options to be more understandable
+    model_cfg = {}
+    for k in model_config.keys():
+        model_cfg[k] = config[k]
+    dataset_cfg = {}
+    for k in dataset_config.keys():
+        dataset_cfg[k] = config[k]
+    options_cfg = {}
+    for k in other_options.keys():
+        if k == 'cuda':
+            continue
+        options_cfg[k] = config[k]
+
+    # Fetch the test set
+    dataset = {}
+    dataset['train'] = get_preqnt_dataset(dataset_cfg['dataset_file'], split='train')
+    train_loader = DataLoader(dataset["train"], batch_size=config['batch_size'], shuffle=False)
+
+    # Instantiate the PyTorch model
+    x, y = dataset['train'][0]
+    dataset_length = len(dataset['train'])
+    model_cfg['input_length'] = len(x)
+    model_cfg['output_length'] = 1
+    model = UnswNb15NeqModel(model_cfg)
+
+    # Load the model weights
+    checkpoint = torch.load(options_cfg['checkpoint'], map_location='cpu')
+    model.load_state_dict(checkpoint['model_dict'])
+
+    # Test the PyTorch model
+    print("Running inference of baseline model on training set (%d examples)..." % (dataset_length))
+    model.eval()
+    baseline_accuracy = test(model, train_loader, cuda=False)
+    print("Baseline accuracy: %f" % (baseline_accuracy))
+
+    # Instantiate LUT-based model
+    lut_model = UnswNb15LutModel(model_cfg)
+    lut_model.load_state_dict(checkpoint['model_dict'])
+
+    # Generate the truth tables in the LUT module
+    print("Converting NEQs to LUTs...")
+    generate_truth_tables(lut_model, verbose=True)
+
+    # Test the LUT-based model
+    print("Running inference of LUT-based model on training set (%d examples)..." % (dataset_length))
+    lut_inference(lut_model, track_used_luts=True)
+    lut_model.eval()
+    lut_accuracy = test(lut_model, train_loader, cuda=False)
+    print("LUT-Based Model accuracy: %f" % (lut_accuracy))
+    print("Saving LUTs to %s... " % (options_cfg["log_dir"] + "/luts.pth"))
+    save_luts(lut_model, options_cfg["log_dir"] + "/luts.pth")
+    print("Done!")
+
diff --git a/examples/cybersecurity/models.py b/examples/cybersecurity/models.py
index b98ab5dc9..bfbaf2ca5 100644
--- a/examples/cybersecurity/models.py
+++ b/examples/cybersecurity/models.py
@@ -63,13 +63,15 @@ def __init__(self, model_config):
         self.verilog_dir = None
         self.top_module_filename = None
         self.dut = None
+        self.verify = True
         self.logfile = None
 
-    def verilog_inference(self, verilog_dir, top_module_filename, logfile: bool = False, add_registers: bool = False):
+    def verilog_inference(self, verilog_dir, top_module_filename, logfile: bool = False, add_registers: bool = False, verify: bool = True):
         self.verilog_dir = realpath(verilog_dir)
         self.top_module_filename = top_module_filename
-        self.dut = PyVerilator.build(f"{self.verilog_dir}/{self.top_module_filename}", verilog_path=[self.verilog_dir], build_dir=f"{self.verilog_dir}/verilator")
+        self.dut = PyVerilator.build(f"{self.verilog_dir}/{self.top_module_filename}", verilog_path=[self.verilog_dir], build_dir=f"{self.verilog_dir}/verilator", command_args=("--x-assign","0",))
         self.is_verilog_inference = True
+        self.verify = verify
         self.logfile = logfile
         if add_registers:
             self.latency = len(self.num_neurons)
@@ -95,11 +97,8 @@ def verilog_forward(self, x):
         self.dut.io.clk = 0
         for i in range(x.shape[0]):
             x_i = x[i,:]
-            y_i = self.pytorch_forward(x[i:i+1,:])[0]
             xv_i = list(map(lambda z: input_quant.get_bin_str(z), x_i))
-            ys_i = list(map(lambda z: output_quant.get_bin_str(z), y_i))
             xvc_i = reduce(lambda a,b: a+b, xv_i[::-1])
-            ysc_i = reduce(lambda a,b: a+b, ys_i[::-1])
             self.dut["M0"] = int(xvc_i, 2)
             for j in range(self.latency + 1):
                 #print(self.dut.io.M5)
                 result = f"{res:0{int(total_output_bits)}b}"
                 self.dut.io.clk = 1
                 self.dut.io.clk = 0
-            expected = f"{int(ysc_i,2):0{int(total_output_bits)}b}"
             result = f"{res:0{int(total_output_bits)}b}"
-            assert(expected == result)
+            if self.verify:
+                y_i = self.pytorch_forward(x[i:i+1,:])[0]
+                ys_i = list(map(lambda z: output_quant.get_bin_str(z), y_i))
+                ysc_i = reduce(lambda a,b: a+b, ys_i[::-1])
+                expected = f"{int(ysc_i,2):0{int(total_output_bits)}b}"
+                assert(expected == result)
             res_split = [result[i:i+output_bitwidth] for i in range(0, len(result), output_bitwidth)][::-1]
             yv_i = torch.Tensor(list(map(lambda z: int(z, 2), res_split)))
             y[i,:] = yv_i
diff --git a/examples/cybersecurity/neq2lut.py b/examples/cybersecurity/neq2lut.py
index 4302ec304..bcc7ef049 100644
--- a/examples/cybersecurity/neq2lut.py
+++ b/examples/cybersecurity/neq2lut.py
@@ -20,7 +20,8 @@
 
 from logicnets.nn import generate_truth_tables, \
     lut_inference, \
-    module_list_to_verilog_module
+    module_list_to_verilog_module, \
+    load_histograms
 from logicnets.synthesis import synthesize_and_get_resource_counts
 from logicnets.util import proc_postsynth_file
@@ -34,6 +35,8 @@
     "checkpoint": None,
     "generate_bench": False,
    "add_registers": False,
+    "histograms": None,
+    "freq_thresh": None,
     "simulate_pre_synthesis_verilog": False,
     "simulate_post_synthesis_verilog": False,
 }
@@ -68,6 +71,10 @@
         help="A location to store the log output of the training run and the output model (default: %(default)s)")
     parser.add_argument('--checkpoint', type=str, required=True,
         help="The checkpoint file which contains the model weights")
+    parser.add_argument('--histograms', type=str, default=None,
+        help="The checkpoint histograms of LUT usage (default: %(default)s)")
+    parser.add_argument('--freq-thresh', type=int, default=None,
+        help="Threshold to use to include this truth table into the model (default: %(default)s)")
     parser.add_argument('--generate-bench', action='store_true', default=False,
         help="Generate the truth table in BENCH format as well as verilog (default: %(default)s)")
     parser.add_argument('--dump-io', action='store_true', default=False,
@@ -141,9 +148,12 @@
                  'test_accuracy': lut_accuracy}
     torch.save(modelSave, options_cfg["log_dir"] + "/lut_based_model.pth")
 
+    if options_cfg["histograms"] is not None:
+        luts = torch.load(options_cfg["histograms"])
+        load_histograms(lut_model, luts)
 
     print("Generating verilog in %s..." % (options_cfg["log_dir"]))
-    module_list_to_verilog_module(lut_model.module_list, "logicnet", options_cfg["log_dir"], generate_bench=options_cfg["generate_bench"], add_registers=options_cfg["add_registers"])
+    module_list_to_verilog_module(lut_model.module_list, "logicnet", options_cfg["log_dir"], generate_bench=options_cfg["generate_bench"], add_registers=options_cfg["add_registers"], freq_thresh=options_cfg["freq_thresh"])
     print("Top level entity stored at: %s/logicnet.v ..."
% (options_cfg["log_dir"])) if args.dump_io: @@ -154,9 +164,10 @@ else: io_filename = None + if args.simulate_pre_synthesis_verilog: print("Running inference simulation of Verilog-based model...") - lut_model.verilog_inference(options_cfg["log_dir"], "logicnet.v", logfile=io_filename, add_registers=options_cfg["add_registers"]) + lut_model.verilog_inference(options_cfg["log_dir"], "logicnet.v", logfile=io_filename, add_registers=options_cfg["add_registers"], verify=options_cfg["freq_thresh"] is None or options_cfg["freq_thresh"] == 0) verilog_accuracy = test(lut_model, test_loader, cuda=False) print("Verilog-Based Model accuracy: %f" % (verilog_accuracy)) @@ -166,7 +177,7 @@ if args.simulate_post_synthesis_verilog: print("Running post-synthesis inference simulation of Verilog-based model...") proc_postsynth_file(options_cfg["log_dir"]) - lut_model.verilog_inference(options_cfg["log_dir"]+"/post_synth", "logicnet_post_synth.v", io_filename, add_registers=options_cfg["add_registers"]) + lut_model.verilog_inference(options_cfg["log_dir"]+"/post_synth", "logicnet_post_synth.v", io_filename, add_registers=options_cfg["add_registers"], verify=options_cfg["freq_thresh"] is None or options_cfg["freq_thresh"] == 0) post_synth_accuracy = test(lut_model, test_loader, cuda=False) print("Post-synthesis Verilog-Based Model accuracy: %f" % (post_synth_accuracy)) diff --git a/examples/cybersecurity/train.py b/examples/cybersecurity/train.py index 3576ae15a..30dcba634 100644 --- a/examples/cybersecurity/train.py +++ b/examples/cybersecurity/train.py @@ -44,6 +44,8 @@ "learning_rate": 1e-1, "seed": 25, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "nid-s-comp": { "hidden_layers": [49, 7], @@ -59,6 +61,8 @@ "learning_rate": 1e-1, "seed": 81, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "nid-m": { "hidden_layers": [593, 256, 128, 128], @@ -74,6 +78,8 @@ "learning_rate": 1e-1, "seed": 20, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "nid-m-comp": { "hidden_layers": [593, 256, 49, 7], @@ -89,6 +95,8 @@ "learning_rate": 1e-1, "seed": 40, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "nid-l": { "hidden_layers": [593, 100, 100, 100], @@ -104,6 +112,8 @@ "learning_rate": 1e-1, "seed": 2, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "nid-l-comp": { "hidden_layers": [593, 100, 25, 5], @@ -119,6 +129,8 @@ "learning_rate": 1e-1, "seed": 83, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, } From 60e121372db588fd9771b89b78c1d24ef2b148af Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 11 Oct 2022 17:28:16 +0100 Subject: [PATCH 17/64] [abc] Updated script generation function to support specifying the rarity optimization command. --- src/logicnets/abc.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/src/logicnets/abc.py b/src/logicnets/abc.py index c3b56e568..c0966ce8f 100644 --- a/src/logicnets/abc.py +++ b/src/logicnets/abc.py @@ -56,7 +56,7 @@ def generate_prepare_script_string(num_layers, path): gen_monolithic_aig_string=gen_monolithic_aig_string) -def generate_opt_script_string(module_list, path, num_registers, rarity=0): +def generate_opt_script_string(module_list, path, num_registers, rarity=0, opt_cmd="&lnetopt"): opt_script_template = """\ # Generating script with rarity = {rarity}. 
@@ -78,7 +78,7 @@ def generate_opt_script_string(module_list, path, num_registers, rarity=0): &r {path}/aig/layers_opt.aig; &lneteval -O 2 {path}/test.simo {path}/test_output.txt """ - optimise_with_rarity_template = "&r {path}/layer{i}.aig; &ps; &lnetopt -I {fanin_bits} -O {fanout_bits} -R {rarity} {path}/train{it}.sim; &w {path}/aig/layer{i}_opt.aig; &ps; time\n" + optimise_with_rarity_template = "&r {path}/layer{i}.aig; &ps; {opt_cmd} -I {fanin_bits} -O {fanout_bits} -R {rarity} {path}/train{it}.sim; &w {path}/aig/layer{i}_opt.aig; &ps; time\n" technology_map_layer_template = "&r {path}/aig/layer{i}_opt.aig; &lnetmap -I {fanin_bits} -O {fanout_bits}; write {path}/blif/layer{i}_opt.blif; write_verilog -fm {path}/ver/layer{i}_opt.v\n" gen_monolithic_aig_template = "putontop {aig_layers_string}; st; ps; write {path}/aig/layers_opt.aig\n" gen_monolithic_blif_template = "putontop {blif_layers_string}; sw; ps; write {path}/blif/layers_opt.blif\n" @@ -98,7 +98,7 @@ def generate_opt_script_string(module_list, path, num_registers, rarity=0): fanout_bits = output_bitwidth # Generate optimisation script. - optimise_with_rarity_string += optimise_with_rarity_template.format(fanin_bits=fanin_bits, fanout_bits=fanout_bits, it="" if i == 0 else i, i=i, path=path, rarity=rarity) + optimise_with_rarity_string += optimise_with_rarity_template.format(fanin_bits=fanin_bits, fanout_bits=fanout_bits, it="" if i == 0 else i, i=i, path=path, rarity=rarity, opt_cmd=opt_cmd) technology_map_layers_string += technology_map_layer_template.format(fanin_bits=fanin_bits, fanout_bits=fanout_bits, i=i, path=path) aig_layers_string += "{path}/aig/layer{i}_opt.aig ".format(i=i, path=path) blif_layers_string += "{path}/blif/layer{i}_opt.blif ".format(i=i, path=path) From 5347456fa2a13b22301c9481393f230d3c83faab Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 11 Oct 2022 17:36:03 +0100 Subject: [PATCH 18/64] [docker] Updated ABC version. --- docker/Dockerfile.cpu | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docker/Dockerfile.cpu b/docker/Dockerfile.cpu index a52bb626b..dc7cb5b83 100644 --- a/docker/Dockerfile.cpu +++ b/docker/Dockerfile.cpu @@ -44,7 +44,7 @@ ENV NITROPARTSLIB=/workspace/Nitro-Parts-lib-Xilinx # Adding LogicNets dependency on ABC RUN git clone https://github.com/berkeley-abc/abc.git \ && cd abc \ - && git checkout ecda331a2a921bcac30bf3210f56adf9152ca22f \ + && git checkout 813a0f1ff1ae7512cb7947f54cd3f2ab252848c8 \ && make -j`nproc` ENV ABC_ROOT=/workspace/ABC From f32fe89f2de604ff4d533a2dae53d158c029296f Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Wed, 12 Oct 2022 16:38:12 +0100 Subject: [PATCH 19/64] [abc] Initial ABC synthesis flow. Need to fetch results from output strings. --- src/logicnets/abc.py | 105 +++++++++++++++++++++++++++++++++++++ src/logicnets/synthesis.py | 79 +++++++++++++++++++++------- 2 files changed, 164 insertions(+), 20 deletions(-) diff --git a/src/logicnets/abc.py b/src/logicnets/abc.py index c0966ce8f..80df04382 100644 --- a/src/logicnets/abc.py +++ b/src/logicnets/abc.py @@ -13,6 +13,111 @@ # See the License for the specific language governing permissions and # limitations under the License. 
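Every wrapper added below follows one subprocess pattern: assemble a single `abc -c "<commands>"` invocation, run it from the project directory, and hand back the captured output for later parsing. A condensed sketch of that shared shape (the helper name is illustrative, not part of the patch):

```python
import os
import subprocess

def run_abc(commands, abc_path=os.environ.get("ABC_ROOT", "."), working_dir=None, verbose=False):
    # `commands` is one semicolon-separated ABC script, e.g.
    # "&lnetread layer0.v; &ps; &w layer0.aig".
    cmd = [f"{abc_path}/abc", "-c", commands]
    if verbose:
        print(" ".join(cmd))
    proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ)
    out, err = proc.communicate()
    return out, err
```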
+import os +import subprocess + +def verilog_bench_to_aig(verilog_file, aig_file, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): + cmd = [f"{abc_path}/abc", '-c', f"&lnetread {verilog_file}; &ps; &w {aig_file}"] + if verbose: + print(" ".join(cmd)) + proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) + out, err = proc.communicate() + nodes = 0 + if verbose: + print(nodes) + print(out) + print(err) + return nodes, out, err # TODO: return the number of nodes + +def txt_to_sim(txt_file, sim_file, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): + cmd = [f"{abc_path}/abc", '-c', f"&lnetread {txt_file} {sim_file}"] + if verbose: + print(" ".join(cmd)) + proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) + out, err = proc.communicate() + if verbose: + print(out) + print(err) + return out, err + +def simulate_circuit(circuit_file, sim_input_file, sim_output_file, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): + cmd = [f"{abc_path}/abc", '-c', f"&r {circuit_file}; &lnetsim {sim_input_file} {sim_output_file}"] + if verbose: + print(" ".join(cmd)) + proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) + out, err = proc.communicate() + if verbose: + print(out) + print(err) + return out, err + +def putontop_aig(aig_files, output_aig_file, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): + cmd = [f"{abc_path}/abc", '-c', f"putontop {' '.join(aig_files)}; st; ps; write {output_aig_file}"] + if verbose: + print(" ".join(cmd)) + proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) + out, err = proc.communicate() + nodes = 0 + if verbose: + print(nodes) + print(out) + print(err) + return nodes, out, err # TODO: return the number of nodes + +def putontop_blif(blif_files, output_blif_file, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): + cmd = [f"{abc_path}/abc", '-c', f"putontop {' '.join(blif_files)}; sw; ps; write {output_blif_file}"] + if verbose: + print(" ".join(cmd)) + proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) + out, err = proc.communicate() + nodes = 0 + if verbose: + print(nodes) + print(out) + print(err) + return nodes, out, err # TODO: return the number of nodes + +def optimize_bdd_network(circuit_file, output_file, input_bitwidth, output_bitwidth, rarity, sim_file, opt_cmd="&lnetopt", abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): + cmd = [f"{abc_path}/abc", '-c', f"&r {circuit_file}; &ps; {opt_cmd} -I {input_bitwidth} -O {output_bitwidth} -R {rarity} {sim_file}; &w {output_file}; &ps; time"] + if verbose: + print(" ".join(cmd)) + proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) + out, err = proc.communicate() + nodes = 0 + tt_pct = 100. 
+ time_s = 0.0 + if verbose: + print(nodes) + print(tt_pct) + print(time_s) + print(out) + print(err) + return nodes, tt_pct, time_s, out, err # TODO: return the number of nodes, tt%, time + +def tech_map_circuit(circuit_file, output_blif, output_verilog, input_bitwidth, output_bitwidth, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): + cmd = [f"{abc_path}/abc", '-c', f"&r {circuit_file}; &lnetmap -I {input_bitwidth} -O {output_bitwidth}; write {output_blif}; write_verilog -fm {output_verilog}"] + if verbose: + print(" ".join(cmd)) + proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) + out, err = proc.communicate() + if verbose: + print(out) + print(err) + return out, err + +def evaluate_accuracy(circuit_file, sim_output_file, reference_txt, output_bitwidth, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): + cmd = [f"{abc_path}/abc", '-c', f"&r {circuit_file}; &lneteval -O {output_bitwidth} {sim_output_file} {reference_txt}"] + if verbose: + print(" ".join(cmd)) + proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) + out, err = proc.communicate() + accuracy = 0.0 + if verbose: + print(accuracy) + print(out) + print(err) + return accuracy, out, err # TODO: accuracy %, time + def generate_prepare_script_string(num_layers, path): prepare_script_template = """\ # This script prepares experiments in ABC by deriving intermediate simulation patterns diff --git a/src/logicnets/synthesis.py b/src/logicnets/synthesis.py index 195c552d8..c5956a458 100644 --- a/src/logicnets/synthesis.py +++ b/src/logicnets/synthesis.py @@ -18,7 +18,14 @@ from shutil import which import glob -from .abc import generate_prepare_script_string, generate_opt_script_string +from .abc import verilog_bench_to_aig,\ + txt_to_sim,\ + simulate_circuit,\ + putontop_aig,\ + putontop_blif,\ + optimize_bdd_network,\ + evaluate_accuracy,\ + tech_map_circuit #xcvu9p-flgb2104-2-i # TODO: Add option to perform synthesis on a remote server @@ -62,47 +69,79 @@ def synthesize_and_get_resource_counts(verilog_dir, top_name, fpga_part = "xcku3 return ret # Optimize the design with ABC -def synthesize_and_get_resource_counts_with_abc(verilog_dir, module_list, pipeline_stages=0, freq_thresh=0): +def synthesize_and_get_resource_counts_with_abc(verilog_dir, module_list, pipeline_stages=0, freq_thresh=0, train_input_txt="train_input.txt", train_output_txt="train_output.txt", test_input_txt="test_input.txt", test_output_txt="test_output.txt", verbose=False): if "ABC_ROOT" not in os.environ: raise Exception("The environment variable ABC_ROOT is not defined.") abc_path = os.environ["ABC_ROOT"] # Create directories and symlinks ready for processing with ABC - project_prefix = "logicnet" + project_prefix = "abc" abc_project_root = f"{verilog_dir}/{project_prefix}" verilog_bench_dir = f"{abc_project_root}/ver" aig_dir = f"{abc_project_root}/aig" blif_dir = f"{abc_project_root}/blif" + veropt_dir = f"{abc_project_root}/veropt" if not os.path.exists(verilog_bench_dir): os.makedirs(verilog_bench_dir) if not os.path.exists(aig_dir): os.makedirs(aig_dir) if not os.path.exists(blif_dir): os.makedirs(blif_dir) - real_abc_project_root = os.path.realpath(abc_project_root) - project_symlink_path = f"{abc_path}/{project_prefix}" - os.symlink(real_abc_project_root, project_symlink_path) # Create a symlink to this folder in the ABC root. 
+ if not os.path.exists(veropt_dir): + os.makedirs(veropt_dir) # Fetch the right source files from the verilog directory - source_files = glob.glob(f"{verilog_dir}/*.v") + glob.glob(f"{verilog_dir}/*.bench") + source_files = glob.glob(f"{verilog_dir}/logicnet.v") + [f"{verilog_dir}/layer{i}.v" for i in range(len(module_list))] + glob.glob(f"{verilog_dir}/*.bench") for f in source_files: shutil.copy(f, verilog_bench_dir) # Fetch the I/O files - for f in glob.glob(f"{verilog_dir}/*.txt"): + for f in list(map(lambda x: f"{verilog_dir}/{x}", [train_input_txt, train_output_txt, test_input_txt, test_output_txt])): shutil.copy(f, f"{abc_project_root}") - # Create script files to pass to ABC - # TODO: Calculate number of layers from the model - with open(f"{abc_project_root}/prepare.script", "w") as f: - f.write(generate_prepare_script_string(num_layers=len(module_list), path=project_prefix)) - with open(f"{abc_project_root}/opt_all.script", "w") as f: - f.write(generate_opt_script_string(module_list=module_list, path=project_prefix, num_registers=pipeline_stages, rarity=freq_thresh)) + # Preparation - model / I/O conversion + # Convert txt inputs into the sim format + out, err = txt_to_sim(train_input_txt, "train.sim", working_dir=abc_project_root, verbose=verbose) + out, err = txt_to_sim(test_input_txt, "test.sim", working_dir=abc_project_root) - #proc = subprocess.Popen(['./abc', '-c', '"x/jsc_s/prepare.script"', '-c', '"x/jsc_s/opt_all.script"'], cwd=abc_path, stdout=subprocess.PIPE, env=os.environ) - proc = subprocess.Popen(['./abc', '-c', f'"{project_prefix}/prepare.script"', '-c', f'"{project_prefix}/opt_all.script"'], cwd=abc_path, stdout=subprocess.PIPE, env=os.environ) - out, err = proc.communicate() + # Create AIGs from verilog + for i in range(len(module_list)): + nodes, out, err = verilog_bench_to_aig(f"ver/layer{i}.v", f"aig/layer{i}.aig", working_dir=abc_project_root, verbose=verbose) - with open(f"{abc_project_root}/abc.log", "w") as f: - f.write(out.decode("utf-8")) + # Simulate each layer + for i in range(len(module_list)): + out, err = simulate_circuit(f"aig/layer{i}.aig", f"train{i}.sim" if i != 0 else "train.sim", f"train{i+1}.sim", working_dir=abc_project_root, verbose=verbose) - os.remove(project_symlink_path) + # Synthesis + for i in range(len(module_list)): + _, input_bitwidth = module_list[i].input_quant.get_scale_factor_bits() + _, output_bitwidth = module_list[i].output_quant.get_scale_factor_bits() + indices, _, _, _ = module_list[i].neuron_truth_tables[0] + fanin = len(indices) + nodes, tt_pct, time, out, err = optimize_bdd_network(f"aig/layer{i}.aig", f"aig/layer{i}_full.aig", int(input_bitwidth*fanin), int(output_bitwidth), freq_thresh, f"train{i}.sim" if i != 0 else "train.sim", opt_cmd="&lnetopt", working_dir=abc_project_root, verbose=verbose) + + # Technology mapping + for i in range(len(module_list)): + _, input_bitwidth = module_list[i].input_quant.get_scale_factor_bits() + _, output_bitwidth = module_list[i].output_quant.get_scale_factor_bits() + indices, _, _, _ = module_list[i].neuron_truth_tables[0] + fanin = len(indices) + out, err = tech_map_circuit(f"aig/layer{i}_full.aig", f"blif/layer{i}_full.blif", f"veropt/layer{i}_full.v", int(input_bitwidth*fanin), int(output_bitwidth), working_dir=abc_project_root, verbose=verbose) + + # Generate monolithic circuits + if len(module_list) > 1: + nodes, out, err = putontop_aig([f"aig/layer{i}_full.aig" for i in range(len(module_list))], f"aig/layers_full.aig", working_dir=abc_project_root, verbose=verbose) + nodes, 
out, err = putontop_blif([f"blif/layer{i}_full.blif" for i in range(len(module_list))], f"blif/layers_full.blif", working_dir=abc_project_root, verbose=verbose) + else: + shutil.copy(f"{aig_dir}/layer0_full.aig", f"{aig_dir}/layers_full.aig") + shutil.copy(f"{blif_dir}/layer0_full.blif", f"{blif_dir}/layers_full.blif") + + # Evaluation + # Training set: + _, output_bitwidth = module_list[-1].output_quant.get_scale_factor_bits() + out, err = simulate_circuit(f"aig/layers_full.aig", "train.sim", "train.simo", working_dir=abc_project_root, verbose=verbose) + train_accuracy, out, err = evaluate_accuracy(f"aig/layers_full.aig", "train.simo", train_output_txt, int(output_bitwidth), working_dir=abc_project_root, verbose=verbose) + # Test set: + out, err = simulate_circuit(f"aig/layers_full.aig", "test.sim", "test.simo", working_dir=abc_project_root, verbose=verbose) + test_accuracy, out, err = evaluate_accuracy(f"aig/layers_full.aig", "test.simo", test_output_txt, int(output_bitwidth), working_dir=abc_project_root, verbose=verbose) + + return train_accuracy, test_accuracy, nodes From 5da1be51c4901f1b28f07b836aee5f28b0eb6da5 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Wed, 12 Oct 2022 16:46:12 +0100 Subject: [PATCH 20/64] [abc] Added option to specify the BDD command for synthesis preset. --- src/logicnets/synthesis.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/logicnets/synthesis.py b/src/logicnets/synthesis.py index c5956a458..909d22965 100644 --- a/src/logicnets/synthesis.py +++ b/src/logicnets/synthesis.py @@ -69,7 +69,7 @@ def synthesize_and_get_resource_counts(verilog_dir, top_name, fpga_part = "xcku3 return ret # Optimize the design with ABC -def synthesize_and_get_resource_counts_with_abc(verilog_dir, module_list, pipeline_stages=0, freq_thresh=0, train_input_txt="train_input.txt", train_output_txt="train_output.txt", test_input_txt="test_input.txt", test_output_txt="test_output.txt", verbose=False): +def synthesize_and_get_resource_counts_with_abc(verilog_dir, module_list, pipeline_stages=0, freq_thresh=0, train_input_txt="train_input.txt", train_output_txt="train_output.txt", test_input_txt="test_input.txt", test_output_txt="test_output.txt", bdd_opt_cmd="lnetopt", verbose=False): if "ABC_ROOT" not in os.environ: raise Exception("The environment variable ABC_ROOT is not defined.") abc_path = os.environ["ABC_ROOT"] @@ -116,7 +116,7 @@ def synthesize_and_get_resource_counts_with_abc(verilog_dir, module_list, pipeli _, output_bitwidth = module_list[i].output_quant.get_scale_factor_bits() indices, _, _, _ = module_list[i].neuron_truth_tables[0] fanin = len(indices) - nodes, tt_pct, time, out, err = optimize_bdd_network(f"aig/layer{i}.aig", f"aig/layer{i}_full.aig", int(input_bitwidth*fanin), int(output_bitwidth), freq_thresh, f"train{i}.sim" if i != 0 else "train.sim", opt_cmd="&lnetopt", working_dir=abc_project_root, verbose=verbose) + nodes, tt_pct, time, out, err = optimize_bdd_network(f"aig/layer{i}.aig", f"aig/layer{i}_full.aig", int(input_bitwidth*fanin), int(output_bitwidth), freq_thresh, f"train{i}.sim" if i != 0 else "train.sim", opt_cmd=bdd_opt_cmd, working_dir=abc_project_root, verbose=verbose) # Technology mapping for i in range(len(module_list)): From 580a04ffa54a1ebe85936502f5bc79f544883873 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Wed, 12 Oct 2022 18:04:12 +0100 Subject: [PATCH 21/64] [abc] Used re to extract important information for the ABC logs. 
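The regular expressions introduced in this patch pull the interesting numbers out of ABC's textual logs, e.g. the AND-node count printed by `&ps`. A toy illustration of the extraction (the stats line is invented):

```python
import re

_aig_re = re.compile(r"and\s+=\s+\d+")

log = "aig: i/o = 593/10  and = 1234  lev = 7"  # invented &ps output
nodes = int(_aig_re.search(log).group().split(" ")[-1])
print(nodes)  # -> 1234
```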
--- src/logicnets/abc.py | 30 +++++++++++++++++++++++------- src/logicnets/synthesis.py | 4 +++- 2 files changed, 26 insertions(+), 8 deletions(-) diff --git a/src/logicnets/abc.py b/src/logicnets/abc.py index 80df04382..b8382b461 100644 --- a/src/logicnets/abc.py +++ b/src/logicnets/abc.py @@ -15,6 +15,12 @@ import os import subprocess +import re + +_aig_re_str = r'and\s+=\s+\d+' +_acc_re_str = r'The\s+accuracy\s+is\s+\d+\.\d+' +_avg_cs_re_str = r'Average\s+care\s+set\s+is\s+\d+\.\d+' +_elapse_s_re_str = r'elapse:\s+\d+\.\d+' def verilog_bench_to_aig(verilog_file, aig_file, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): cmd = [f"{abc_path}/abc", '-c', f"&lnetread {verilog_file}; &ps; &w {aig_file}"] @@ -22,7 +28,8 @@ def verilog_bench_to_aig(verilog_file, aig_file, abc_path=os.environ["ABC_ROOT"] print(" ".join(cmd)) proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) out, err = proc.communicate() - nodes = 0 + aig_re = re.compile(_aig_re_str) + nodes = int(aig_re.search(str(out)).group().split(" ")[-1]) if verbose: print(nodes) print(out) @@ -57,7 +64,8 @@ def putontop_aig(aig_files, output_aig_file, abc_path=os.environ["ABC_ROOT"], wo print(" ".join(cmd)) proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) out, err = proc.communicate() - nodes = 0 + aig_re = re.compile(_aig_re_str) + nodes = int(aig_re.search(str(out)).group().split(" ")[-1]) if verbose: print(nodes) print(out) @@ -70,7 +78,8 @@ def putontop_blif(blif_files, output_blif_file, abc_path=os.environ["ABC_ROOT"], print(" ".join(cmd)) proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) out, err = proc.communicate() - nodes = 0 + aig_re = re.compile(_aig_re_str) + nodes = int(aig_re.search(str(out)).group().split(" ")[-1]) if verbose: print(nodes) print(out) @@ -83,9 +92,15 @@ def optimize_bdd_network(circuit_file, output_file, input_bitwidth, output_bitwi print(" ".join(cmd)) proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) out, err = proc.communicate() - nodes = 0 - tt_pct = 100. 
- time_s = 0.0 + aig_re = re.compile(_aig_re_str) + nodes = int(aig_re.search(str(out)).group().split(" ")[-1]) + if opt_cmd == "&lnetopt": + tt_pct_re = re.compile(_avg_cs_re_str) + tt_pct = float(tt_pct_re.search(str(out)).group().split(" ")[-1]) + else: + tt_pct = None + time_re = re.compile(_elapse_s_re_str) + time_s = float(time_re.search(str(out)).group().split(" ")[-1]) if verbose: print(nodes) print(tt_pct) @@ -111,7 +126,8 @@ def evaluate_accuracy(circuit_file, sim_output_file, reference_txt, output_bitwi print(" ".join(cmd)) proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) out, err = proc.communicate() - accuracy = 0.0 + acc_re = re.compile(_acc_re_str) + accuracy = float(acc_re.search(str(out)).group().split(" ")[-1]) if verbose: print(accuracy) print(out) diff --git a/src/logicnets/synthesis.py b/src/logicnets/synthesis.py index 909d22965..753b883f1 100644 --- a/src/logicnets/synthesis.py +++ b/src/logicnets/synthesis.py @@ -111,12 +111,14 @@ def synthesize_and_get_resource_counts_with_abc(verilog_dir, module_list, pipeli out, err = simulate_circuit(f"aig/layer{i}.aig", f"train{i}.sim" if i != 0 else "train.sim", f"train{i+1}.sim", working_dir=abc_project_root, verbose=verbose) # Synthesis + average_tt_pcts = [] for i in range(len(module_list)): _, input_bitwidth = module_list[i].input_quant.get_scale_factor_bits() _, output_bitwidth = module_list[i].output_quant.get_scale_factor_bits() indices, _, _, _ = module_list[i].neuron_truth_tables[0] fanin = len(indices) nodes, tt_pct, time, out, err = optimize_bdd_network(f"aig/layer{i}.aig", f"aig/layer{i}_full.aig", int(input_bitwidth*fanin), int(output_bitwidth), freq_thresh, f"train{i}.sim" if i != 0 else "train.sim", opt_cmd=bdd_opt_cmd, working_dir=abc_project_root, verbose=verbose) + average_tt_pcts.append(tt_pct) # Technology mapping for i in range(len(module_list)): @@ -143,5 +145,5 @@ def synthesize_and_get_resource_counts_with_abc(verilog_dir, module_list, pipeli out, err = simulate_circuit(f"aig/layers_full.aig", "test.sim", "test.simo", working_dir=abc_project_root, verbose=verbose) test_accuracy, out, err = evaluate_accuracy(f"aig/layers_full.aig", "test.simo", test_output_txt, int(output_bitwidth), working_dir=abc_project_root, verbose=verbose) - return train_accuracy, test_accuracy, nodes + return train_accuracy, test_accuracy, nodes, average_tt_pcts From 2b4273e7267b9dc81b37e58f26d59092cd4288c2 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Thu, 13 Oct 2022 17:00:31 +0100 Subject: [PATCH 22/64] [abc] Added functions for generic synthesis optimizations and final tech mapping / pipelining. 
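The iterative optimizer added in this patch re-runs ABC's `mfs2` pass until the LUT count stops improving and keeps the best intermediate netlist. Its control flow, reduced to its essence (`run_mfs2_pass` stands in for one ABC invocation returning the node count):

```python
def iterate_to_fixpoint(run_mfs2_pass, max_loop=100):
    best = None
    for _ in range(max_loop):
        nodes = run_mfs2_pass()
        if best is not None and nodes >= best:
            break  # no further improvement; keep the previous best
        best = nodes
    return best

counts = iter([900, 850, 850])
print(iterate_to_fixpoint(lambda: next(counts)))  # -> 850
```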
--- src/logicnets/abc.py | 89 +++++++++++++++++++++++++++++++++++++- src/logicnets/synthesis.py | 16 ++++++- 2 files changed, 101 insertions(+), 4 deletions(-) diff --git a/src/logicnets/abc.py b/src/logicnets/abc.py index b8382b461..7e8e95902 100644 --- a/src/logicnets/abc.py +++ b/src/logicnets/abc.py @@ -16,8 +16,10 @@ import os import subprocess import re +import shutil _aig_re_str = r'and\s+=\s+\d+' +_lut_re_str = r'nd\s+=\s+\d+' _acc_re_str = r'The\s+accuracy\s+is\s+\d+\.\d+' _avg_cs_re_str = r'Average\s+care\s+set\s+is\s+\d+\.\d+' _elapse_s_re_str = r'elapse:\s+\d+\.\d+' @@ -109,8 +111,63 @@ def optimize_bdd_network(circuit_file, output_file, input_bitwidth, output_bitwi print(err) return nodes, tt_pct, time_s, out, err # TODO: return the number of nodes, tt%, time -def tech_map_circuit(circuit_file, output_blif, output_verilog, input_bitwidth, output_bitwidth, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): - cmd = [f"{abc_path}/abc", '-c', f"&r {circuit_file}; &lnetmap -I {input_bitwidth} -O {output_bitwidth}; write {output_blif}; write_verilog -fm {output_verilog}"] +def optimize_mfs2(circuit_file, output_file, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): + cmd = [f"{abc_path}/abc", '-c', f"read {circuit_file}; if -K 6 -a; mfs2; write_blif {output_file}; print_stats"] + if verbose: + print(" ".join(cmd)) + proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) + out, err = proc.communicate() + lut_re = re.compile(_lut_re_str) + nodes = int(lut_re.search(str(out)).group().split(" ")[-1]) + if verbose: + print(nodes) + print(out) + print(err) + return nodes, out, err # TODO: return the number of nodes + +def iterative_mfs2_optimize(circuit_file, output_file, tmp_file="tmp.blif", max_loop=100, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): + tmp_file_path = tmp_file if working_dir is None else f"{working_dir}/{tmp_file}" + output_file_path = output_file if working_dir is None else f"{working_dir}/{output_file}" + cmd = [f"{abc_path}/abc", '-c', f"read {circuit_file}; sweep; write_blif {tmp_file}; print_stats"] + if verbose: + print(" ".join(cmd)) + proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) + out, err = proc.communicate() + lut_re = re.compile(_lut_re_str) + nodes = int(lut_re.search(str(out)).group().split(" ")[-1]) + best = nodes + shutil.copy(tmp_file_path, output_file_path) + if verbose: + print(nodes) + print(best) + print(out) + print(err) + for i in range(max_loop): + if i == 0: + cmd = [f"{abc_path}/abc", '-c', f"read {tmp_file}; mfs2; write_blif {tmp_file}; print_stats"] + proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) + if verbose: + print(" ".join(cmd)) + out, err = proc.communicate() + lut_re = re.compile(_lut_re_str) + nodes = int(lut_re.search(str(out)).group().split(" ")[-1]) + if verbose: + print(nodes) + print(out) + print(err) + else: + nodes, out, err = optimize_mfs2(tmp_file, tmp_file, abc_path=abc_path, working_dir=working_dir, verbose=verbose) + if nodes >= best: + break + else: + print(best) + best = nodes + shutil.copy(tmp_file_path, output_file_path) + os.remove(tmp_file_path) + return best + +def tech_map_circuit(circuit_file, output_blif, input_bitwidth, output_bitwidth, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): + cmd = [f"{abc_path}/abc", '-c', f"&r {circuit_file}; &lnetmap -I {input_bitwidth} -O {output_bitwidth}; write {output_blif}"] if verbose: print(" 
".join(cmd)) proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) @@ -120,6 +177,34 @@ def tech_map_circuit(circuit_file, output_blif, output_verilog, input_bitwidth, print(err) return out, err +def pipeline_tech_mapped_circuit(circuit_file, output_verilog, num_registers, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): + cmd = [f"{abc_path}/abc", '-c', f"&r {circuit_file}; ps; pipe -L {num_registers}; ps; retime -M 4; ps; sweep; ps; write_verilog -fm {output_verilog}"] + if verbose: + print(" ".join(cmd)) + proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) + out, err = proc.communicate() + lut_re = re.compile(_lut_re_str) + nodes = int(lut_re.search(str(out)).group().split(" ")[-1]) + if verbose: + print(nodes) + print(out) + print(err) + return out, err + +def tech_map_to_verilog(circuit_file, output_verilog, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): + cmd = [f"{abc_path}/abc", '-c', f"read {circuit_file}; print_stats; write_verilog -fm {output_verilog}"] + if verbose: + print(" ".join(cmd)) + proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) + out, err = proc.communicate() + lut_re = re.compile(_lut_re_str) + nodes = int(lut_re.search(str(out)).group().split(" ")[-1]) + if verbose: + print(nodes) + print(out) + print(err) + return nodes, out, err + def evaluate_accuracy(circuit_file, sim_output_file, reference_txt, output_bitwidth, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): cmd = [f"{abc_path}/abc", '-c', f"&r {circuit_file}; &lneteval -O {output_bitwidth} {sim_output_file} {reference_txt}"] if verbose: diff --git a/src/logicnets/synthesis.py b/src/logicnets/synthesis.py index 753b883f1..7c4fe1eac 100644 --- a/src/logicnets/synthesis.py +++ b/src/logicnets/synthesis.py @@ -25,7 +25,10 @@ putontop_blif,\ optimize_bdd_network,\ evaluate_accuracy,\ - tech_map_circuit + tech_map_circuit,\ + iterative_mfs2_optimize,\ + pipeline_tech_mapped_circuit,\ + tech_map_to_verilog #xcvu9p-flgb2104-2-i # TODO: Add option to perform synthesis on a remote server @@ -126,7 +129,7 @@ def synthesize_and_get_resource_counts_with_abc(verilog_dir, module_list, pipeli _, output_bitwidth = module_list[i].output_quant.get_scale_factor_bits() indices, _, _, _ = module_list[i].neuron_truth_tables[0] fanin = len(indices) - out, err = tech_map_circuit(f"aig/layer{i}_full.aig", f"blif/layer{i}_full.blif", f"veropt/layer{i}_full.v", int(input_bitwidth*fanin), int(output_bitwidth), working_dir=abc_project_root, verbose=verbose) + out, err = tech_map_circuit(f"aig/layer{i}_full.aig", f"blif/layer{i}_full.blif", int(input_bitwidth*fanin), int(output_bitwidth), working_dir=abc_project_root, verbose=verbose) # Generate monolithic circuits if len(module_list) > 1: @@ -136,6 +139,15 @@ def synthesize_and_get_resource_counts_with_abc(verilog_dir, module_list, pipeli shutil.copy(f"{aig_dir}/layer0_full.aig", f"{aig_dir}/layers_full.aig") shutil.copy(f"{blif_dir}/layer0_full.blif", f"{blif_dir}/layers_full.blif") + # Generic logic synthesis optimizations + nodes = iterative_mfs2_optimize(circuit_file=f"blif/layers_full.blif", output_file=f"blif/layers_full_opt.blif", tmp_file="blif/tmp.blif", max_loop=100, working_dir=abc_project_root, verbose=verbose) + + # Generate verilog, with or without pipelining + if pipeline_stages == 0: + nodes, out, err = tech_map_to_verilog(circuit_file=f"blif/layers_full_opt.blif", output_verilog=f"veropt/layers_full_opt.v", 
working_dir=abc_project_root, verbose=verbose)
+    else:
+        nodes, out, err = pipeline_tech_mapped_circuit(circuit_file=f"blif/layers_full_opt.blif", output_verilog=f"veropt/layers_full_opt.v", num_registers=pipeline_stages, working_dir=abc_project_root, verbose=verbose)
+
     # Evaluation
     # Training set:
     _, output_bitwidth = module_list[-1].output_quant.get_scale_factor_bits()

From 314949387e5515f34f0e4002b3c8f69cdc7122a8 Mon Sep 17 00:00:00 2001
From: Nick Fraser
Date: Thu, 13 Oct 2022 17:15:51 +0100
Subject: [PATCH 23/64] [abc] Updated simulation/evaluation to work on blif models.

---
 src/logicnets/abc.py       | 16 +++++++++++++---
 src/logicnets/synthesis.py |  8 ++++----
 2 files changed, 17 insertions(+), 7 deletions(-)

diff --git a/src/logicnets/abc.py b/src/logicnets/abc.py
index 7e8e95902..b3aba9783 100644
--- a/src/logicnets/abc.py
+++ b/src/logicnets/abc.py
@@ -50,7 +50,12 @@ def txt_to_sim(txt_file, sim_file, abc_path=os.environ["ABC_ROOT"], working_dir=
     return out, err
 
 def simulate_circuit(circuit_file, sim_input_file, sim_output_file, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False):
-    cmd = [f"{abc_path}/abc", '-c', f"&r {circuit_file}; &lnetsim {sim_input_file} {sim_output_file}"]
+    if circuit_file.endswith(".aig"):
+        cmd = [f"{abc_path}/abc", '-c', f"&r {circuit_file}; &lnetsim {sim_input_file} {sim_output_file}"]
+    elif circuit_file.endswith(".blif"):
+        cmd = [f"{abc_path}/abc", '-c', f"read {circuit_file}; strash; &get; &lnetsim {sim_input_file} {sim_output_file}"]
+    else:
+        raise ValueError(f"Unsupported file type: {circuit_file}")
     if verbose:
         print(" ".join(cmd))
     proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ)
@@ -178,7 +183,7 @@ def tech_map_circuit(circuit_file, output_blif, input_bitwidth, output_bitwidth,
     return out, err
 
 def pipeline_tech_mapped_circuit(circuit_file, output_verilog, num_registers, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False):
-    cmd = [f"{abc_path}/abc", '-c', f"&r {circuit_file}; ps; pipe -L {num_registers}; ps; retime -M 4; ps; sweep; ps; write_verilog -fm {output_verilog}"]
+    cmd = [f"{abc_path}/abc", '-c', f"read {circuit_file}; print_stats; pipe -L {num_registers}; print_stats; retime -M 4; print_stats; sweep; print_stats; write_verilog -fm {output_verilog}"]
     if verbose:
         print(" ".join(cmd))
     proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ)
@@ -206,7 +211,12 @@ def tech_map_to_verilog(circuit_file, output_verilog, abc_path=os.environ["ABC_R
     return nodes, out, err
 
 def evaluate_accuracy(circuit_file, sim_output_file, reference_txt, output_bitwidth, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False):
-    cmd = [f"{abc_path}/abc", '-c', f"&r {circuit_file}; &lneteval -O {output_bitwidth} {sim_output_file} {reference_txt}"]
+    if circuit_file.endswith(".aig"):
+        cmd = [f"{abc_path}/abc", '-c', f"&r {circuit_file}; &lneteval -O {output_bitwidth} {sim_output_file} {reference_txt}"]
+    elif circuit_file.endswith(".blif"):
+        cmd = [f"{abc_path}/abc", '-c', f"read {circuit_file}; strash; &get; &lneteval -O {output_bitwidth} {sim_output_file} {reference_txt}"]
+    else:
+        raise ValueError(f"Unsupported file type: {circuit_file}")
     if verbose:
         print(" ".join(cmd))
     proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ)
diff --git a/src/logicnets/synthesis.py b/src/logicnets/synthesis.py
index 7c4fe1eac..36ffbfcf3 100644
--- a/src/logicnets/synthesis.py
+++ b/src/logicnets/synthesis.py
@@ -151,11 +151,11 @@ def 
synthesize_and_get_resource_counts_with_abc(verilog_dir, module_list, pipeli # Evaluation # Training set: _, output_bitwidth = module_list[-1].output_quant.get_scale_factor_bits() - out, err = simulate_circuit(f"aig/layers_full.aig", "train.sim", "train.simo", working_dir=abc_project_root, verbose=verbose) - train_accuracy, out, err = evaluate_accuracy(f"aig/layers_full.aig", "train.simo", train_output_txt, int(output_bitwidth), working_dir=abc_project_root, verbose=verbose) + out, err = simulate_circuit(f"blif/layers_full_opt.blif", "train.sim", "train.simo", working_dir=abc_project_root, verbose=verbose) + train_accuracy, out, err = evaluate_accuracy(f"blif/layers_full_opt.blif", "train.simo", train_output_txt, int(output_bitwidth), working_dir=abc_project_root, verbose=verbose) # Test set: - out, err = simulate_circuit(f"aig/layers_full.aig", "test.sim", "test.simo", working_dir=abc_project_root, verbose=verbose) - test_accuracy, out, err = evaluate_accuracy(f"aig/layers_full.aig", "test.simo", test_output_txt, int(output_bitwidth), working_dir=abc_project_root, verbose=verbose) + out, err = simulate_circuit(f"blif/layers_full_opt.blif", "test.sim", "test.simo", working_dir=abc_project_root, verbose=verbose) + test_accuracy, out, err = evaluate_accuracy(f"blif/layers_full_opt.blif", "test.simo", test_output_txt, int(output_bitwidth), working_dir=abc_project_root, verbose=verbose) return train_accuracy, test_accuracy, nodes, average_tt_pcts From d345c38a8b94bb42573e445d18408952da2ae9b5 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 18 Oct 2022 12:14:32 +0100 Subject: [PATCH 24/64] [abc] Bugfixes for putontop commands. --- src/logicnets/abc.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/src/logicnets/abc.py b/src/logicnets/abc.py index b3aba9783..e53e7dccc 100644 --- a/src/logicnets/abc.py +++ b/src/logicnets/abc.py @@ -66,7 +66,7 @@ def simulate_circuit(circuit_file, sim_input_file, sim_output_file, abc_path=os. return out, err def putontop_aig(aig_files, output_aig_file, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): - cmd = [f"{abc_path}/abc", '-c', f"putontop {' '.join(aig_files)}; st; ps; write {output_aig_file}"] + cmd = [f"{abc_path}/abc", '-c', f"putontop {' '.join(aig_files)}; strash; print_stats; write {output_aig_file}"] if verbose: print(" ".join(cmd)) proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) @@ -80,13 +80,13 @@ def putontop_aig(aig_files, output_aig_file, abc_path=os.environ["ABC_ROOT"], wo return nodes, out, err # TODO: return the number of nodes def putontop_blif(blif_files, output_blif_file, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): - cmd = [f"{abc_path}/abc", '-c', f"putontop {' '.join(blif_files)}; sw; ps; write {output_blif_file}"] + cmd = [f"{abc_path}/abc", '-c', f"putontop {' '.join(blif_files)}; sweep; print_stats; write {output_blif_file}"] if verbose: print(" ".join(cmd)) proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) out, err = proc.communicate() - aig_re = re.compile(_aig_re_str) - nodes = int(aig_re.search(str(out)).group().split(" ")[-1]) + lut_re = re.compile(_lut_re_str) + nodes = int(lut_re.search(str(out)).group().split(" ")[-1]) if verbose: print(nodes) print(out) From 22736317e88e0f44a1fc8ab7b7de08b52e2e4aac Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 18 Oct 2022 12:15:07 +0100 Subject: [PATCH 25/64] [abc] Disabled print of the best model in the iterative optimizer. 
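The `putontop` fix in PATCH 24 above hinges on how ABC reports sizes: `print_stats` on an AIG prints `and = N`, while a mapped BLIF netlist prints `nd = N`, so the BLIF path needs the LUT regex. Illustrated with an invented stats line:

```python
import re

_aig_re = re.compile(r"and\s+=\s+\d+")
_lut_re = re.compile(r"nd\s+=\s+\d+")

blif_stats = "netlist: i/o = 593/10  nd = 842  edge = 3105"  # invented print_stats output
assert _aig_re.search(blif_stats) is None  # the old AIG pattern finds nothing here
print(int(_lut_re.search(blif_stats).group().split(" ")[-1]))  # -> 842
```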
--- src/logicnets/abc.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/src/logicnets/abc.py b/src/logicnets/abc.py index e53e7dccc..b5c07c4cc 100644 --- a/src/logicnets/abc.py +++ b/src/logicnets/abc.py @@ -165,7 +165,8 @@ def iterative_mfs2_optimize(circuit_file, output_file, tmp_file="tmp.blif", max_ if nodes >= best: break else: - print(best) + if verbose: + print(best) best = nodes shutil.copy(tmp_file_path, output_file_path) os.remove(tmp_file_path) From 0d01979aff97d936e3937f0b1c4c4d8b1d371e26 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 18 Oct 2022 12:16:17 +0100 Subject: [PATCH 26/64] [abc] Added PyVerilator compatible verilog wrapper and post-process functions for ABC-generated verilog. --- src/logicnets/verilog.py | 43 ++++++++++++++++++++++++++++++++++++++++ 1 file changed, 43 insertions(+) diff --git a/src/logicnets/verilog.py b/src/logicnets/verilog.py index f073a4692..9d4f0ab30 100644 --- a/src/logicnets/verilog.py +++ b/src/logicnets/verilog.py @@ -12,6 +12,8 @@ # See the License for the specific language governing permissions and # limitations under the License. +import numpy as np + def generate_register_verilog(module_name="myreg", param_name="DataWidth", input_name="data_in", output_name="data_out"): register_template = """\ module {module_name} #(parameter {param_name}=16) ( @@ -91,3 +93,44 @@ def generate_neuron_connection_verilog(input_indices, input_bitwidth): connection_string += ", " return connection_string +def fix_abc_module_name(input_verilog_file, output_verilog_file, old_module_name, new_module_name, add_timescale: bool = False): + with open(input_verilog_file, 'r') as f: + lines = f.readlines() + with open(output_verilog_file, 'w') as f: + if add_timescale: + f.write("`timescale 1 ps / 1 ps\n") + for l in lines: + if l.__contains__(f"module {old_module_name}"): + l = f"module {new_module_name} (\n" + f.write(l) + +def generate_abc_verilog_wrapper(module_name: str, input_name: str, input_bits: int, output_name: str, output_bits: int, submodule_name: str, num_registers: int, add_timescale: bool = True): + abc_wrapper_template = """\ +{timescale} +module {module_name} (input [{input_bits_1:d}:0] {input_name}, input clk, input rst, output[{output_bits_1:d}:0] {output_name}); +{module_contents} +endmodule\n""" + input_digits = int(np.ceil(np.log10(input_bits))) + output_digits = int(np.ceil(np.log10(output_bits))) + module_contents = [] + module_contents.append(f"{submodule_name} {submodule_name}_inst (") + # Connect inputs + if num_registers > 0: + module_contents.append(f" .clock(clk),") + for i in range(input_bits): + module_contents.append(f" .pi{i:0{input_digits}d}({input_name}[{i}]),") + for i in range(output_bits): + if i < output_bits-1: + module_contents.append(f" .po{i:0{output_digits}d}({output_name}[{i}]),") + else: + module_contents.append(f" .po{i:0{output_digits}d}({output_name}[{i}])") + module_contents.append(f" );\n") + module_contents = "\n".join(module_contents) + return abc_wrapper_template.format( module_name=module_name, + input_name=input_name, + input_bits_1=input_bits-1, + output_name=output_name, + output_bits_1=output_bits-1, + module_contents=module_contents, + timescale="`timescale 1 ps / 1 ps" if add_timescale else "") + From ebdb1f09a5d302a1a5385decb558f49084e1ff0a Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 18 Oct 2022 12:18:21 +0100 Subject: [PATCH 27/64] [synthesis] Updated ABC synthesis to fix the generated verilog and generate the verilog wrapper. 
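PATCH 26 above adds `generate_abc_verilog_wrapper` ahead of its first caller in the next patch. A quick illustration of how it is meant to be used (the widths are invented for the example):

```python
from logicnets.verilog import generate_abc_verilog_wrapper

# Wrap an ABC-generated module with bit-blasted pi../po.. ports into a
# bus-style top-level entity; num_registers > 0 also wires up .clock(clk).
wrapper = generate_abc_verilog_wrapper(
    module_name="logicnet",
    input_name="M0", input_bits=32,
    output_name="M3", output_bits=10,
    submodule_name="layers_full_opt",
    num_registers=2)
print(wrapper)
```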
--- src/logicnets/synthesis.py | 14 ++++++++++++++ 1 file changed, 14 insertions(+) diff --git a/src/logicnets/synthesis.py b/src/logicnets/synthesis.py index 36ffbfcf3..4856640c4 100644 --- a/src/logicnets/synthesis.py +++ b/src/logicnets/synthesis.py @@ -29,6 +29,8 @@ iterative_mfs2_optimize,\ pipeline_tech_mapped_circuit,\ tech_map_to_verilog +from .verilog import generate_abc_verilog_wrapper,\ + fix_abc_module_name #xcvu9p-flgb2104-2-i # TODO: Add option to perform synthesis on a remote server @@ -147,6 +149,18 @@ def synthesize_and_get_resource_counts_with_abc(verilog_dir, module_list, pipeli nodes, out, err = tech_map_to_verilog(circuit_file=f"blif/layers_full_opt.blif", output_verilog=f"veropt/layers_full_opt.v", working_dir=abc_project_root, verbose=verbose) else: nodes, out, err = pipeline_tech_mapped_circuit(circuit_file=f"blif/layers_full_opt.blif", output_verilog=f"veropt/layers_full_opt.v", num_registers=num_registers, working_dir=abc_project_root, verbose=verbose) + fix_abc_module_name(f"{veropt_dir}/layers_full_opt.v", f"{veropt_dir}/layers_full_opt.v", "\\aig", "layers_full_opt", add_timescale=True) + + # Generate top-level entity wrapper + _, input_bitwidth = module_list[0].input_quant.get_scale_factor_bits() + _, output_bitwidth = module_list[-1].output_quant.get_scale_factor_bits() + input_bitwidth, output_bitwidth = int(input_bitwidth), int(output_bitwidth) + total_input_bits = module_list[0].in_features*input_bitwidth + total_output_bits = module_list[-1].out_features*output_bitwidth + module_name="logicnet" + veropt_wrapper_str = generate_abc_verilog_wrapper(module_name=module_name, input_name="M0", input_bits=total_input_bits, output_name=f"M{len(module_list)}", output_bits=total_output_bits, submodule_name="layers_full_opt", num_registers=pipeline_stages) + with open(f"{veropt_dir}/{module_name}.v", "w") as f: + f.write(veropt_wrapper_str) # Evaluation # Training set: From 71bc3d7f782f4663f02c441cd64cc12206d94ef0 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 18 Oct 2022 13:30:36 +0100 Subject: [PATCH 28/64] [jsc] Updated neq2lut_abc scripts to work with new end-to-end ABC synthesis flow. 
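The wrapper port widths computed in the patch above are simply features times bits per feature; with invented numbers:

```python
# e.g. 16 input features at 2 bits each, 5 outputs at 2 bits each:
in_features, input_bitwidth = 16, 2
out_features, output_bitwidth = 5, 2
total_input_bits = in_features * input_bitwidth      # 32 -> M0 is [31:0]
total_output_bits = out_features * output_bitwidth   # 10 -> M<n> is [9:0]
```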
--- examples/jet_substructure/neq2lut_abc.py | 20 +++++++++++++++++--- 1 file changed, 17 insertions(+), 3 deletions(-) diff --git a/examples/jet_substructure/neq2lut_abc.py b/examples/jet_substructure/neq2lut_abc.py index bdd431c2e..1f2cc4709 100644 --- a/examples/jet_substructure/neq2lut_abc.py +++ b/examples/jet_substructure/neq2lut_abc.py @@ -20,7 +20,8 @@ from logicnets.nn import generate_truth_tables, \ lut_inference, \ - module_list_to_verilog_module + module_list_to_verilog_module, \ + load_histograms from logicnets.synthesis import synthesize_and_get_resource_counts_with_abc from train import configs, model_config, dataset_config, test @@ -32,10 +33,12 @@ "cuda": None, "log_dir": None, "checkpoint": None, + "histograms": None, + "freq_thresh": None, } if __name__ == "__main__": - parser = ArgumentParser(description="Synthesize convert a PyTorch trained model into verilog") + parser = ArgumentParser(description="Synthesize convert a PyTorch trained model into verilog using ABC") parser.add_argument('--arch', type=str, choices=configs.keys(), default="jsc-s", help="Specific the neural network model to use (default: %(default)s)") parser.add_argument('--batch-size', type=int, default=None, metavar='N', @@ -66,6 +69,10 @@ help="A location to store the log output of the training run and the output model (default: %(default)s)") parser.add_argument('--checkpoint', type=str, required=True, help="The checkpoint file which contains the model weights") + parser.add_argument('--histograms', type=str, default=None, + help="The checkpoint histograms of LUT usage (default: %(default)s)") + parser.add_argument('--freq-thresh', type=int, default=None, + help="Threshold to use to include this truth table into the model (default: %(default)s)") parser.add_argument('--num-registers', type=int, default=0, help="The number of registers to add to the generated verilog (default: %(default)s)") args = parser.parse_args() @@ -144,11 +151,18 @@ 'test_accuracy': lut_accuracy} torch.save(modelSave, options_cfg["log_dir"] + "/lut_based_model.pth") + if options_cfg["histograms"] is not None: + luts = torch.load(options_cfg["histograms"]) + load_histograms(lut_model, luts) print("Generating verilog in %s..." % (options_cfg["log_dir"])) module_list_to_verilog_module(lut_model.module_list, "logicnet", options_cfg["log_dir"], generate_bench=True, add_registers=False) print("Top level entity stored at: %s/logicnet.v ..." % (options_cfg["log_dir"])) print("Running synthesis and verilog technology-mapped verilog in ABC") - synthesize_and_get_resource_counts_with_abc(options_cfg["log_dir"], lut_model.module_list, pipeline_stages=args.num_registers, freq_thresh=0) + train_accuracy, test_accuracy, nodes, average_care_set_size = synthesize_and_get_resource_counts_with_abc(options_cfg["log_dir"], lut_model.module_list, pipeline_stages=args.num_registers, freq_thresh=args.freq_thresh, train_input_txt="train_input.txt", train_output_txt="train_output.txt", test_input_txt="test_input.txt", test_output_txt="test_output.txt", bdd_opt_cmd="&ttopt", verbose=False) + print(f"Training set accuracy(%): {train_accuracy}") + print(f"Test set accuracy(%): {test_accuracy}") + print(f"LUT6(#): {nodes}") + print(f"Average care set sizes(%): {average_care_set_size}") From 63d75471fb5a3c2674292a37091fa5c729c06f28 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Thu, 27 Oct 2022 15:40:45 +0100 Subject: [PATCH 29/64] [jsc] Added scripts to convert blif->verilog, and to test the verilog. 
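Behind the `--histograms`/`--freq-thresh` pair in the patch above is a simple idea: truth-table rows whose input patterns were rarely or never seen on the training set can be offered to ABC as don't-cares (the `-R` rarity flag of `&lnetopt`/`&ttopt`). A conceptual sketch, not the library's implementation:

```python
def care_set(histogram, freq_thresh):
    # Keep truth-table rows observed at least `freq_thresh` times; the
    # rest become don't-cares the optimizer is free to re-encode.
    return [i for i, count in enumerate(histogram) if count >= freq_thresh]

print(care_set([0, 12, 1, 7], freq_thresh=2))  # -> [1, 3]
```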
---
 examples/jet_substructure/README.md           |  29 ++++
 examples/jet_substructure/blif2verilog.py     | 141 ++++++++++++++++++
 examples/jet_substructure/simulate_verilog.py | 111 ++++++++++++++
 3 files changed, 281 insertions(+)
 create mode 100644 examples/jet_substructure/blif2verilog.py
 create mode 100644 examples/jet_substructure/simulate_verilog.py

diff --git a/examples/jet_substructure/README.md b/examples/jet_substructure/README.md
index d9a544d55..2b27d8806 100644
--- a/examples/jet_substructure/README.md
+++ b/examples/jet_substructure/README.md
@@ -72,3 +72,32 @@ our paper below:
 }
 ```
 
+## Testing BLIF Files on the JSC Dataset
+
+In this section, we show how to take technology-mapped BLIF files,
+generate technology-mapped verilog and simulate the verilog on the JSC dataset.
+
+### Convert BLIF Files into Verilog
+
+To convert the full BLIF files (as generated from the LogicNets examples, via `neq2lut_abc.py`) into verilog, run the following:
+
+```bash
+python blif2verilog.py --arch <arch> --input-blif <blif-dir>/layers_full_opt.blif --output-directory <output-dir>
+```
+
+To convert the layer-wise BLIF files into verilog, run the following:
+
+```bash
+python blif2verilog.py --arch <arch> --input-blifs <blif-dir>/*.blif --output-directory <output-dir> --generated-module-name-prefix layer0
+```
+
+Note that the generated module name prefix will likely have to change if the source files are handled in a different way.
+
+### Simulate Verilog
+
+The resultant verilog can be simulated as follows:
+
+```bash
+python simulate_verilog.py --arch <arch> --checkpoint <checkpoint> --input-verilog <output-dir>/logicnet.v
+```
+
diff --git a/examples/jet_substructure/blif2verilog.py b/examples/jet_substructure/blif2verilog.py
new file mode 100644
index 000000000..dc55f1afa
--- /dev/null
+++ b/examples/jet_substructure/blif2verilog.py
@@ -0,0 +1,141 @@
+# Copyright (C) 2022 Xilinx, Inc
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+# A script to convert technology-mapped BLIF files to technology-mapped verilog.
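The BLIF-to-verilog step the README above drives from the command line can also be reproduced directly with the helpers from `logicnets.abc`, roughly as follows (paths are placeholders):

```python
from logicnets.abc import putontop_blif, tech_map_to_verilog

# Stack per-layer BLIFs into one netlist, then emit technology-mapped verilog.
putontop_blif(["layer0_opt.blif", "layer1_opt.blif"], "layers_full_opt.blif",
              working_dir="abc_project")
tech_map_to_verilog(circuit_file="layers_full_opt.blif",
                    output_verilog="layers_full_opt.v",
                    working_dir="abc_project")
```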
+ +import os +import glob +import shutil +from argparse import ArgumentParser + +import torch +from torch.utils.data import DataLoader + +from logicnets.abc import tech_map_to_verilog,\ + putontop_blif,\ + pipeline_tech_mapped_circuit +from logicnets.verilog import fix_abc_module_name,\ + generate_abc_verilog_wrapper + +from train import configs, model_config, dataset_config, test +from models import JetSubstructureNeqModel +from dataset import JetSubstructureDataset + +other_options = { + "output_directory": None, + "input_blifs": None, + "num_registers": None, + "generated_module_name_prefix": None, +} + +if __name__ == "__main__": + parser = ArgumentParser(description="Convert a technology-mapped BLIF files into a technology-mapped verilog file, using ABC") + parser.add_argument('--arch', type=str, choices=configs.keys(), default="jsc-s", + help="Specific the neural network model to use (default: %(default)s)") + parser.add_argument('--input-bitwidth', type=int, default=None, + help="Bitwidth to use at the input (default: %(default)s)") + parser.add_argument('--hidden-bitwidth', type=int, default=None, + help="Bitwidth to use for activations in hidden layers (default: %(default)s)") + parser.add_argument('--output-bitwidth', type=int, default=None, + help="Bitwidth to use at the output (default: %(default)s)") + parser.add_argument('--input-fanin', type=int, default=None, + help="Fanin to use at the input (default: %(default)s)") + parser.add_argument('--hidden-fanin', type=int, default=None, + help="Fanin to use for the hidden layers (default: %(default)s)") + parser.add_argument('--output-fanin', type=int, default=None, + help="Fanin to use at the output (default: %(default)s)") + parser.add_argument('--hidden-layers', nargs='+', type=int, default=None, + help="A list of hidden layer neuron sizes (default: %(default)s)") + parser.add_argument('--dataset-file', type=str, default='data/processed-pythia82-lhc13-all-pt1-50k-r1_h022_e0175_t220_nonu_truth.z', + help="The file to use as the dataset input (default: %(default)s)") + parser.add_argument('--dataset-config', type=str, default='config/yaml_IP_OP_config.yml', + help="The file to use to configure the input dataset (default: %(default)s)") + parser.add_argument('--dataset-split', type=str, default='test', choices=['train', 'test'], + help="Dataset to use for evaluation (default: %(default)s)") + parser.add_argument('--input-blifs', nargs='+', type=str, required=True, + help="The input BLIF files") + parser.add_argument('--output-directory', type=str, default='./log', + help="The directory which the generated verilog gets stored. (default: %(default)s)") + parser.add_argument('--num-registers', type=int, default=0, + help="The number of registers to add to the generated verilog (default: %(default)s)") + parser.add_argument('--generated-module-name-prefix', type=str, default='\\aig', + help="A prefix which matches the module name in the generated verilog, but no other line of code (default: %(default)s)") + args = parser.parse_args() + defaults = configs[args.arch] + options = vars(args) + del options['arch'] + config = {} + for k in options.keys(): + config[k] = options[k] if options[k] is not None else defaults[k] # Override defaults, if specified. 
+ + if not os.path.exists(args.output_directory): + os.makedirs(args.output_directory) + + # Split up configuration options to be more understandable + model_cfg = {} + for k in model_config.keys(): + model_cfg[k] = config[k] + dataset_cfg = {} + for k in dataset_config.keys(): + dataset_cfg[k] = config[k] + options_cfg = {} + for k in other_options.keys(): + options_cfg[k] = config[k] + + # Fetch the test set + dataset = {} + dataset[args.dataset_split] = JetSubstructureDataset(dataset_cfg['dataset_file'], dataset_cfg['dataset_config'], split=args.dataset_split) + test_loader = DataLoader(dataset[args.dataset_split], batch_size=1, shuffle=False) + + # Instantiate the PyTorch model + x, y = dataset[args.dataset_split][0] + model_cfg['input_length'] = len(x) + model_cfg['output_length'] = len(y) + model = JetSubstructureNeqModel(model_cfg) + + abc_project_root = options_cfg['output_directory'] + veropt_dir = options_cfg['output_directory'] + input_blif = "layers_full_opt.blif" + verbose = False + + if len(options_cfg['input_blifs']) > 1: + nodes, out, err = putontop_blif([os.path.realpath(blif) for blif in options_cfg['input_blifs']], input_blif, working_dir=abc_project_root, verbose=verbose) + else: + shutil.copy(os.path.realpath(options_cfg['input_blifs'][0]), f"{abc_project_root}/{input_blif}") + + if options_cfg['num_registers'] == 0: + nodes, out, err = tech_map_to_verilog(circuit_file=input_blif, output_verilog=f"layers_full_opt.v", working_dir=abc_project_root, verbose=verbose) + else: + nodes, out, err = pipeline_tech_mapped_circuit(circuit_file=input_blif, output_verilog=f"layers_full_opt.v", num_registers=options_cfg['num_registers'], working_dir=abc_project_root, verbose=verbose) + + # Fix the resultant verilog file so that it can be simulated + fix_abc_module_name(f"{veropt_dir}/layers_full_opt.v", f"{veropt_dir}/layers_full_opt.v", options_cfg["generated_module_name_prefix"], "layers_full_opt", add_timescale=True) + + # Generate top-level entity wrapper + module_list = model.module_list + _, input_bitwidth = module_list[0].input_quant.get_scale_factor_bits() + _, output_bitwidth = module_list[-1].output_quant.get_scale_factor_bits() + input_bitwidth, output_bitwidth = int(input_bitwidth), int(output_bitwidth) + total_input_bits = module_list[0].in_features*input_bitwidth + total_output_bits = module_list[-1].out_features*output_bitwidth + module_name="logicnet" + veropt_wrapper_str = generate_abc_verilog_wrapper(module_name=module_name, input_name="M0", input_bits=total_input_bits, output_name=f"M{len(module_list)}", output_bits=total_output_bits, submodule_name="layers_full_opt", num_registers=options_cfg['num_registers']) + with open(f"{veropt_dir}/{module_name}.v", "w") as f: + f.write(veropt_wrapper_str) + + print(f"Adding Nitro-Parts-Lib to {veropt_dir}") + source_files = glob.glob(f"{os.environ['NITROPARTSLIB']}/*.v") + for f in source_files: + shutil.copy(f, f"{veropt_dir}") + diff --git a/examples/jet_substructure/simulate_verilog.py b/examples/jet_substructure/simulate_verilog.py new file mode 100644 index 000000000..15746b802 --- /dev/null +++ b/examples/jet_substructure/simulate_verilog.py @@ -0,0 +1,111 @@ +# Copyright (C) 2021 Xilinx, Inc +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import os
+from argparse import ArgumentParser
+
+import torch
+from torch.utils.data import DataLoader
+
+from train import configs, model_config, dataset_config, test
+from dataset import JetSubstructureDataset
+from models import JetSubstructureNeqModel
+
+other_options = {
+    "checkpoint": None,
+    "input_verilog": None,
+    "num_registers": None,
+}
+
+if __name__ == "__main__":
+    parser = ArgumentParser(description="Simulate a verilog file generated from a trained PyTorch model")
+    parser.add_argument('--arch', type=str, choices=configs.keys(), default="jsc-s",
+        help="Specify the neural network model to use (default: %(default)s)")
+    parser.add_argument('--batch-size', type=int, default=None, metavar='N',
+        help="Batch size for evaluation (default: %(default)s)")
+    parser.add_argument('--input-bitwidth', type=int, default=None,
+        help="Bitwidth to use at the input (default: %(default)s)")
+    parser.add_argument('--hidden-bitwidth', type=int, default=None,
+        help="Bitwidth to use for activations in hidden layers (default: %(default)s)")
+    parser.add_argument('--output-bitwidth', type=int, default=None,
+        help="Bitwidth to use at the output (default: %(default)s)")
+    parser.add_argument('--input-fanin', type=int, default=None,
+        help="Fanin to use at the input (default: %(default)s)")
+    parser.add_argument('--hidden-fanin', type=int, default=None,
+        help="Fanin to use for the hidden layers (default: %(default)s)")
+    parser.add_argument('--output-fanin', type=int, default=None,
+        help="Fanin to use at the output (default: %(default)s)")
+    parser.add_argument('--hidden-layers', nargs='+', type=int, default=None,
+        help="A list of hidden layer neuron sizes (default: %(default)s)")
+    parser.add_argument('--dataset-file', type=str, default='data/processed-pythia82-lhc13-all-pt1-50k-r1_h022_e0175_t220_nonu_truth.z',
+        help="The file to use as the dataset input (default: %(default)s)")
+    parser.add_argument('--dataset-config', type=str, default='config/yaml_IP_OP_config.yml',
+        help="The file to use to configure the input dataset (default: %(default)s)")
+    parser.add_argument('--dataset-split', type=str, default='test', choices=['train', 'test'],
+        help="Dataset to use for evaluation (default: %(default)s)")
+    parser.add_argument('--checkpoint', type=str, required=True,
+        help="The checkpoint file which contains the model weights")
+    parser.add_argument('--input-verilog', type=str, required=True,
+        help="The input verilog file to simulate")
+    parser.add_argument('--num-registers', type=int, default=0,
+        help="The number of pipeline registers in the verilog (default: %(default)s)")
+    args = parser.parse_args()
+    defaults = configs[args.arch]
+    options = vars(args)
+    del options['arch']
+    config = {}
+    for k in options.keys():
+        config[k] = options[k] if options[k] is not None else defaults[k] # Override defaults, if specified.
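The simulation path invoked below (`model.verilog_inference`) drives the generated netlist through PyVerilator, clocking it enough times to flush any pipeline registers before reading the output bus. A minimal sketch of one such evaluation (the bus names `M0`/`M5` and the latency value are illustrative assumptions based on how the verilog wrapper is generated):

```python
# Sketch: drive a generated LogicNets netlist with PyVerilator.
# Bus names (M0 in, M5 out) and the latency are illustrative assumptions.
from pyverilator import PyVerilator

dut = PyVerilator.build("logicnet.v", verilog_path=["."])
latency = 5  # e.g. one register per layer when the design is pipelined
dut.io.rst = 0
dut.io.clk = 0
dut["M0"] = 0b0110  # packed, quantized input vector
for _ in range(latency + 1):  # flush the pipeline registers
    dut.io.clk = 1
    dut.io.clk = 0
result = dut["M5"]  # integer value of the packed output bus
```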
+ + # Split up configuration options to be more understandable + model_cfg = {} + for k in model_config.keys(): + model_cfg[k] = config[k] + dataset_cfg = {} + for k in dataset_config.keys(): + dataset_cfg[k] = config[k] + options_cfg = {} + for k in other_options.keys(): + if k == 'cuda': + continue + options_cfg[k] = config[k] + + # Fetch the test set + dataset = {} + dataset[args.dataset_split] = JetSubstructureDataset(dataset_cfg['dataset_file'], dataset_cfg['dataset_config'], split=args.dataset_split) + test_loader = DataLoader(dataset[args.dataset_split], batch_size=config['batch_size'], shuffle=False) + + # Instantiate the PyTorch model + x, y = dataset[args.dataset_split][0] + model_cfg['input_length'] = len(x) + model_cfg['output_length'] = len(y) + model = JetSubstructureNeqModel(model_cfg) + + # Load the model weights + checkpoint = torch.load(options_cfg['checkpoint'], map_location='cpu') + model.load_state_dict(checkpoint['model_dict']) + + # Test the PyTorch model + print("Running inference on baseline model...") + model.eval() + baseline_accuracy = test(model, test_loader, cuda=False) + print("Baseline accuracy: %f" % (baseline_accuracy)) + + verilog_dir = os.path.dirname(options_cfg["input_verilog"]) + filename = os.path.split(options_cfg["input_verilog"])[-1] + print(f"Running inference simulation of Verilog-based model ({filename})") + model.verilog_inference(verilog_dir, filename, logfile=None, add_registers=options_cfg["num_registers"] == 0, verify=False) + verilog_accuracy = test(model, test_loader, cuda=False) + print("Verilog-Based Model accuracy: %f" % (verilog_accuracy)) + From 98f8342f8449adb538a7279d14b3e99f1f9a2454 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Thu, 27 Oct 2022 17:48:26 +0100 Subject: [PATCH 30/64] [abc] Added option to specify the mfs2 command and mapping command. --- src/logicnets/abc.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/src/logicnets/abc.py b/src/logicnets/abc.py index b5c07c4cc..14d74c48b 100644 --- a/src/logicnets/abc.py +++ b/src/logicnets/abc.py @@ -116,8 +116,8 @@ def optimize_bdd_network(circuit_file, output_file, input_bitwidth, output_bitwi print(err) return nodes, tt_pct, time_s, out, err # TODO: return the number of nodes, tt%, time -def optimize_mfs2(circuit_file, output_file, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): - cmd = [f"{abc_path}/abc", '-c', f"read {circuit_file}; if -K 6 -a; mfs2; write_blif {output_file}; print_stats"] +def optimize_mfs2(circuit_file, output_file, abc_path=os.environ["ABC_ROOT"], command="mfs2", mapping="if -K 6 -a;", working_dir=None, verbose=False): + cmd = [f"{abc_path}/abc", '-c', f"read {circuit_file}; {mapping} {command}; write_blif {output_file}; print_stats"] if verbose: print(" ".join(cmd)) proc = subprocess.Popen(cmd, cwd=working_dir, stdout=subprocess.PIPE, env=os.environ) From b63c3f6f0df2fb6f24dc559d9e485a00d4bc2127 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Wed, 4 Jan 2023 11:40:53 +0000 Subject: [PATCH 31/64] [mnist] Initial train scripts and model definitions. 
--- examples/mnist/models.py | 141 +++++++++++++++++ examples/mnist/neq2lut.py | 182 ++++++++++++++++++++++ examples/mnist/train.py | 314 ++++++++++++++++++++++++++++++++++++++ 3 files changed, 637 insertions(+) create mode 100644 examples/mnist/models.py create mode 100644 examples/mnist/neq2lut.py create mode 100644 examples/mnist/train.py diff --git a/examples/mnist/models.py b/examples/mnist/models.py new file mode 100644 index 000000000..a67a9128d --- /dev/null +++ b/examples/mnist/models.py @@ -0,0 +1,141 @@ +# Copyright (C) 2021 Xilinx, Inc +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from functools import reduce +from os.path import realpath + +import torch +import torch.nn as nn +from torch.nn.parameter import Parameter +from torch.nn import init + +from brevitas.core.quant import QuantType +from brevitas.core.scaling import ScalingImplType +from brevitas.nn import QuantHardTanh, QuantReLU + +from pyverilator import PyVerilator + +from logicnets.quant import QuantBrevitasActivation +from logicnets.nn import SparseLinearNeq, ScalarBiasScale, RandomFixedSparsityMask2D, DenseMask2D +from logicnets.init import random_restrict_fanin + +class MnistNeqModel(nn.Module): + def __init__(self, model_config): + super(MnistNeqModel, self).__init__() + self.model_config = model_config + self.num_neurons = [model_config["input_length"]] + model_config["hidden_layers"] + [model_config["output_length"]] + layer_list = [] + for i in range(1, len(self.num_neurons)): + in_features = self.num_neurons[i-1] + out_features = self.num_neurons[i] + bn = nn.BatchNorm1d(out_features) + if i == 1: + do_in = nn.Dropout(p=0.3) + bn_in = nn.BatchNorm1d(in_features) + input_bias = ScalarBiasScale(scale=False, bias_init=-0.25) + input_quant = QuantBrevitasActivation(QuantHardTanh(model_config["input_bitwidth"], max_val=1., narrow_range=False, quant_type=QuantType.INT, scaling_impl_type=ScalingImplType.PARAMETER), pre_transforms=[do_in, bn_in, input_bias]) + output_quant = QuantBrevitasActivation(QuantReLU(bit_width=model_config["hidden_bitwidth"], max_val=1.61, quant_type=QuantType.INT, scaling_impl_type=ScalingImplType.PARAMETER), pre_transforms=[bn]) + mask = RandomFixedSparsityMask2D(in_features, out_features, fan_in=model_config["input_fanin"]) + layer = SparseLinearNeq(in_features, out_features, input_quant=input_quant, output_quant=output_quant, sparse_linear_kws={'mask': mask}) + layer_list.append(layer) + elif i == len(self.num_neurons)-1: + output_bias_scale = ScalarBiasScale(bias_init=0.33) + output_quant = QuantBrevitasActivation(QuantHardTanh(bit_width=model_config["output_bitwidth"], max_val=1.33, narrow_range=False, quant_type=QuantType.INT, scaling_impl_type=ScalingImplType.PARAMETER), pre_transforms=[bn], post_transforms=[output_bias_scale]) + mask = RandomFixedSparsityMask2D(in_features, out_features, fan_in=model_config["output_fanin"]) + layer = SparseLinearNeq(in_features, out_features, input_quant=layer_list[-1].output_quant, output_quant=output_quant, sparse_linear_kws={'mask': mask}, 
apply_input_quant=False)
+                layer_list.append(layer)
+            else:
+                output_quant = QuantBrevitasActivation(QuantReLU(bit_width=model_config["hidden_bitwidth"], max_val=1.61, quant_type=QuantType.INT, scaling_impl_type=ScalingImplType.PARAMETER), pre_transforms=[bn])
+                mask = RandomFixedSparsityMask2D(in_features, out_features, fan_in=model_config["hidden_fanin"])
+                layer = SparseLinearNeq(in_features, out_features, input_quant=layer_list[-1].output_quant, output_quant=output_quant, sparse_linear_kws={'mask': mask}, apply_input_quant=False)
+                layer_list.append(layer)
+        self.module_list = nn.ModuleList(layer_list)
+        self.is_verilog_inference = False
+        self.latency = 1
+        self.verilog_dir = None
+        self.top_module_filename = None
+        self.dut = None
+        self.logfile = None
+
+    def verilog_inference(self, verilog_dir, top_module_filename, logfile: str = None, add_registers: bool = False):
+        self.verilog_dir = realpath(verilog_dir)
+        self.top_module_filename = top_module_filename
+        self.dut = PyVerilator.build(f"{self.verilog_dir}/{self.top_module_filename}", verilog_path=[self.verilog_dir], build_dir=f"{self.verilog_dir}/verilator")
+        self.is_verilog_inference = True
+        self.logfile = logfile
+        if add_registers:
+            self.latency = len(self.num_neurons)
+
+    def pytorch_inference(self):
+        self.is_verilog_inference = False
+
+    def verilog_forward(self, x):
+        # Get integer output from the first layer
+        input_quant = self.module_list[0].input_quant
+        output_quant = self.module_list[-1].output_quant
+        _, input_bitwidth = self.module_list[0].input_quant.get_scale_factor_bits()
+        _, output_bitwidth = self.module_list[-1].output_quant.get_scale_factor_bits()
+        input_bitwidth, output_bitwidth = int(input_bitwidth), int(output_bitwidth)
+        total_input_bits = self.module_list[0].in_features*input_bitwidth
+        total_output_bits = self.module_list[-1].out_features*output_bitwidth
+        num_layers = len(self.module_list)
+        input_quant.bin_output()
+        self.module_list[0].apply_input_quant = False
+        y = torch.zeros(x.shape[0], self.module_list[-1].out_features)
+        x = input_quant(x)
+        self.dut.io.rst = 0
+        self.dut.io.clk = 0
+        for i in range(x.shape[0]):
+            x_i = x[i,:]
+            y_i = self.pytorch_forward(x[i:i+1,:])[0]
+            xv_i = list(map(lambda z: input_quant.get_bin_str(z), x_i))
+            ys_i = list(map(lambda z: output_quant.get_bin_str(z), y_i))
+            xvc_i = reduce(lambda a,b: a+b, xv_i[::-1])
+            ysc_i = reduce(lambda a,b: a+b, ys_i[::-1])
+            self.dut["M0"] = int(xvc_i, 2)
+            for j in range(self.latency + 1):
+                res = self.dut[f"M{num_layers}"]
+                self.dut.io.clk = 1
+                self.dut.io.clk = 0
+            expected = f"{int(ysc_i,2):0{int(total_output_bits)}b}"
+            result = f"{res:0{int(total_output_bits)}b}"
+            assert(expected == result)
+            res_split = [result[i:i+output_bitwidth] for i in range(0, len(result), output_bitwidth)][::-1]
+            yv_i = torch.Tensor(list(map(lambda z: int(z, 2), res_split)))
+            y[i,:] = yv_i
+            # Dump the I/O pairs
+            if self.logfile is not None:
+                with open(self.logfile, "a") as f:
+                    f.write(f"{int(xvc_i,2):0{int(total_input_bits)}b}{int(ysc_i,2):0{int(total_output_bits)}b}\n")
+        return y
+
+    def pytorch_forward(self, x):
+        for l in self.module_list:
+            x = l(x)
+        return x
+
+    def forward(self, x):
+        if self.is_verilog_inference:
+            return self.verilog_forward(x)
+        else:
+            return self.pytorch_forward(x)
+
+class MnistLutModel(MnistNeqModel):
+    pass
+
+class MnistVerilogModel(MnistNeqModel):
+    pass
+

diff --git a/examples/mnist/neq2lut.py b/examples/mnist/neq2lut.py
new file mode 100644
index 000000000..53c36624d
--- /dev/null
+++ b/examples/mnist/neq2lut.py
@@ -0,0 +1,182 @@
+# Copyright (C) 2021 Xilinx, Inc
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import os
+from argparse import ArgumentParser
+from functools import partial
+
+import torch
+from torch.utils.data import DataLoader
+from torchvision.datasets import MNIST
+from torchvision import transforms
+
+from logicnets.nn import generate_truth_tables, \
+                         lut_inference, \
+                         module_list_to_verilog_module
+from logicnets.synthesis import synthesize_and_get_resource_counts
+from logicnets.util import proc_postsynth_file
+
+from models import MnistNeqModel, MnistLutModel, MnistVerilogModel
+from train import configs, model_config, dataset_config, test
+
+other_options = {
+    "cuda": None,
+    "log_dir": None,
+    "checkpoint": None,
+    "generate_bench": False,
+    "add_registers": False,
+    "simulate_pre_synthesis_verilog": False,
+    "simulate_post_synthesis_verilog": False,
+}
+
+if __name__ == "__main__":
+    parser = ArgumentParser(description="Convert a trained PyTorch model into verilog and synthesize it")
+    parser.add_argument('--arch', type=str, choices=configs.keys(), default="jsc-s",
+        help="Specify the neural network model to use (default: %(default)s)")
+    parser.add_argument('--batch-size', type=int, default=None, metavar='N',
+        help="Batch size for evaluation (default: %(default)s)")
+    parser.add_argument('--input-bitwidth', type=int, default=None,
+        help="Bitwidth to use at the input (default: %(default)s)")
+    parser.add_argument('--hidden-bitwidth', type=int, default=None,
+        help="Bitwidth to use for activations in hidden layers (default: %(default)s)")
+    parser.add_argument('--output-bitwidth', type=int, default=None,
+        help="Bitwidth to use at the output (default: %(default)s)")
+    parser.add_argument('--input-fanin', type=int, default=None,
+        help="Fanin to use at the input (default: %(default)s)")
+    parser.add_argument('--hidden-fanin', type=int, default=None,
+        help="Fanin to use for the hidden layers (default: %(default)s)")
+    parser.add_argument('--output-fanin', type=int, default=None,
+        help="Fanin to use at the output (default: %(default)s)")
+    parser.add_argument('--hidden-layers', nargs='+', type=int, default=None,
+        help="A list of hidden layer neuron sizes (default: %(default)s)")
+    parser.add_argument('--dataset-file', type=str, default='data/processed-pythia82-lhc13-all-pt1-50k-r1_h022_e0175_t220_nonu_truth.z',
+        help="The file to use as the dataset input (default: %(default)s)")
+    parser.add_argument('--clock-period', type=float, default=1.0,
+        help="Target clock frequency to use during Vivado synthesis (default: %(default)s)")
+    parser.add_argument('--dataset-config', type=str, default='config/yaml_IP_OP_config.yml',
+        help="The file to use to configure the input dataset (default: %(default)s)")
+    parser.add_argument('--dataset-split', type=str, default='test', choices=['train', 'test'],
+        help="Dataset to use for evaluation (default: %(default)s)")
+    parser.add_argument('--log-dir', type=str, default='./log',
+        help="A location to store the log output of the training run and the output model (default: %(default)s)")
+    parser.add_argument('--checkpoint', type=str, required=True,
+        help="The checkpoint file which contains the model weights")
+    parser.add_argument('--generate-bench', action='store_true', default=False,
+        help="Generate the truth table in BENCH format as well as verilog (default: %(default)s)")
+    parser.add_argument('--dump-io', action='store_true', default=False,
+        help="Dump I/O to the verilog LUT to a text file in the log directory (default: %(default)s)")
+    parser.add_argument('--add-registers', action='store_true', default=False,
+        help="Add registers between each layer in generated verilog (default: %(default)s)")
+    parser.add_argument('--simulate-pre-synthesis-verilog', action='store_true', default=False,
+        help="Simulate the verilog generated by LogicNets (default: %(default)s)")
+    parser.add_argument('--simulate-post-synthesis-verilog', action='store_true', default=False,
+        help="Simulate the post-synthesis verilog produced by vivado (default: %(default)s)")
+    args = parser.parse_args()
+    defaults = configs[args.arch]
+    options = vars(args)
+    del options['arch']
+    config = {}
+    for k in options.keys():
+        config[k] = options[k] if options[k] is not None else defaults[k] # Override defaults, if specified.
+
+    if not os.path.exists(config['log_dir']):
+        os.makedirs(config['log_dir'])
+
+    # Split up configuration options to be more understandable
+    model_cfg = {}
+    for k in model_config.keys():
+        model_cfg[k] = config[k]
+    dataset_cfg = {}
+    for k in dataset_config.keys():
+        dataset_cfg[k] = config[k]
+    options_cfg = {}
+    for k in other_options.keys():
+        if k == 'cuda':
+            continue
+        options_cfg[k] = config[k]
+
+    trans = transforms.Compose([
+        transforms.ToTensor(),
+        transforms.Normalize((0.1307,), (0.3081,)),
+        transforms.Lambda(partial(torch.reshape, shape=(-1,)))
+        ])
+
+    # Fetch the test set
+    dataset = {}
+    dataset[args.dataset_split] = MNIST('./data', train=args.dataset_split == "train", download=True, transform=trans)
+    test_loader = DataLoader(dataset[args.dataset_split], batch_size=config['batch_size'], shuffle=False)
+
+    # Instantiate the PyTorch model
+    x, y = dataset[args.dataset_split][0]
+    model_cfg['input_length'] = len(x)
+    model_cfg['output_length'] = 10
+    model = MnistNeqModel(model_cfg)
+
+    # Load the model weights
+    checkpoint = torch.load(options_cfg['checkpoint'], map_location='cpu')
+    model.load_state_dict(checkpoint['model_dict'])
+
+    # Test the PyTorch model
+    print("Running inference on baseline model...")
+    model.eval()
+    baseline_accuracy = test(model, test_loader, cuda=False)
+    print("Baseline accuracy: %f" % (baseline_accuracy))
+
+    # Instantiate LUT-based model
+    lut_model = MnistLutModel(model_cfg)
+    lut_model.load_state_dict(checkpoint['model_dict'])
+
+    # Generate the truth tables in the LUT module
+    print("Converting NEQs to LUTs...")
+    generate_truth_tables(lut_model, verbose=True)
+
+    # Test the LUT-based model
+    print("Running inference on LUT-based model...")
+    lut_inference(lut_model)
+    lut_model.eval()
+    lut_accuracy = test(lut_model, test_loader, cuda=False)
+    print("LUT-Based Model accuracy: %f" % (lut_accuracy))
+    modelSave = {'model_dict': lut_model.state_dict(),
+                 'test_accuracy': lut_accuracy}
+
+    torch.save(modelSave, options_cfg["log_dir"] + "/lut_based_model.pth")
+
+    print("Generating verilog in %s..." % (options_cfg["log_dir"]))
+    module_list_to_verilog_module(lut_model.module_list, "logicnet", options_cfg["log_dir"], generate_bench=options_cfg["generate_bench"], add_registers=options_cfg["add_registers"])
+    print("Top level entity stored at: %s/logicnet.v ..." % (options_cfg["log_dir"]))
+
+    if args.dump_io:
+        io_filename = options_cfg["log_dir"] + f"/io_{args.dataset_split}.txt"
+        with open(io_filename, 'w') as f:
+            pass # Create an empty file.
+        print(f"Dumping verilog I/O to {io_filename}...")
+    else:
+        io_filename = None
+
+    if args.simulate_pre_synthesis_verilog:
+        print("Running inference simulation of Verilog-based model...")
+        lut_model.verilog_inference(options_cfg["log_dir"], "logicnet.v", logfile=io_filename, add_registers=options_cfg["add_registers"])
+        verilog_accuracy = test(lut_model, test_loader, cuda=False)
+        print("Verilog-Based Model accuracy: %f" % (verilog_accuracy))
+
+    print("Running out-of-context synthesis")
+    ret = synthesize_and_get_resource_counts(options_cfg["log_dir"], "logicnet", fpga_part="xcu280-fsvh2892-2L-e", clk_period_ns=args.clock_period, post_synthesis=1)
+
+    if args.simulate_post_synthesis_verilog:
+        print("Running post-synthesis inference simulation of Verilog-based model...")
+        proc_postsynth_file(options_cfg["log_dir"])
+        lut_model.verilog_inference(options_cfg["log_dir"]+"/post_synth", "logicnet_post_synth.v", io_filename, add_registers=options_cfg["add_registers"])
+        post_synth_accuracy = test(lut_model, test_loader, cuda=False)
+        print("Post-synthesis Verilog-Based Model accuracy: %f" % (post_synth_accuracy))
+

diff --git a/examples/mnist/train.py b/examples/mnist/train.py
new file mode 100644
index 000000000..4ed574cd2
--- /dev/null
+++ b/examples/mnist/train.py
@@ -0,0 +1,314 @@
+# Copyright (C) 2021 Xilinx, Inc
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+import os
+from argparse import ArgumentParser
+from functools import reduce, partial
+import random
+
+import numpy as np
+
+import torch
+import torch.nn as nn
+import torch.optim as optim
+from torch.utils.data import DataLoader
+from torch.utils.tensorboard import SummaryWriter
+from torchvision import transforms
+from torchvision.datasets import MNIST
+
+from models import MnistNeqModel
+
+# TODO: Replace default configs with YAML files.
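The TODO above suggests replacing these hard-coded dictionaries with YAML files. One possible shape for that change (hypothetical file name and schema, not part of this patch series):

```python
# Hypothetical YAML-backed replacement for the hard-coded configs dict below.
# Assumes a file like configs/mnist.yaml with one mapping per arch name.
import yaml

def load_arch_config(path: str, arch: str) -> dict:
    with open(path) as f:
        all_configs = yaml.safe_load(f)  # {"mnist-s": {...}, "mnist-m": {...}, ...}
    return all_configs[arch]

# model_cfg = load_arch_config("configs/mnist.yaml", "mnist-s")
```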
+configs = { + "mnist-s": { + "hidden_layers": [512, 256, 128, 100], + "input_bitwidth": 1, + "hidden_bitwidth": 1, + "output_bitwidth": 4, + "input_fanin": 6, + "hidden_fanin": 6, + "output_fanin": 6, + "weight_decay": 1e-3, + "batch_size": 1024, + "epochs": 1000, + "learning_rate": 1e-3, + "seed": 0, + "checkpoint": None, + }, + "mnist-m": { + "hidden_layers": [512, 256, 128, 100], + "input_bitwidth": 2, + "hidden_bitwidth": 2, + "output_bitwidth": 4, + "input_fanin": 4, + "hidden_fanin": 4, + "output_fanin": 4, + "weight_decay": 1e-3, + "batch_size": 1024, + "epochs": 1000, + "learning_rate": 1e-3, + "seed": 0, + "checkpoint": None, + }, + "mnist-l": { + "hidden_layers": [512, 256, 128, 100], + "input_bitwidth": 3, + "hidden_bitwidth": 3, + "output_bitwidth": 4, + "input_fanin": 4, + "hidden_fanin": 4, + "output_fanin": 4, + "weight_decay": 1e-3, + "batch_size": 1024, + "epochs": 1000, + "learning_rate": 1e-3, + "seed": 0, + "checkpoint": None, + }, +} + +# A dictionary, so we can set some defaults if necessary +model_config = { + "hidden_layers": None, + "input_bitwidth": None, + "hidden_bitwidth": None, + "output_bitwidth": None, + "input_fanin": None, + "hidden_fanin": None, + "output_fanin": None, +} + +training_config = { + "weight_decay": None, + "batch_size": None, + "epochs": None, + "learning_rate": None, + "seed": None, +} + +dataset_config = { + "dataset_file": None, + "dataset_config": None, +} + +other_options = { + "cuda": None, + "log_dir": None, + "checkpoint": None, +} + +def train(model, datasets, train_cfg, options): + # Create data loaders for training and inference: + train_loader = DataLoader(datasets["train"], batch_size=train_cfg['batch_size'], shuffle=True) + val_loader = DataLoader(datasets["valid"], batch_size=train_cfg['batch_size'], shuffle=False) + test_loader = DataLoader(datasets["test"], batch_size=train_cfg['batch_size'], shuffle=False) + + # Configure optimizer + weight_decay = train_cfg["weight_decay"] + decay_exclusions = ["bn", "bias", "learned_value"] # Make a list of parameters name fragments which will ignore weight decay TODO: make this list part of the train_cfg + decay_params = [] + no_decay_params = [] + for pname, params in model.named_parameters(): + if params.requires_grad: + if reduce(lambda a,b: a or b, map(lambda x: x in pname, decay_exclusions)): # check if the current label should be excluded from weight decay + #print("Disabling weight decay for %s" % (pname)) + no_decay_params.append(params) + else: + #print("Enabling weight decay for %s" % (pname)) + decay_params.append(params) + #else: + #print("Ignoring %s" % (pname)) + params = [{'params': decay_params, 'weight_decay': weight_decay}, + {'params': no_decay_params, 'weight_decay': 0.0}] + optimizer = optim.AdamW(params, lr=train_cfg['learning_rate'], betas=(0.5, 0.999), weight_decay=weight_decay) + + # Configure scheduler + steps = len(train_loader) + scheduler = optim.lr_scheduler.CosineAnnealingWarmRestarts(optimizer, T_0=steps*100, T_mult=1) + + # Configure criterion + criterion = nn.CrossEntropyLoss() + + # Push the model to the GPU, if necessary + if options["cuda"]: + model.cuda() + + # Setup tensorboard + writer = SummaryWriter(options["log_dir"]) + + # Main training loop + maxAcc = 0.0 + num_epochs = train_cfg["epochs"] + for epoch in range(0, num_epochs): + # Train for this epoch + model.train() + accLoss = 0.0 + correct = 0 + for batch_idx, (data, target) in enumerate(train_loader): + if options["cuda"]: + data, target = data.cuda(), target.cuda() + optimizer.zero_grad() 
+ output = model(data) + loss = criterion(output, target) + pred = output.detach().max(1, keepdim=True)[1] + target_label = target.detach().unsqueeze(1) + curCorrect = pred.eq(target_label).long().sum() + curAcc = 100.0*curCorrect / len(data) + correct += curCorrect + accLoss += loss.detach()*len(data) + loss.backward() + optimizer.step() + scheduler.step() + + # Log stats to tensorboard + #writer.add_scalar('train_loss', loss.detach().cpu().numpy(), epoch*steps + batch_idx) + #writer.add_scalar('train_accuracy', curAcc.detach().cpu().numpy(), epoch*steps + batch_idx) + #g = optimizer.param_groups[0] + #writer.add_scalar('LR', g['lr'], epoch*steps + batch_idx) + + accLoss /= len(train_loader.dataset) + accuracy = 100.0*correct / len(train_loader.dataset) + print(f"Epoch: {epoch}/{num_epochs}\tTrain Acc (%): {accuracy.detach().cpu().numpy():.2f}\tTrain Loss: {accLoss.detach().cpu().numpy():.3e}") + #for g in optimizer.param_groups: + # print("LR: {:.6f} ".format(g['lr'])) + # print("LR: {:.6f} ".format(g['weight_decay'])) + writer.add_scalar('avg_train_loss', accLoss.detach().cpu().numpy(), (epoch+1)*steps) + writer.add_scalar('avg_train_accuracy', accuracy.detach().cpu().numpy(), (epoch+1)*steps) + val_accuracy = test(model, val_loader, options["cuda"]) + test_accuracy = test(model, test_loader, options["cuda"]) + modelSave = { 'model_dict': model.state_dict(), + 'optim_dict': optimizer.state_dict(), + 'val_accuracy': val_accuracy, + 'test_accuracy': test_accuracy, + 'epoch': epoch} + torch.save(modelSave, options["log_dir"] + "/checkpoint.pth") + if(maxAcc Date: Wed, 4 Jan 2023 17:13:20 +0000 Subject: [PATCH 32/64] [mnist/requirements] Added a requirements file for MNIST. --- examples/mnist/requirements.txt | 17 +++++++++++++++++ 1 file changed, 17 insertions(+) create mode 100644 examples/mnist/requirements.txt diff --git a/examples/mnist/requirements.txt b/examples/mnist/requirements.txt new file mode 100644 index 000000000..ac3ab55bf --- /dev/null +++ b/examples/mnist/requirements.txt @@ -0,0 +1,17 @@ +# Copyright (C) 2021 Xilinx, Inc +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +numpy +tensorboard +torchvision From f31c773c2a771395b6db3c1ed7dce18f0bf7f080 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Wed, 4 Jan 2023 17:14:02 +0000 Subject: [PATCH 33/64] [mnist/readme] Added basic README template for MNIST. --- examples/mnist/README.md | 68 ++++++++++++++++++++++++++++++++++++++++ 1 file changed, 68 insertions(+) create mode 100644 examples/mnist/README.md diff --git a/examples/mnist/README.md b/examples/mnist/README.md new file mode 100644 index 000000000..c157551fd --- /dev/null +++ b/examples/mnist/README.md @@ -0,0 +1,68 @@ +# LogicNets for MNIST Classification + +This example shows the accuracy that is attainable using the LogicNets methodology on the MNIST hand-written character classification task. + +## Prerequisites + +* LogicNets +* numpy +* torchvision + +## Installation + +If you're using the docker image, all the above prerequisites will be already installed. 
+Otherwise, you can install the above dependencies with pip and/or conda.
+
+## Download the Dataset
+
+The MNIST dataset will download automatically when the training script is first run.
+You only need to make sure the necessary directory has been created:
+
+```bash
+mkdir -p data
+```
+
+## Usage
+
+To train the "MNIST-S", "MNIST-M" and "MNIST-L" networks,
+run the following:
+
+```bash
+python train.py --arch <arch> --log-dir ./<log_dir>/
+```
+
+To then generate verilog from this trained model, run the following:
+
+```bash
+python neq2lut.py --arch <arch> --checkpoint ./<log_dir>/best_accuracy.pth --log-dir ./<log_dir>/verilog/ --add-registers
+```
+
+## Results
+
+Your results may vary slightly, depending on your system configuration.
+The following results are attained when training on a CPU and synthesising with Vivado 2019.2:
+
+| Network Architecture  | Test Accuracy (%) | LUTs  | Flip Flops    | Fmax (MHz)    | Latency (Cycles)  |
+| --------------------- | ----------------- | ----- | ------------- | ------------- | ----------------- |
+| MNIST-S               |                   |       |               |               |                   |
+| MNIST-M               |                   |       |               |               |                   |
+| MNIST-L               |                   |       |               |               |                   |
+
+## Citation
+
+If you find this work useful for your research, please consider citing
+our paper below:
+
+```bibtex
+@inproceedings{umuroglu2020logicnets,
+  author = {Umuroglu, Yaman and Akhauri, Yash and Fraser, Nicholas J and Blott, Michaela},
+  booktitle = {Proceedings of the International Conference on Field-Programmable Logic and Applications},
+  title = {LogicNets: Co-Designed Neural Networks and Circuits for Extreme-Throughput Applications},
+  year = {2020},
+  pages = {291-297},
+  publisher = {IEEE Computer Society},
+  address = {Los Alamitos, CA, USA},
+  month = {sep}
+}
+```
+

From abf5fbb66501e8713251064cc2ee8a0512867b01 Mon Sep 17 00:00:00 2001
From: Nick Fraser
Date: Wed, 4 Jan 2023 17:36:00 +0000
Subject: [PATCH 34/64] [mnist] Removed references to the dataset config.
--- examples/mnist/neq2lut.py | 9 +-------- examples/mnist/train.py | 12 ------------ 2 files changed, 1 insertion(+), 20 deletions(-) diff --git a/examples/mnist/neq2lut.py b/examples/mnist/neq2lut.py index 53c36624d..4f09e4695 100644 --- a/examples/mnist/neq2lut.py +++ b/examples/mnist/neq2lut.py @@ -28,7 +28,7 @@ from logicnets.util import proc_postsynth_file from models import MnistNeqModel, MnistLutModel, MnistVerilogModel -from train import configs, model_config, dataset_config, test +from train import configs, model_config, test other_options = { "cuda": None, @@ -60,12 +60,8 @@ help="Fanin to use at the output (default: %(default)s)") parser.add_argument('--hidden-layers', nargs='+', type=int, default=None, help="A list of hidden layer neuron sizes (default: %(default)s)") - parser.add_argument('--dataset-file', type=str, default='data/processed-pythia82-lhc13-all-pt1-50k-r1_h022_e0175_t220_nonu_truth.z', - help="The file to use as the dataset input (default: %(default)s)") parser.add_argument('--clock-period', type=float, default=1.0, help="Target clock frequency to use during Vivado synthesis (default: %(default)s)") - parser.add_argument('--dataset-config', type=str, default='config/yaml_IP_OP_config.yml', - help="The file to use to configure the input dataset (default: %(default)s)") parser.add_argument('--dataset-split', type=str, default='test', choices=['train', 'test'], help="Dataset to use for evaluation (default: %(default)s)") parser.add_argument('--log-dir', type=str, default='./log', @@ -97,9 +93,6 @@ model_cfg = {} for k in model_config.keys(): model_cfg[k] = config[k] - dataset_cfg = {} - for k in dataset_config.keys(): - dataset_cfg[k] = config[k] options_cfg = {} for k in other_options.keys(): if k == 'cuda': diff --git a/examples/mnist/train.py b/examples/mnist/train.py index 4ed574cd2..fb7cf10c0 100644 --- a/examples/mnist/train.py +++ b/examples/mnist/train.py @@ -97,11 +97,6 @@ "seed": None, } -dataset_config = { - "dataset_file": None, - "dataset_config": None, -} - other_options = { "cuda": None, "log_dir": None, @@ -248,10 +243,6 @@ def test(model, dataset_loader, cuda): help="A list of hidden layer neuron sizes (default: %(default)s)") parser.add_argument('--log-dir', type=str, default='./log', help="A location to store the log output of the training run and the output model (default: %(default)s)") - parser.add_argument('--dataset-file', type=str, default='data/processed-pythia82-lhc13-all-pt1-50k-r1_h022_e0175_t220_nonu_truth.z', - help="The file to use as the dataset input (default: %(default)s)") - parser.add_argument('--dataset-config', type=str, default='config/yaml_IP_OP_config.yml', - help="The file to use to configure the input dataset (default: %(default)s)") parser.add_argument('--checkpoint', type=str, default=None, help="Retrain the model from a previous checkpoint (default: %(default)s)") args = parser.parse_args() @@ -272,9 +263,6 @@ def test(model, dataset_loader, cuda): train_cfg = {} for k in training_config.keys(): train_cfg[k] = config[k] - dataset_cfg = {} - for k in dataset_config.keys(): - dataset_cfg[k] = config[k] options_cfg = {} for k in other_options.keys(): options_cfg[k] = config[k] From ade941870052193a3690350081382cac9a843ed4 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Wed, 4 Jan 2023 17:36:47 +0000 Subject: [PATCH 35/64] [mnist] Bugfix in default values for arch. 
---
 examples/mnist/neq2lut.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/examples/mnist/neq2lut.py b/examples/mnist/neq2lut.py
index 4f09e4695..ec887fb7e 100644
--- a/examples/mnist/neq2lut.py
+++ b/examples/mnist/neq2lut.py
@@ -42,7 +42,7 @@ if __name__ == "__main__":
     parser = ArgumentParser(description="Convert a trained PyTorch model into verilog and synthesize it")
-    parser.add_argument('--arch', type=str, choices=configs.keys(), default="jsc-s",
+    parser.add_argument('--arch', type=str, choices=configs.keys(), default="mnist-s",
         help="Specify the neural network model to use (default: %(default)s)")

From 54c6d5cdac5e28baee983092a80f29984ca1b91b Mon Sep 17 00:00:00 2001
From: Nick Fraser
Date: Wed, 4 Jan 2023 17:37:28 +0000
Subject: [PATCH 36/64] [mnist] Added first version of dataset_dump file, ready for testing.
---
 examples/mnist/dataset_dump.py | 131 +++++++++++++++++++++++++++
 1 file changed, 131 insertions(+)
 create mode 100644 examples/mnist/dataset_dump.py

diff --git a/examples/mnist/dataset_dump.py b/examples/mnist/dataset_dump.py
new file mode 100644
index 000000000..5c96d7616
--- /dev/null
+++ b/examples/mnist/dataset_dump.py
@@ -0,0 +1,131 @@
+# Copyright (C) 2021 Xilinx, Inc
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+ +import os +from argparse import ArgumentParser +from functools import reduce, partial + +import torch +from torch.utils.data import DataLoader +from torchvision.datasets import MNIST +from torchvision import transforms + +from logicnets.nn import generate_truth_tables, \ + lut_inference, \ + module_list_to_verilog_module +from logicnets.synthesis import synthesize_and_get_resource_counts + +from train import configs, model_config, other_options, test +from models import MnistNeqModel, MnistLutModel + +def dump_io(model, data_loader, input_file, output_file): + input_quant = model.module_list[0].input_quant + _, input_bitwidth = input_quant.get_scale_factor_bits() + input_bitwidth = int(input_bitwidth) + total_input_bits = model.module_list[0].in_features*input_bitwidth + input_quant.bin_output() + with open(input_file, 'w') as i_f, open(output_file, 'w') as o_f: + for data, target in data_loader: + x = input_quant(data) + indices = target + for i in range(x.shape[0]): + x_i = x[i,:] + xv_i = list(map(lambda z: input_quant.get_bin_str(z), x_i)) + xvc_i = reduce(lambda a,b: a+b, xv_i[::-1]) + i_f.write(f"{int(xvc_i,2):0{int(total_input_bits)}b}\n") + o_f.write(f"{int(indices[i])}\n") + +if __name__ == "__main__": + parser = ArgumentParser(description="Dump the train and test datasets (after input quantization) into text files") + parser.add_argument('--arch', type=str, choices=configs.keys(), default="mnist-s", + help="Specific the neural network model to use (default: %(default)s)") + parser.add_argument('--batch-size', type=int, default=None, metavar='N', + help="Batch size for evaluation (default: %(default)s)") + parser.add_argument('--input-bitwidth', type=int, default=None, + help="Bitwidth to use at the input (default: %(default)s)") + parser.add_argument('--hidden-bitwidth', type=int, default=None, + help="Bitwidth to use for activations in hidden layers (default: %(default)s)") + parser.add_argument('--output-bitwidth', type=int, default=None, + help="Bitwidth to use at the output (default: %(default)s)") + parser.add_argument('--input-fanin', type=int, default=None, + help="Fanin to use at the input (default: %(default)s)") + parser.add_argument('--hidden-fanin', type=int, default=None, + help="Fanin to use for the hidden layers (default: %(default)s)") + parser.add_argument('--output-fanin', type=int, default=None, + help="Fanin to use at the output (default: %(default)s)") + parser.add_argument('--hidden-layers', nargs='+', type=int, default=None, + help="A list of hidden layer neuron sizes (default: %(default)s)") + parser.add_argument('--log-dir', type=str, default='./log', + help="A location to store the output I/O text files (default: %(default)s)") + parser.add_argument('--checkpoint', type=str, required=True, + help="The checkpoint file which contains the model weights") + args = parser.parse_args() + defaults = configs[args.arch] + options = vars(args) + del options['arch'] + config = {} + for k in options.keys(): + config[k] = options[k] if options[k] is not None else defaults[k] # Override defaults, if specified. 
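`dump_io` above writes one line per example: the per-feature binary strings are reversed before concatenation, so the lowest-indexed feature occupies the least-significant bits. A sketch of decoding one such line back into integer feature values (the bit width and sample line are illustrative):

```python
# Sketch: recover per-feature integers from one line of train_input.txt.
# Assumes the LSB-first packing used by dump_io; values are illustrative.
input_bitwidth = 1  # bits per feature, must match the input quantizer
line = "0110"       # one dumped line (most-significant feature first)
chunks = [line[i:i + input_bitwidth] for i in range(0, len(line), input_bitwidth)]
values = [int(c, 2) for c in chunks[::-1]]  # undo the reversal: feature 0 first
```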
+ + if not os.path.exists(config['log_dir']): + os.makedirs(config['log_dir']) + + # Split up configuration options to be more understandable + model_cfg = {} + for k in model_config.keys(): + model_cfg[k] = config[k] + options_cfg = {} + for k in other_options.keys(): + if k == 'cuda': + continue + options_cfg[k] = config[k] + + trans = transform=transforms.Compose([ + transforms.ToTensor(), + transforms.Normalize((0.1307,), (0.3081,)), + transforms.Lambda(partial(torch.reshape, shape=(-1,))) + ]) + + # Fetch the datasets + dataset = {} + dataset['train'] = MNIST('./data', train=True, download=True, transform=trans) + dataset['test'] = MNIST('./data', train=False, download=True, transform=trans) + train_loader = DataLoader(dataset["train"], batch_size=config['batch_size'], shuffle=False) + test_loader = DataLoader(dataset["test"], batch_size=config['batch_size'], shuffle=False) + + # Instantiate the PyTorch model + x, y = dataset["train"][0] + model_cfg['input_length'] = len(x) + model_cfg['output_length'] = 10 + model = MnistNeqModel(model_cfg) + + # Load the model weights + checkpoint = torch.load(options_cfg['checkpoint'], map_location='cpu') + model.load_state_dict(checkpoint['model_dict']) + + # Test the PyTorch model + print("Running inference on baseline model...") + model.eval() + baseline_accuracy = test(model, test_loader, cuda=False) + print("Baseline accuracy: %f" % (baseline_accuracy)) + + # Run preprocessing on training set. + train_input_file = config['log_dir'] + "/train_input.txt" + train_output_file = config['log_dir'] + "/train_output.txt" + test_input_file = config['log_dir'] + "/test_input.txt" + test_output_file = config['log_dir'] + "/test_output.txt" + print(f"Dumping train I/O to {train_input_file} and {train_output_file}") + dump_io(model, train_loader, train_input_file, train_output_file) + print(f"Dumping test I/O to {test_input_file} and {test_output_file}") + dump_io(model, test_loader, test_input_file, test_output_file) From 0c3bcf6e108b57c7b57b3e4b7580b7ab781e5cde Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Thu, 5 Jan 2023 10:44:35 +0000 Subject: [PATCH 37/64] [mnist] First version of MNIST-S. ~96% accuracy. --- examples/mnist/models.py | 2 +- examples/mnist/train.py | 8 ++++---- 2 files changed, 5 insertions(+), 5 deletions(-) diff --git a/examples/mnist/models.py b/examples/mnist/models.py index a67a9128d..be2001b71 100644 --- a/examples/mnist/models.py +++ b/examples/mnist/models.py @@ -41,7 +41,7 @@ def __init__(self, model_config): out_features = self.num_neurons[i] bn = nn.BatchNorm1d(out_features) if i == 1: - do_in = nn.Dropout(p=0.3) + do_in = nn.Dropout(p=0.01) bn_in = nn.BatchNorm1d(in_features) input_bias = ScalarBiasScale(scale=False, bias_init=-0.25) input_quant = QuantBrevitasActivation(QuantHardTanh(model_config["input_bitwidth"], max_val=1., narrow_range=False, quant_type=QuantType.INT, scaling_impl_type=ScalingImplType.PARAMETER), pre_transforms=[do_in, bn_in, input_bias]) diff --git a/examples/mnist/train.py b/examples/mnist/train.py index fb7cf10c0..118e820a8 100644 --- a/examples/mnist/train.py +++ b/examples/mnist/train.py @@ -32,13 +32,13 @@ # TODO: Replace default configs with YAML files. 
configs = { "mnist-s": { - "hidden_layers": [512, 256, 128, 100], + "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], "input_bitwidth": 1, "hidden_bitwidth": 1, "output_bitwidth": 4, - "input_fanin": 6, - "hidden_fanin": 6, - "output_fanin": 6, + "input_fanin": 8, + "hidden_fanin": 8, + "output_fanin": 8, "weight_decay": 1e-3, "batch_size": 1024, "epochs": 1000, From 8a7d5817958202510a1520cbf871015ba7f06989 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Thu, 2 Feb 2023 11:20:48 +0000 Subject: [PATCH 38/64] [examples/mnist] Added v1.1 models and seeds s-1.1, m-1.1, l-1.1 get ~94.9, ~97.8, ~98.0 respectively. --- examples/mnist/models.py | 6 ++- examples/mnist/train.py | 82 ++++++++++++++++++++++++++++++++++------ 2 files changed, 76 insertions(+), 12 deletions(-) diff --git a/examples/mnist/models.py b/examples/mnist/models.py index be2001b71..ec81bd710 100644 --- a/examples/mnist/models.py +++ b/examples/mnist/models.py @@ -40,9 +40,13 @@ def __init__(self, model_config): in_features = self.num_neurons[i-1] out_features = self.num_neurons[i] bn = nn.BatchNorm1d(out_features) + nn.init.constant_(bn.weight.data, 1) + nn.init.constant_(bn.bias.data, 0) if i == 1: - do_in = nn.Dropout(p=0.01) + do_in = nn.Dropout(p=0.1) bn_in = nn.BatchNorm1d(in_features) + nn.init.constant_(bn_in.weight.data, 1) + nn.init.constant_(bn_in.bias.data, 0) input_bias = ScalarBiasScale(scale=False, bias_init=-0.25) input_quant = QuantBrevitasActivation(QuantHardTanh(model_config["input_bitwidth"], max_val=1., narrow_range=False, quant_type=QuantType.INT, scaling_impl_type=ScalingImplType.PARAMETER), pre_transforms=[do_in, bn_in, input_bias]) output_quant = QuantBrevitasActivation(QuantReLU(bit_width=model_config["hidden_bitwidth"], max_val=1.61, quant_type=QuantType.INT, scaling_impl_type=ScalingImplType.PARAMETER), pre_transforms=[bn]) diff --git a/examples/mnist/train.py b/examples/mnist/train.py index 118e820a8..6bebd21e2 100644 --- a/examples/mnist/train.py +++ b/examples/mnist/train.py @@ -43,32 +43,77 @@ "batch_size": 1024, "epochs": 1000, "learning_rate": 1e-3, - "seed": 0, + "seed": 5, + "checkpoint": None, + }, + "mnist-s-1.1": { + "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], + "input_bitwidth": 1, + "hidden_bitwidth": 1, + "output_bitwidth": 4, + "input_fanin": 6, + "hidden_fanin": 6, + "output_fanin": 6, + "weight_decay": 1e-3, + "batch_size": 1024, + "epochs": 1000, + "learning_rate": 1e-3, + "seed": 18, "checkpoint": None, }, "mnist-m": { - "hidden_layers": [512, 256, 128, 100], + "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], + "input_bitwidth": 1, + "hidden_bitwidth": 1, + "output_bitwidth": 4, + "input_fanin": 10, + "hidden_fanin": 10, + "output_fanin": 10, + "weight_decay": 1e-3, + "batch_size": 1024, + "epochs": 1000, + "learning_rate": 1e-3, + "seed": 0, + "checkpoint": None, + }, + "mnist-m-1.1": { + "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], "input_bitwidth": 2, "hidden_bitwidth": 2, "output_bitwidth": 4, - "input_fanin": 4, - "hidden_fanin": 4, - "output_fanin": 4, + "input_fanin": 5, + "hidden_fanin": 5, + "output_fanin": 5, "weight_decay": 1e-3, "batch_size": 1024, "epochs": 1000, "learning_rate": 1e-3, - "seed": 0, + "seed": 20, "checkpoint": None, }, - "mnist-l": { - "hidden_layers": [512, 256, 128, 100], + "mnist-m-1.2": { + "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], "input_bitwidth": 3, "hidden_bitwidth": 3, "output_bitwidth": 4, - "input_fanin": 4, - "hidden_fanin": 4, - "output_fanin": 4, + "input_fanin": 3, + "hidden_fanin": 3, + 
"output_fanin": 3, + "weight_decay": 1e-3, + "batch_size": 1024, + "epochs": 1000, + "learning_rate": 1e-3, + "seed": 0, + "checkpoint": None, + }, + "mnist-l": { + "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], + "input_bitwidth": 1, + "hidden_bitwidth": 1, + "output_bitwidth": 4, + "input_fanin": 12, + "hidden_fanin": 12, + "output_fanin": 12, "weight_decay": 1e-3, "batch_size": 1024, "epochs": 1000, @@ -76,6 +121,21 @@ "seed": 0, "checkpoint": None, }, + "mnist-l-1.1": { + "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], + "input_bitwidth": 2, + "hidden_bitwidth": 2, + "output_bitwidth": 4, + "input_fanin": 6, + "hidden_fanin": 6, + "output_fanin": 6, + "weight_decay": 1e-3, + "batch_size": 1024, + "epochs": 1000, + "learning_rate": 1e-3, + "seed": 12, + "checkpoint": None, + }, } # A dictionary, so we can set some defaults if necessary From abc13e33637617480d407304bb276072c6a89842 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 28 Feb 2023 17:38:02 +0000 Subject: [PATCH 39/64] [ex/mnist] Added input_dropout as a configurable parameter --- examples/mnist/models.py | 2 +- examples/mnist/neq2lut.py | 2 ++ examples/mnist/train.py | 10 ++++++++++ 3 files changed, 13 insertions(+), 1 deletion(-) diff --git a/examples/mnist/models.py b/examples/mnist/models.py index ec81bd710..fcedfd932 100644 --- a/examples/mnist/models.py +++ b/examples/mnist/models.py @@ -43,7 +43,7 @@ def __init__(self, model_config): nn.init.constant_(bn.weight.data, 1) nn.init.constant_(bn.bias.data, 0) if i == 1: - do_in = nn.Dropout(p=0.1) + do_in = nn.Dropout(p=model_config["input_dropout"]) bn_in = nn.BatchNorm1d(in_features) nn.init.constant_(bn_in.weight.data, 1) nn.init.constant_(bn_in.bias.data, 0) diff --git a/examples/mnist/neq2lut.py b/examples/mnist/neq2lut.py index ec887fb7e..6a3007080 100644 --- a/examples/mnist/neq2lut.py +++ b/examples/mnist/neq2lut.py @@ -60,6 +60,8 @@ help="Fanin to use at the output (default: %(default)s)") parser.add_argument('--hidden-layers', nargs='+', type=int, default=None, help="A list of hidden layer neuron sizes (default: %(default)s)") + parser.add_argument('--input-dropout', type=float, default=None, + help="The amount of dropout to apply at the model input (default: %(default)s)") parser.add_argument('--clock-period', type=float, default=1.0, help="Target clock frequency to use during Vivado synthesis (default: %(default)s)") parser.add_argument('--dataset-split', type=str, default='test', choices=['train', 'test'], diff --git a/examples/mnist/train.py b/examples/mnist/train.py index 6bebd21e2..c23ab59cf 100644 --- a/examples/mnist/train.py +++ b/examples/mnist/train.py @@ -39,6 +39,7 @@ "input_fanin": 8, "hidden_fanin": 8, "output_fanin": 8, + "input_dropout": 0.01, "weight_decay": 1e-3, "batch_size": 1024, "epochs": 1000, @@ -54,6 +55,7 @@ "input_fanin": 6, "hidden_fanin": 6, "output_fanin": 6, + "input_dropout": 0.1, "weight_decay": 1e-3, "batch_size": 1024, "epochs": 1000, @@ -69,6 +71,7 @@ "input_fanin": 10, "hidden_fanin": 10, "output_fanin": 10, + "input_dropout": 0.01, "weight_decay": 1e-3, "batch_size": 1024, "epochs": 1000, @@ -84,6 +87,7 @@ "input_fanin": 5, "hidden_fanin": 5, "output_fanin": 5, + "input_dropout": 0.1, "weight_decay": 1e-3, "batch_size": 1024, "epochs": 1000, @@ -99,6 +103,7 @@ "input_fanin": 3, "hidden_fanin": 3, "output_fanin": 3, + "input_dropout": 0.01, "weight_decay": 1e-3, "batch_size": 1024, "epochs": 1000, @@ -114,6 +119,7 @@ "input_fanin": 12, "hidden_fanin": 12, "output_fanin": 12, + "input_dropout": 0.01, 
"weight_decay": 1e-3, "batch_size": 1024, "epochs": 1000, @@ -129,6 +135,7 @@ "input_fanin": 6, "hidden_fanin": 6, "output_fanin": 6, + "input_dropout": 0.1, "weight_decay": 1e-3, "batch_size": 1024, "epochs": 1000, @@ -147,6 +154,7 @@ "input_fanin": None, "hidden_fanin": None, "output_fanin": None, + "input_dropout": None, } training_config = { @@ -301,6 +309,8 @@ def test(model, dataset_loader, cuda): help="Fanin to use at the output (default: %(default)s)") parser.add_argument('--hidden-layers', nargs='+', type=int, default=None, help="A list of hidden layer neuron sizes (default: %(default)s)") + parser.add_argument('--input-dropout', type=float, default=None, + help="The amount of dropout to apply at the model input (default: %(default)s)") parser.add_argument('--log-dir', type=str, default='./log', help="A location to store the log output of the training run and the output model (default: %(default)s)") parser.add_argument('--checkpoint', type=str, default=None, From 1feca628873501d91de0dbae6fd830142e0f34e9 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 28 Feb 2023 17:38:39 +0000 Subject: [PATCH 40/64] [ex/mnist] Updated seed for mnist-m --- examples/mnist/train.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/examples/mnist/train.py b/examples/mnist/train.py index c23ab59cf..fed1a322b 100644 --- a/examples/mnist/train.py +++ b/examples/mnist/train.py @@ -76,7 +76,7 @@ "batch_size": 1024, "epochs": 1000, "learning_rate": 1e-3, - "seed": 0, + "seed": 2, "checkpoint": None, }, "mnist-m-1.1": { From aca10f133cd9c0d4343654d001483dadd94d6ebc Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 28 Feb 2023 17:39:18 +0000 Subject: [PATCH 41/64] [ex/mnist] Added very small configs --- examples/mnist/train.py | 32 ++++++++++++++++++++++++++++++++ 1 file changed, 32 insertions(+) diff --git a/examples/mnist/train.py b/examples/mnist/train.py index fed1a322b..1f5bf7e7f 100644 --- a/examples/mnist/train.py +++ b/examples/mnist/train.py @@ -31,6 +31,38 @@ # TODO: Replace default configs with YAML files. 
configs = { + "mnist-xxs": { + "hidden_layers": [1024, 1024, 1024, 128], + "input_bitwidth": 1, + "hidden_bitwidth": 1, + "output_bitwidth": 4, + "input_fanin": 8, + "hidden_fanin": 8, + "output_fanin": 8, + "input_dropout": 0.01, + "weight_decay": 1e-3, + "batch_size": 1024, + "epochs": 1000, + "learning_rate": 1e-3, + "seed": 0, + "checkpoint": None, + }, + "mnist-xs": { + "hidden_layers": [1024, 1024, 128], + "input_bitwidth": 1, + "hidden_bitwidth": 1, + "output_bitwidth": 4, + "input_fanin": 8, + "hidden_fanin": 8, + "output_fanin": 8, + "input_dropout": 0.01, + "weight_decay": 1e-3, + "batch_size": 1024, + "epochs": 1000, + "learning_rate": 1e-3, + "seed": 0, + "checkpoint": None, + }, "mnist-s": { "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], "input_bitwidth": 1, From 0de0ba25ef04d72d6f4f96ee5e8a1cd558ef86a6 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Tue, 28 Feb 2023 18:03:15 +0000 Subject: [PATCH 42/64] [ex/mnist] Updated mnist example to track cares --- examples/mnist/dump_luts.py | 122 ++++++++++++++++++++++++++++++++++++ examples/mnist/models.py | 17 ++--- examples/mnist/neq2lut.py | 18 ++++-- examples/mnist/train.py | 18 ++++++ 4 files changed, 164 insertions(+), 11 deletions(-) create mode 100644 examples/mnist/dump_luts.py diff --git a/examples/mnist/dump_luts.py b/examples/mnist/dump_luts.py new file mode 100644 index 000000000..071e96861 --- /dev/null +++ b/examples/mnist/dump_luts.py @@ -0,0 +1,122 @@ +# Copyright (C) 2021 Xilinx, Inc +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
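The script below runs LUT inference with `track_used_luts=True`, so during inference each neuron accumulates a histogram counting how often every entry of its truth table is exercised. One natural use of those counters, sketched here under the assumption that each histogram is a 1-D integer tensor with one bin per truth-table entry, is to measure how many entries are never hit and are therefore don't-care candidates for downstream logic optimization:

```python
# Sketch: summarize a per-neuron LUT usage histogram gathered with
# track_used_luts=True. Assumes one integer counter per truth-table entry.
import torch

def unused_entry_fraction(histogram: torch.Tensor) -> float:
    # Entries with a zero count were never exercised by the dataset and
    # could be treated as don't-cares during logic optimization.
    return (histogram == 0).float().mean().item()

# Example: a 16-entry truth table where only three entries were ever hit.
hist = torch.zeros(16, dtype=torch.int64)
hist[torch.tensor([0, 5, 9])] = torch.tensor([120, 7, 33])
print(f"{unused_entry_fraction(hist):.2%} of entries unused")
```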
+
+import os
+from argparse import ArgumentParser
+from functools import partial
+
+import torch
+from torch.utils.data import DataLoader
+from torchvision.datasets import MNIST
+from torchvision import transforms
+
+from logicnets.nn import generate_truth_tables, \
+                         lut_inference, \
+                         save_luts, \
+                         module_list_to_verilog_module
+
+from models import MnistNeqModel, MnistLutModel
+from train import configs, model_config, other_options, test
+from logicnets.synthesis import synthesize_and_get_resource_counts
+
+if __name__ == "__main__":
+    parser = ArgumentParser(description="Generate histograms of states used throughout LogicNets")
+    parser.add_argument('--arch', type=str, choices=configs.keys(), default="mnist-s",
+        help="Specify the neural network model to use (default: %(default)s)")
+    parser.add_argument('--batch-size', type=int, default=None, metavar='N',
+        help="Batch size for evaluation (default: %(default)s)")
+    parser.add_argument('--input-bitwidth', type=int, default=None,
+        help="Bitwidth to use at the input (default: %(default)s)")
+    parser.add_argument('--hidden-bitwidth', type=int, default=None,
+        help="Bitwidth to use for activations in hidden layers (default: %(default)s)")
+    parser.add_argument('--output-bitwidth', type=int, default=None,
+        help="Bitwidth to use at the output (default: %(default)s)")
+    parser.add_argument('--input-fanin', type=int, default=None,
+        help="Fanin to use at the input (default: %(default)s)")
+    parser.add_argument('--hidden-fanin', type=int, default=None,
+        help="Fanin to use for the hidden layers (default: %(default)s)")
+    parser.add_argument('--output-fanin', type=int, default=None,
+        help="Fanin to use at the output (default: %(default)s)")
+    parser.add_argument('--hidden-layers', nargs='+', type=int, default=None,
+        help="A list of hidden layer neuron sizes (default: %(default)s)")
+    parser.add_argument('--log-dir', type=str, default='./log',
+        help="A location to store the calculated histograms (default: %(default)s)")
+    parser.add_argument('--checkpoint', type=str, required=True,
+        help="The checkpoint file which contains the model weights")
+    args = parser.parse_args()
+    defaults = configs[args.arch]
+    options = vars(args)
+    del options['arch']
+    config = {}
+    for k in options.keys():
+        config[k] = options[k] if options[k] is not None else defaults[k] # Override defaults, if specified.
+
+    if not os.path.exists(config['log_dir']):
+        os.makedirs(config['log_dir'])
+
+    # Split up configuration options to be more understandable
+    model_cfg = {}
+    for k in model_config.keys():
+        model_cfg[k] = config[k]
+    options_cfg = {}
+    for k in other_options.keys():
+        if k == 'cuda':
+            continue
+        options_cfg[k] = config[k]
+
+    trans = transform=transforms.Compose([
+                transforms.ToTensor(),
+                transforms.Normalize((0.1307,), (0.3081,)),
+                transforms.Lambda(partial(torch.reshape, shape=(-1,)))
+                ])
+
+    # Fetch the test set
+    dataset = {}
+    dataset[args.dataset_split] = MNIST('./data', train=args.dataset_split == "train", download=True, transform=trans)
+    test_loader = DataLoader(dataset[args.dataset_split], batch_size=config['batch_size'], shuffle=False)
+
+    # Instantiate the PyTorch model
+    x, y = dataset[args.dataset_split][0]
+    model_cfg['input_length'] = len(x)
+    model_cfg['output_length'] = 10
+    model = MnistNeqModel(model_cfg)
+
+    # Load the model weights
+    checkpoint = torch.load(options_cfg['checkpoint'], map_location='cpu')
+    model.load_state_dict(checkpoint['model_dict'])
+
+    # Test the PyTorch model
+    print("Running inference of baseline model on training set (%d examples)..." % (dataset_length))
+    model.eval()
+    baseline_accuracy = test(model, train_loader, cuda=False)
+    print("Baseline accuracy: %f" % (baseline_accuracy))
+
+    # Instantiate LUT-based model
+    lut_model = MnistLutModel(model_cfg)
+    lut_model.load_state_dict(checkpoint['model_dict'])
+
+    # Generate the truth tables in the LUT module
+    print("Converting NEQs to LUTs...")
+    generate_truth_tables(lut_model, verbose=True)
+
+    # Test the LUT-based model
+    print("Running inference of LUT-based model on training set (%d examples)..." % (dataset_length))
+    lut_inference(lut_model, track_used_luts=True)
+    lut_model.eval()
+    lut_accuracy = test(lut_model, train_loader, cuda=False)
+    print("LUT-Based Model accuracy: %f" % (lut_accuracy))
+    print("Saving LUTs to %s... 
" % (options_cfg["log_dir"] + "/luts.pth")) + save_luts(lut_model, options_cfg["log_dir"] + "/luts.pth") + print("Done!") + diff --git a/examples/mnist/models.py b/examples/mnist/models.py index fcedfd932..1afeaf21e 100644 --- a/examples/mnist/models.py +++ b/examples/mnist/models.py @@ -70,13 +70,15 @@ def __init__(self, model_config): self.verilog_dir = None self.top_module_filename = None self.dut = None + self.verify = True self.logfile = None - def verilog_inference(self, verilog_dir, top_module_filename, logfile: bool = False, add_registers: bool = False): + def verilog_inference(self, verilog_dir, top_module_filename, logfile: bool = False, add_registers: bool = False, verify: bool = True): self.verilog_dir = realpath(verilog_dir) self.top_module_filename = top_module_filename - self.dut = PyVerilator.build(f"{self.verilog_dir}/{self.top_module_filename}", verilog_path=[self.verilog_dir], build_dir=f"{self.verilog_dir}/verilator") + self.dut = PyVerilator.build(f"{self.verilog_dir}/{self.top_module_filename}", verilog_path=[self.verilog_dir], build_dir=f"{self.verilog_dir}/verilator", command_args=("--x-assign","0",)) self.is_verilog_inference = True + self.verify = verify self.logfile = logfile if add_registers: self.latency = len(self.num_neurons) @@ -102,11 +104,8 @@ def verilog_forward(self, x): self.dut.io.clk = 0 for i in range(x.shape[0]): x_i = x[i,:] - y_i = self.pytorch_forward(x[i:i+1,:])[0] xv_i = list(map(lambda z: input_quant.get_bin_str(z), x_i)) - ys_i = list(map(lambda z: output_quant.get_bin_str(z), y_i)) xvc_i = reduce(lambda a,b: a+b, xv_i[::-1]) - ysc_i = reduce(lambda a,b: a+b, ys_i[::-1]) self.dut["M0"] = int(xvc_i, 2) for j in range(self.latency + 1): #print(self.dut.io.M5) @@ -114,9 +113,13 @@ def verilog_forward(self, x): result = f"{res:0{int(total_output_bits)}b}" self.dut.io.clk = 1 self.dut.io.clk = 0 - expected = f"{int(ysc_i,2):0{int(total_output_bits)}b}" result = f"{res:0{int(total_output_bits)}b}" - assert(expected == result) + if self.verify: + y_i = self.pytorch_forward(x[i:i+1,:])[0] + ys_i = list(map(lambda z: output_quant.get_bin_str(z), y_i)) + ysc_i = reduce(lambda a,b: a+b, ys_i[::-1]) + expected = f"{int(ysc_i,2):0{int(total_output_bits)}b}" + assert(expected == result) res_split = [result[i:i+output_bitwidth] for i in range(0, len(result), output_bitwidth)][::-1] yv_i = torch.Tensor(list(map(lambda z: int(z, 2), res_split))) y[i,:] = yv_i diff --git a/examples/mnist/neq2lut.py b/examples/mnist/neq2lut.py index 6a3007080..533ae6e4b 100644 --- a/examples/mnist/neq2lut.py +++ b/examples/mnist/neq2lut.py @@ -23,7 +23,8 @@ from logicnets.nn import generate_truth_tables, \ lut_inference, \ - module_list_to_verilog_module + module_list_to_verilog_module, \ + load_histograms from logicnets.synthesis import synthesize_and_get_resource_counts from logicnets.util import proc_postsynth_file @@ -36,6 +37,8 @@ "checkpoint": None, "generate_bench": False, "add_registers": False, + "histograms": None, + "freq_thresh": None, "simulate_pre_synthesis_verilog": False, "simulate_post_synthesis_verilog": False, } @@ -70,6 +73,10 @@ help="A location to store the log output of the training run and the output model (default: %(default)s)") parser.add_argument('--checkpoint', type=str, required=True, help="The checkpoint file which contains the model weights") + parser.add_argument('--histograms', type=str, default=None, + help="The checkpoint histograms of LUT usage (default: %(default)s)") + parser.add_argument('--freq-thresh', type=int, default=None, + 
help="Threshold to use to include this truth table into the model (default: %(default)s)") parser.add_argument('--generate-bench', action='store_true', default=False, help="Generate the truth table in BENCH format as well as verilog (default: %(default)s)") parser.add_argument('--dump-io', action='store_true', default=False, @@ -146,9 +153,12 @@ 'test_accuracy': lut_accuracy} torch.save(modelSave, options_cfg["log_dir"] + "/lut_based_model.pth") + if options_cfg["histograms"] is not None: + luts = torch.load(options_cfg["histograms"]) + load_histograms(lut_model, luts) print("Generating verilog in %s..." % (options_cfg["log_dir"])) - module_list_to_verilog_module(lut_model.module_list, "logicnet", options_cfg["log_dir"], generate_bench=options_cfg["generate_bench"], add_registers=options_cfg["add_registers"]) + module_list_to_verilog_module(lut_model.module_list, "logicnet", options_cfg["log_dir"], generate_bench=options_cfg["generate_bench"], add_registers=options_cfg["add_registers"], freq_thresh=options_cfg["freq_thresh"]) print("Top level entity stored at: %s/logicnet.v ..." % (options_cfg["log_dir"])) if args.dump_io: @@ -161,7 +171,7 @@ if args.simulate_pre_synthesis_verilog: print("Running inference simulation of Verilog-based model...") - lut_model.verilog_inference(options_cfg["log_dir"], "logicnet.v", logfile=io_filename, add_registers=options_cfg["add_registers"]) + lut_model.verilog_inference(options_cfg["log_dir"], "logicnet.v", logfile=io_filename, add_registers=options_cfg["add_registers"], verify=options_cfg["freq_thresh"] is None or options_cfg["freq_thresh"] == 0) verilog_accuracy = test(lut_model, test_loader, cuda=False) print("Verilog-Based Model accuracy: %f" % (verilog_accuracy)) @@ -171,7 +181,7 @@ if args.simulate_post_synthesis_verilog: print("Running post-synthesis inference simulation of Verilog-based model...") proc_postsynth_file(options_cfg["log_dir"]) - lut_model.verilog_inference(options_cfg["log_dir"]+"/post_synth", "logicnet_post_synth.v", io_filename, add_registers=options_cfg["add_registers"]) + lut_model.verilog_inference(options_cfg["log_dir"]+"/post_synth", "logicnet_post_synth.v", io_filename, add_registers=options_cfg["add_registers"], verify=options_cfg["freq_thresh"] is None or options_cfg["freq_thresh"] == 0) post_synth_accuracy = test(lut_model, test_loader, cuda=False) print("Post-synthesis Verilog-Based Model accuracy: %f" % (post_synth_accuracy)) diff --git a/examples/mnist/train.py b/examples/mnist/train.py index 1f5bf7e7f..a7e635f64 100644 --- a/examples/mnist/train.py +++ b/examples/mnist/train.py @@ -46,6 +46,8 @@ "learning_rate": 1e-3, "seed": 0, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "mnist-xs": { "hidden_layers": [1024, 1024, 128], @@ -62,6 +64,8 @@ "learning_rate": 1e-3, "seed": 0, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "mnist-s": { "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], @@ -78,6 +82,8 @@ "learning_rate": 1e-3, "seed": 5, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "mnist-s-1.1": { "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], @@ -94,6 +100,8 @@ "learning_rate": 1e-3, "seed": 18, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "mnist-m": { "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], @@ -110,6 +118,8 @@ "learning_rate": 1e-3, "seed": 2, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "mnist-m-1.1": { "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], @@ -126,6 +136,8 @@ 
"learning_rate": 1e-3, "seed": 20, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "mnist-m-1.2": { "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], @@ -142,6 +154,8 @@ "learning_rate": 1e-3, "seed": 0, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "mnist-l": { "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], @@ -158,6 +172,8 @@ "learning_rate": 1e-3, "seed": 0, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, "mnist-l-1.1": { "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], @@ -174,6 +190,8 @@ "learning_rate": 1e-3, "seed": 12, "checkpoint": None, + "histograms": None, + "freq_thresh": None, }, } From 811f65f6540030b7275c6cdf8a822317ec6b2748 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Wed, 1 Mar 2023 12:01:51 +0000 Subject: [PATCH 43/64] [ex/mnist] Added dropout parameter to dataset/lut dumping scripts --- examples/mnist/dataset_dump.py | 2 ++ examples/mnist/dump_luts.py | 2 ++ 2 files changed, 4 insertions(+) diff --git a/examples/mnist/dataset_dump.py b/examples/mnist/dataset_dump.py index 5c96d7616..0e5963f6f 100644 --- a/examples/mnist/dataset_dump.py +++ b/examples/mnist/dataset_dump.py @@ -66,6 +66,8 @@ def dump_io(model, data_loader, input_file, output_file): help="Fanin to use at the output (default: %(default)s)") parser.add_argument('--hidden-layers', nargs='+', type=int, default=None, help="A list of hidden layer neuron sizes (default: %(default)s)") + parser.add_argument('--input-dropout', type=float, default=None, + help="The amount of dropout to apply at the model input (default: %(default)s)") parser.add_argument('--log-dir', type=str, default='./log', help="A location to store the output I/O text files (default: %(default)s)") parser.add_argument('--checkpoint', type=str, required=True, diff --git a/examples/mnist/dump_luts.py b/examples/mnist/dump_luts.py index 071e96861..baebad927 100644 --- a/examples/mnist/dump_luts.py +++ b/examples/mnist/dump_luts.py @@ -50,6 +50,8 @@ help="Fanin to use at the output (default: %(default)s)") parser.add_argument('--hidden-layers', nargs='+', type=int, default=None, help="A list of hidden layer neuron sizes (default: %(default)s)") + parser.add_argument('--input-dropout', type=float, default=None, + help="The amount of dropout to apply at the model input (default: %(default)s)") parser.add_argument('--log-dir', type=str, default='./log', help="A location to store the calculated histograms (default: %(default)s)") parser.add_argument('--checkpoint', type=str, required=True, From 0a1715f6dfb53486cf9afe747a8c4bfa0f4a7021 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Wed, 1 Mar 2023 12:05:43 +0000 Subject: [PATCH 44/64] [ex/mnist] Bugfix in dataloader instantiation in the LUT dumping script --- examples/mnist/dump_luts.py | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/examples/mnist/dump_luts.py b/examples/mnist/dump_luts.py index baebad927..0b0604071 100644 --- a/examples/mnist/dump_luts.py +++ b/examples/mnist/dump_luts.py @@ -85,11 +85,12 @@ # Fetch the test set dataset = {} - dataset[args.dataset_split] = MNIST('./data', train=args.dataset_split == "train", download=True, transform=trans) - test_loader = DataLoader(dataset[args.dataset_split], batch_size=config['batch_size'], shuffle=False) + dataset["train"] = MNIST('./data', train=True, download=True, transform=trans) + train_loader = DataLoader(dataset["train"], batch_size=config['batch_size'], shuffle=False) # Instantiate the PyTorch model - x, y = 
dataset[args.dataset_split][0] + x, y = dataset["train"][0] + dataset_length = len(dataset['train']) model_cfg['input_length'] = len(x) model_cfg['output_length'] = 10 model = MnistNeqModel(model_cfg) From 3bb764c61008622955366727ec97ea163a9a7b28 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Fri, 3 Mar 2023 10:34:55 +0000 Subject: [PATCH 45/64] [ex/mnist] Added extra M/L configurations --- examples/mnist/train.py | 54 +++++++++++++++++++++++++++++++++++++++++ 1 file changed, 54 insertions(+) diff --git a/examples/mnist/train.py b/examples/mnist/train.py index a7e635f64..dddc85732 100644 --- a/examples/mnist/train.py +++ b/examples/mnist/train.py @@ -157,6 +157,24 @@ "histograms": None, "freq_thresh": None, }, + "mnist-m-1.3": { + "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], + "input_bitwidth": 1, + "hidden_bitwidth": 2, + "output_bitwidth": 4, + "input_fanin": 10, + "hidden_fanin": 5, + "output_fanin": 5, + "input_dropout": 0.1, + "weight_decay": 1e-3, + "batch_size": 1024, + "epochs": 1000, + "learning_rate": 1e-3, + "seed": 20, + "checkpoint": None, + "histograms": None, + "freq_thresh": None, + }, "mnist-l": { "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], "input_bitwidth": 1, @@ -193,6 +211,42 @@ "histograms": None, "freq_thresh": None, }, + "mnist-l-1.2": { + "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], + "input_bitwidth": 1, + "hidden_bitwidth": 2, + "output_bitwidth": 4, + "input_fanin": 12, + "hidden_fanin": 6, + "output_fanin": 6, + "input_dropout": 0.1, + "weight_decay": 1e-3, + "batch_size": 1024, + "epochs": 1000, + "learning_rate": 1e-3, + "seed": 12, + "checkpoint": None, + "histograms": None, + "freq_thresh": None, + }, + "mnist-l-1.3": { + "hidden_layers": [1024, 1024, 1024, 1024, 1024, 128], + "input_bitwidth": 1, + "hidden_bitwidth": 3, + "output_bitwidth": 4, + "input_fanin": 12, + "hidden_fanin": 4, + "output_fanin": 6, + "input_dropout": 0.1, + "weight_decay": 1e-3, + "batch_size": 1024, + "epochs": 1000, + "learning_rate": 1e-3, + "seed": 12, + "checkpoint": None, + "histograms": None, + "freq_thresh": None, + }, } # A dictionary, so we can set some defaults if necessary From 58f2df9cb893e116a0ce0af93bc23071a7dd91a5 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Fri, 3 Mar 2023 10:50:03 +0000 Subject: [PATCH 46/64] [ex/mnist] Updated seeds for m-1.3, l-1.2, l-1.3 for (97.42, 97.63, 97.60) respectively --- examples/mnist/train.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/examples/mnist/train.py b/examples/mnist/train.py index dddc85732..320d9564a 100644 --- a/examples/mnist/train.py +++ b/examples/mnist/train.py @@ -170,7 +170,7 @@ "batch_size": 1024, "epochs": 1000, "learning_rate": 1e-3, - "seed": 20, + "seed": 6, "checkpoint": None, "histograms": None, "freq_thresh": None, @@ -224,7 +224,7 @@ "batch_size": 1024, "epochs": 1000, "learning_rate": 1e-3, - "seed": 12, + "seed": 6, "checkpoint": None, "histograms": None, "freq_thresh": None, @@ -242,7 +242,7 @@ "batch_size": 1024, "epochs": 1000, "learning_rate": 1e-3, - "seed": 12, + "seed": 6, "checkpoint": None, "histograms": None, "freq_thresh": None, From c5c2addcd3c3f429ac4426f150d8d883693edc79 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Fri, 3 Mar 2023 21:01:55 +0000 Subject: [PATCH 47/64] [ex/mnist] Allowed dataloaders to use a few threads --- examples/mnist/train.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/examples/mnist/train.py b/examples/mnist/train.py index 320d9564a..2ed90a72e 100644 --- a/examples/mnist/train.py 
+++ b/examples/mnist/train.py
@@ -277,9 +277,9 @@ def train(model, datasets, train_cfg, options):
 
     # Create data loaders for training and inference:
-    train_loader = DataLoader(datasets["train"], batch_size=train_cfg['batch_size'], shuffle=True)
-    val_loader = DataLoader(datasets["valid"], batch_size=train_cfg['batch_size'], shuffle=False)
-    test_loader = DataLoader(datasets["test"], batch_size=train_cfg['batch_size'], shuffle=False)
+    train_loader = DataLoader(datasets["train"], batch_size=train_cfg['batch_size'], shuffle=True, num_workers=2)
+    val_loader = DataLoader(datasets["valid"], batch_size=train_cfg['batch_size'], shuffle=False, num_workers=2)
+    test_loader = DataLoader(datasets["test"], batch_size=train_cfg['batch_size'], shuffle=False, num_workers=2)
 
     # Configure optimizer
     weight_decay = train_cfg["weight_decay"]

From ddf9f48cfb8ff85f2340fc2538b7b937441cecd4 Mon Sep 17 00:00:00 2001
From: Nick Fraser
Date: Fri, 3 Mar 2023 21:02:50 +0000
Subject: [PATCH 48/64] [ex/mnist] Added random cropping and random rotations
 to image preprocessing

---
 examples/mnist/train.py | 31 +++++++++++++++++++++++--------
 1 file changed, 23 insertions(+), 8 deletions(-)

diff --git a/examples/mnist/train.py b/examples/mnist/train.py
index 2ed90a72e..099ac6ace 100644
--- a/examples/mnist/train.py
+++ b/examples/mnist/train.py
@@ -383,6 +383,11 @@ def test(model, dataset_loader, cuda):
     accuracy = 100*float(correct) / len(dataset_loader.dataset)
     return accuracy
 
+def random_rotation(img, degrees):
+    #img.rotate(angle, resample, expand, center, fillcolor=fill)
+    angle = torch.randint(-degrees, degrees+1, (1,)).detach().numpy()
+    return img.rotate(angle, False, False, None, fillcolor=0)
+
 if __name__ == "__main__":
     parser = ArgumentParser(description="LogicNets MNIST Classification Example")
     parser.add_argument('--arch', type=str, choices=configs.keys(), default="mnist-s",
@@ -450,17 +455,27 @@ def test(model, dataset_loader, cuda):
         torch.cuda.manual_seed_all(train_cfg['seed'])
         torch.backends.cudnn.deterministic = True
 
-    trans = transform=transforms.Compose([
-                transforms.ToTensor(),
-                transforms.Normalize((0.1307,), (0.3081,)),
-                transforms.Lambda(partial(torch.reshape, shape=(-1,)))
-                ])
+    train_transforms = [
+            transforms.RandomCrop(size=28, padding=1),
+            #transforms.RandomRotation(degrees=7),
+            transforms.Lambda(partial(random_rotation, degrees=4)),
+            transforms.ToTensor(),
+            transforms.Normalize((0.1307,), (0.3081,)),
+            transforms.Lambda(partial(torch.reshape, shape=(-1,)))
+        ]
+    train_trans = transforms.Compose(train_transforms)
+    inf_transforms = [
+            transforms.ToTensor(),
+            transforms.Normalize((0.1307,), (0.3081,)),
+            transforms.Lambda(partial(torch.reshape, shape=(-1,)))
+        ]
+    inf_trans = transforms.Compose(inf_transforms)
 
     # Fetch the datasets
     dataset = {}
-    dataset['train'] = MNIST('./data', train=True, download=True, transform=trans)
-    dataset['valid'] = MNIST('./data', train=False, download=True, transform=trans)
-    dataset['test'] = MNIST('./data', train=False, download=True, transform=trans)
+    dataset['train'] = MNIST('./data', train=True, download=True, transform=train_trans)
+    dataset['valid'] = MNIST('./data', train=False, download=True, transform=inf_trans)
+    dataset['test'] = MNIST('./data', train=False, download=True, transform=inf_trans)
 
     # Instantiate model
     x, y = dataset['train'][0]

From 26a6d36f32048ef02dc552e13ac44753f2fc7bea Mon Sep 17 00:00:00 2001
From: Nick Fraser
Date: Sat, 4 Mar 2023 10:54:13 +0000
Subject: [PATCH 49/64] [ex/mnist] Updated training preprocessing transforms

---
examples/mnist/train.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/examples/mnist/train.py b/examples/mnist/train.py index 099ac6ace..e3a5f1da6 100644 --- a/examples/mnist/train.py +++ b/examples/mnist/train.py @@ -457,7 +457,7 @@ def random_rotation(img, degrees): train_transforms = [ transforms.RandomCrop(size=28, padding=1), - #transforms.RandomRotation(degrees=7), + #transforms.RandomRotation(degrees=4), transforms.Lambda(partial(random_rotation, degrees=4)), transforms.ToTensor(), transforms.Normalize((0.1307,), (0.3081,)), From 410d4932876d47682a6a75aebdf3758c5e3be6c0 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Sat, 4 Mar 2023 12:28:57 +0000 Subject: [PATCH 50/64] [abc] Updated pipelining to return #nodes --- src/logicnets/abc.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/logicnets/abc.py b/src/logicnets/abc.py index 14d74c48b..07fd966bf 100644 --- a/src/logicnets/abc.py +++ b/src/logicnets/abc.py @@ -195,7 +195,7 @@ def pipeline_tech_mapped_circuit(circuit_file, output_verilog, num_registers, ab print(nodes) print(out) print(err) - return out, err + return nodes, out, err def tech_map_to_verilog(circuit_file, output_verilog, abc_path=os.environ["ABC_ROOT"], working_dir=None, verbose=False): cmd = [f"{abc_path}/abc", '-c', f"read {circuit_file}; print_stats; write_verilog -fm {output_verilog}"] From c921b1e2971b3c4c22ebca5a67003c96f7bc4d03 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Sun, 5 Mar 2023 12:12:42 +0000 Subject: [PATCH 51/64] [ex/jsc] Bugfix when simulating a pipelined design --- examples/jet_substructure/simulate_verilog.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/examples/jet_substructure/simulate_verilog.py b/examples/jet_substructure/simulate_verilog.py index 15746b802..8a1764f65 100644 --- a/examples/jet_substructure/simulate_verilog.py +++ b/examples/jet_substructure/simulate_verilog.py @@ -105,7 +105,8 @@ verilog_dir = os.path.dirname(options_cfg["input_verilog"]) filename = os.path.split(options_cfg["input_verilog"])[-1] print(f"Running inference simulation of Verilog-based model ({filename})") - model.verilog_inference(verilog_dir, filename, logfile=None, add_registers=options_cfg["num_registers"] == 0, verify=False) + model.verilog_inference(verilog_dir, filename, logfile=None, add_registers=options_cfg["num_registers"] != 0, verify=False) + model.latency = options_cfg["num_registers"] verilog_accuracy = test(model, test_loader, cuda=False) print("Verilog-Based Model accuracy: %f" % (verilog_accuracy)) From 0740d26c1f6c6487bc8d0a486dcc5dd018ecc3a8 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Sun, 5 Mar 2023 12:13:56 +0000 Subject: [PATCH 52/64] [verilog] Adds missing clock from ABC-generated verilog, if necessary --- src/logicnets/verilog.py | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/src/logicnets/verilog.py b/src/logicnets/verilog.py index 9d4f0ab30..2911979e1 100644 --- a/src/logicnets/verilog.py +++ b/src/logicnets/verilog.py @@ -101,7 +101,10 @@ def fix_abc_module_name(input_verilog_file, output_verilog_file, old_module_name f.write("`timescale 1 ps / 1 ps\n") for l in lines: if l.__contains__(f"module {old_module_name}"): - l = f"module {new_module_name} (\n" + if add_timescale: + l = f"module {new_module_name} (clock,\n" + else: + l = f"module {new_module_name} (\n" f.write(l) def generate_abc_verilog_wrapper(module_name: str, input_name: str, input_bits: int, output_name: str, output_bits: int, submodule_name: str, num_registers: int, 
add_timescale: bool = True): From bc34da0f59eafbcbe8f9f067ed54f95f6da4002b Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Sun, 5 Mar 2023 12:15:26 +0000 Subject: [PATCH 53/64] [ex/jsc] Added FPGA synthesis script --- examples/jet_substructure/verilog2bitfile.py | 28 ++++++++++++++++++++ 1 file changed, 28 insertions(+) create mode 100644 examples/jet_substructure/verilog2bitfile.py diff --git a/examples/jet_substructure/verilog2bitfile.py b/examples/jet_substructure/verilog2bitfile.py new file mode 100644 index 000000000..3dfb7b226 --- /dev/null +++ b/examples/jet_substructure/verilog2bitfile.py @@ -0,0 +1,28 @@ +# Copyright (C) 2021 Xilinx, Inc +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +from argparse import ArgumentParser + +from logicnets.synthesis import synthesize_and_get_resource_counts + +if __name__ == "__main__": + parser = ArgumentParser(description="Synthesize convert a PyTorch trained model into verilog") + parser.add_argument('--log-dir', type=str, default='./log', required=True, + help="A location to store the log output of the training run and the output model (default: %(default)s)") + parser.add_argument('--clock-period', type=float, default=1.0, + help="Target clock frequency to use during Vivado synthesis (default: %(default)s)") + args = parser.parse_args() + print("Running out-of-context synthesis") + ret = synthesize_and_get_resource_counts(args.log_dir, "logicnet", fpga_part="xcu280-fsvh2892-2L-e", clk_period_ns=args.clock_period, post_synthesis = 1) + From 7e83a9c2ebb23fa41306a4243a0cd3b367771f26 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Sun, 5 Mar 2023 12:26:04 +0000 Subject: [PATCH 54/64] [ex/jsc] Bugfix / added AVG ROC-AUC to results --- examples/jet_substructure/dump_luts.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/examples/jet_substructure/dump_luts.py b/examples/jet_substructure/dump_luts.py index 05952268e..f99d21651 100644 --- a/examples/jet_substructure/dump_luts.py +++ b/examples/jet_substructure/dump_luts.py @@ -99,8 +99,9 @@ # Test the PyTorch model print("Running inference of baseline model on training set (%d examples)..." % (dataset_length)) model.eval() - baseline_accuracy = test(model, train_loader, cuda=False) + baseline_accuracy, baseline_avg_roc_auc = test(model, test_loader, cuda=False) print("Baseline accuracy: %f" % (baseline_accuracy)) + print("Baseline AVG ROC AUC: %f" % (baseline_avg_roc_auc)) # Instantiate LUT-based model lut_model = JetSubstructureLutModel(model_cfg) @@ -114,8 +115,9 @@ print("Running inference of LUT-based model training set (%d examples)..." % (dataset_length)) lut_inference(lut_model, track_used_luts=True) lut_model.eval() - lut_accuracy = test(lut_model, train_loader, cuda=False) + lut_accuracy, lut_avg_roc_auc = test(lut_model, test_loader, cuda=False) print("LUT-Based Model accuracy: %f" % (lut_accuracy)) + print("LUT-Based AVG ROC AUC: %f" % (lut_avg_roc_auc)) print("Saving LUTs to %s... 
" % (options_cfg["log_dir"] + "/luts.pth")) save_luts(lut_model, options_cfg["log_dir"] + "/luts.pth") print("Done!") From 3b53131bdab15447aa119631fb32f2e029d50d65 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Sun, 5 Mar 2023 12:35:01 +0000 Subject: [PATCH 55/64] [ex/jsc] Bugfix: added AVG ROC-AUC results --- examples/jet_substructure/neq2lut_abc.py | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/examples/jet_substructure/neq2lut_abc.py b/examples/jet_substructure/neq2lut_abc.py index 1f2cc4709..1d2bd7495 100644 --- a/examples/jet_substructure/neq2lut_abc.py +++ b/examples/jet_substructure/neq2lut_abc.py @@ -120,8 +120,9 @@ # Test the PyTorch model print("Running inference on baseline model...") model.eval() - baseline_accuracy = test(model, test_loader, cuda=False) + baseline_accuracy, baseline_avg_roc_auc = test(model, test_loader, cuda=False) print("Baseline accuracy: %f" % (baseline_accuracy)) + print("Baseline AVG ROC AUC: %f" % (baseline_avg_roc_auc)) # Run preprocessing on training set. #train_input_file = config['log_dir'] + "/train_input.txt" @@ -145,10 +146,12 @@ print("Running inference on LUT-based model...") lut_inference(lut_model) lut_model.eval() - lut_accuracy = test(lut_model, test_loader, cuda=False) + lut_accuracy, lut_avg_roc_auc = test(lut_model, test_loader, cuda=False) print("LUT-Based Model accuracy: %f" % (lut_accuracy)) + print("LUT-Based AVG ROC AUC: %f" % (lut_avg_roc_auc)) modelSave = { 'model_dict': lut_model.state_dict(), - 'test_accuracy': lut_accuracy} + 'test_accuracy': lut_accuracy, + 'test_avg_roc_auc': lut_avg_roc_auc} torch.save(modelSave, options_cfg["log_dir"] + "/lut_based_model.pth") if options_cfg["histograms"] is not None: From b42cea7c7a750417c94604aca2be406b9cdad286 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Sun, 5 Mar 2023 12:39:15 +0000 Subject: [PATCH 56/64] [ex/jsc] Bugfix: support measuring AVG ROC-AUC --- examples/jet_substructure/simulate_verilog.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/examples/jet_substructure/simulate_verilog.py b/examples/jet_substructure/simulate_verilog.py index 8a1764f65..0aecf6f44 100644 --- a/examples/jet_substructure/simulate_verilog.py +++ b/examples/jet_substructure/simulate_verilog.py @@ -99,14 +99,16 @@ # Test the PyTorch model print("Running inference on baseline model...") model.eval() - baseline_accuracy = test(model, test_loader, cuda=False) + baseline_accuracy, baseline_avg_roc_auc = test(model, test_loader, cuda=False) print("Baseline accuracy: %f" % (baseline_accuracy)) + print("Baseline AVG ROC AUC: %f" % (baseline_avg_roc_auc)) verilog_dir = os.path.dirname(options_cfg["input_verilog"]) filename = os.path.split(options_cfg["input_verilog"])[-1] print(f"Running inference simulation of Verilog-based model ({filename})") model.verilog_inference(verilog_dir, filename, logfile=None, add_registers=options_cfg["num_registers"] != 0, verify=False) model.latency = options_cfg["num_registers"] - verilog_accuracy = test(model, test_loader, cuda=False) + verilog_accuracy, verilog_avg_roc_auc = test(model, test_loader, cuda=False) print("Verilog-Based Model accuracy: %f" % (verilog_accuracy)) + print("Verilog-Based AVG ROC AUC: %f" % (verilog_avg_roc_auc)) From 70fb8bfb048a22dfeac3c85b397322e11d55745a Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Mon, 6 Mar 2023 13:33:39 +0000 Subject: [PATCH 57/64] [ex/mnist] Initial version supporting ABC flow --- examples/mnist/neq2lut_abc.py | 175 ++++++++++++++++++++++++++++++++++ 1 file changed, 175 
insertions(+) create mode 100644 examples/mnist/neq2lut_abc.py diff --git a/examples/mnist/neq2lut_abc.py b/examples/mnist/neq2lut_abc.py new file mode 100644 index 000000000..69fe9623e --- /dev/null +++ b/examples/mnist/neq2lut_abc.py @@ -0,0 +1,175 @@ +# Copyright (C) 2021 Xilinx, Inc +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import os +from argparse import ArgumentParser +from functools import partial + +import torch +from torch.utils.data import DataLoader +from torchvision.datasets import MNIST +from torchvision import transforms + +from logicnets.nn import generate_truth_tables, \ + lut_inference, \ + module_list_to_verilog_module, \ + load_histograms +from logicnets.synthesis import synthesize_and_get_resource_counts_with_abc + +from models import MnistNeqModel, MnistLutModel +from train import configs, model_config, test +from dataset_dump import dump_io + +other_options = { + "cuda": None, + "log_dir": None, + "checkpoint": None, + "histograms": None, + "freq_thresh": None, +} + +if __name__ == "__main__": + parser = ArgumentParser(description="Synthesize convert a PyTorch trained model into verilog using ABC") + parser.add_argument('--arch', type=str, choices=configs.keys(), default="mnist-s", + help="Specific the neural network model to use (default: %(default)s)") + parser.add_argument('--batch-size', type=int, default=None, metavar='N', + help="Batch size for evaluation (default: %(default)s)") + parser.add_argument('--input-bitwidth', type=int, default=None, + help="Bitwidth to use at the input (default: %(default)s)") + parser.add_argument('--hidden-bitwidth', type=int, default=None, + help="Bitwidth to use for activations in hidden layers (default: %(default)s)") + parser.add_argument('--output-bitwidth', type=int, default=None, + help="Bitwidth to use at the output (default: %(default)s)") + parser.add_argument('--input-fanin', type=int, default=None, + help="Fanin to use at the input (default: %(default)s)") + parser.add_argument('--hidden-fanin', type=int, default=None, + help="Fanin to use for the hidden layers (default: %(default)s)") + parser.add_argument('--output-fanin', type=int, default=None, + help="Fanin to use at the output (default: %(default)s)") + parser.add_argument('--hidden-layers', nargs='+', type=int, default=None, + help="A list of hidden layer neuron sizes (default: %(default)s)") + parser.add_argument('--input-dropout', type=float, default=None, + help="The amount of dropout to apply at the model input (default: %(default)s)") + parser.add_argument('--clock-period', type=float, default=1.0, + help="Target clock frequency to use during Vivado synthesis (default: %(default)s)") + parser.add_argument('--dataset-split', type=str, default='test', choices=['train', 'test'], + help="Dataset to use for evaluation (default: %(default)s)") + parser.add_argument('--log-dir', type=str, default='./log', + help="A location to store the log output of the training run and the output model (default: %(default)s)") + parser.add_argument('--checkpoint', type=str, 
required=True, + help="The checkpoint file which contains the model weights") + parser.add_argument('--histograms', type=str, default=None, + help="The checkpoint histograms of LUT usage (default: %(default)s)") + parser.add_argument('--freq-thresh', type=int, default=None, + help="Threshold to use to include this truth table into the model (default: %(default)s)") + parser.add_argument('--num-registers', type=int, default=0, + help="The number of registers to add to the generated verilog (default: %(default)s)") + args = parser.parse_args() + defaults = configs[args.arch] + options = vars(args) + del options['arch'] + config = {} + for k in options.keys(): + config[k] = options[k] if options[k] is not None else defaults[k] # Override defaults, if specified. + + if not os.path.exists(config['log_dir']): + os.makedirs(config['log_dir']) + + # Split up configuration options to be more understandable + model_cfg = {} + for k in model_config.keys(): + model_cfg[k] = config[k] + dataset_cfg = {} + for k in dataset_config.keys(): + dataset_cfg[k] = config[k] + options_cfg = {} + for k in other_options.keys(): + if k == 'cuda': + continue + options_cfg[k] = config[k] + + trans = transform=transforms.Compose([ + transforms.ToTensor(), + transforms.Normalize((0.1307,), (0.3081,)), + transforms.Lambda(partial(torch.reshape, shape=(-1,))) + ]) + + # Fetch the test set + dataset = {} + dataset["train"] = MNIST('./data', train=True, download=True, transform=trans) + dataset["test"] = MNIST('./data', train=False, download=True, transform=trans) + train_loader = DataLoader(dataset["train"], batch_size=config['batch_size'], shuffle=False) + test_loader = DataLoader(dataset["test"], batch_size=config['batch_size'], shuffle=False) + + + # Instantiate the PyTorch model + x, y = dataset[args.dataset_split][0] + model_cfg['input_length'] = len(x) + model_cfg['output_length'] = 10 + model = MnistNeqModel(model_cfg) + + # Load the model weights + checkpoint = torch.load(options_cfg['checkpoint'], map_location='cpu') + model.load_state_dict(checkpoint['model_dict']) + + # Test the PyTorch model + print("Running inference on baseline model...") + model.eval() + baseline_accuracy = test(model, test_loader, cuda=False) + print("Baseline accuracy: %f" % (baseline_accuracy)) + + # Run preprocessing on training set. 
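    # The commented-out block below would regenerate the train/test I/O text
    # files that synthesize_and_get_resource_counts_with_abc() consumes as
    # train_input.txt etc.; dump_io() (imported from dataset_dump above) is
    # the canonical writer. As a sketch of the format these files are assumed
    # to carry (one '0'/'1' string per sample, matching the line-of-bits
    # reader that abc.patch later in this series enlarges), a hypothetical
    # writer would be:
    #
    #     def dump_bitstrings(bin_vectors, path):
    #         with open(path, "w") as f:
    #             for vec in bin_vectors:
    #                 f.write("".join(str(int(b)) for b in vec) + "\n")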
+    #train_input_file = config['log_dir'] + "/train_input.txt"
+    #train_output_file = config['log_dir'] + "/train_output.txt"
+    #test_input_file = config['log_dir'] + "/test_input.txt"
+    #test_output_file = config['log_dir'] + "/test_output.txt"
+    #print(f"Dumping train I/O to {train_input_file} and {train_output_file}")
+    #dump_io(model, train_loader, train_input_file, train_output_file)
+    #print(f"Dumping test I/O to {test_input_file} and {test_output_file}")
+    #dump_io(model, test_loader, test_input_file, test_output_file)
+
+    # Instantiate LUT-based model
+    lut_model = MnistLutModel(model_cfg)
+    lut_model.load_state_dict(checkpoint['model_dict'])
+
+    # Generate the truth tables in the LUT module
+    print("Converting NEQs to LUTs...")
+    generate_truth_tables(lut_model, verbose=True)
+
+    # Test the LUT-based model
+    print("Running inference on LUT-based model...")
+    lut_inference(lut_model)
+    lut_model.eval()
+    lut_accuracy = test(lut_model, test_loader, cuda=False)
+    print("LUT-Based Model accuracy: %f" % (lut_accuracy))
+    # Note: AVG ROC-AUC is only reported by the jet-substructure example; the MNIST test() returns accuracy alone.
+    modelSave = {   'model_dict': lut_model.state_dict(),
+                    'test_accuracy': lut_accuracy}
+
+    torch.save(modelSave, options_cfg["log_dir"] + "/lut_based_model.pth")
+    if options_cfg["histograms"] is not None:
+        luts = torch.load(options_cfg["histograms"])
+        load_histograms(lut_model, luts)
+
+    print("Generating verilog in %s..." % (options_cfg["log_dir"]))
+    module_list_to_verilog_module(lut_model.module_list, "logicnet", options_cfg["log_dir"], generate_bench=True, add_registers=False)
+    print("Top level entity stored at: %s/logicnet.v ..." % (options_cfg["log_dir"]))
+
+    print("Running synthesis and generating technology-mapped verilog in ABC")
+    train_accuracy, test_accuracy, nodes, average_care_set_size = synthesize_and_get_resource_counts_with_abc(options_cfg["log_dir"], lut_model.module_list, pipeline_stages=args.num_registers, freq_thresh=args.freq_thresh, train_input_txt="train_input.txt", train_output_txt="train_output.txt", test_input_txt="test_input.txt", test_output_txt="test_output.txt", bdd_opt_cmd="&ttopt", verbose=False)
+    print(f"Training set accuracy(%): {train_accuracy}")
+    print(f"Test set accuracy(%): {test_accuracy}")
+    print(f"LUT6(#): {nodes}")
+    print(f"Average care set sizes(%): {average_care_set_size}")
+

From 9f40656f4e9be736468bd912fc73c7a22da8f96d Mon Sep 17 00:00:00 2001
From: Nick Fraser
Date: Mon, 6 Mar 2023 13:34:09 +0000
Subject: [PATCH 58/64] [ex/mnist] Initial version supporting BLIF conversion
 and testing

---
 examples/mnist/blif2verilog.py     | 147 +++++++++++++++++++++++++++++
 examples/mnist/simulate_verilog.py | 118 +++++++++++++++++++++++
 examples/mnist/verilog2bitfile.py  |  28 ++++++
 3 files changed, 293 insertions(+)
 create mode 100644 examples/mnist/blif2verilog.py
 create mode 100644 examples/mnist/simulate_verilog.py
 create mode 100644 examples/mnist/verilog2bitfile.py

diff --git a/examples/mnist/blif2verilog.py b/examples/mnist/blif2verilog.py
new file mode 100644
index 000000000..3acabdaa4
--- /dev/null
+++ b/examples/mnist/blif2verilog.py
@@ -0,0 +1,147 @@
+# Copyright (C) 2022 Xilinx, Inc
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +# A script to convert technology-mapped BLIF files to technology mapped verilog. + +import os +import glob +import shutil +from argparse import ArgumentParser +from functools import partial + +import torch +from torch.utils.data import DataLoader +from torchvision.datasets import MNIST +from torchvision import transforms + +from logicnets.abc import tech_map_to_verilog,\ + putontop_blif,\ + pipeline_tech_mapped_circuit +from logicnets.verilog import fix_abc_module_name,\ + generate_abc_verilog_wrapper + +from models import MnistNeqModel +from train import configs, model_config, test + +other_options = { + "output_directory": None, + "input_blifs": None, + "num_registers": None, + "generated_module_name_prefix": None, +} + +if __name__ == "__main__": + parser = ArgumentParser(description="Convert a technology-mapped BLIF files into a technology-mapped verilog file, using ABC") + parser.add_argument('--arch', type=str, choices=configs.keys(), default="mnist-s", + help="Specific the neural network model to use (default: %(default)s)") + parser.add_argument('--input-bitwidth', type=int, default=None, + help="Bitwidth to use at the input (default: %(default)s)") + parser.add_argument('--hidden-bitwidth', type=int, default=None, + help="Bitwidth to use for activations in hidden layers (default: %(default)s)") + parser.add_argument('--output-bitwidth', type=int, default=None, + help="Bitwidth to use at the output (default: %(default)s)") + parser.add_argument('--input-fanin', type=int, default=None, + help="Fanin to use at the input (default: %(default)s)") + parser.add_argument('--hidden-fanin', type=int, default=None, + help="Fanin to use for the hidden layers (default: %(default)s)") + parser.add_argument('--output-fanin', type=int, default=None, + help="Fanin to use at the output (default: %(default)s)") + parser.add_argument('--hidden-layers', nargs='+', type=int, default=None, + help="A list of hidden layer neuron sizes (default: %(default)s)") + parser.add_argument('--input-dropout', type=float, default=None, + help="The amount of dropout to apply at the model input (default: %(default)s)") + parser.add_argument('--dataset-split', type=str, default='test', choices=['train', 'test'], + help="Dataset to use for evaluation (default: %(default)s)") + parser.add_argument('--input-blifs', nargs='+', type=str, required=True, + help="The input BLIF files") + parser.add_argument('--output-directory', type=str, default='./log', + help="The directory which the generated verilog gets stored. 
(default: %(default)s)") + parser.add_argument('--num-registers', type=int, default=0, + help="The number of registers to add to the generated verilog (default: %(default)s)") + parser.add_argument('--generated-module-name-prefix', type=str, default='\\aig', + help="A prefix which matches the module name in the generated verilog, but no other line of code (default: %(default)s)") + args = parser.parse_args() + defaults = configs[args.arch] + options = vars(args) + del options['arch'] + config = {} + for k in options.keys(): + config[k] = options[k] if options[k] is not None else defaults[k] # Override defaults, if specified. + + if not os.path.exists(args.output_directory): + os.makedirs(args.output_directory) + + # Split up configuration options to be more understandable + model_cfg = {} + for k in model_config.keys(): + model_cfg[k] = config[k] + dataset_cfg = {} + for k in dataset_config.keys(): + dataset_cfg[k] = config[k] + options_cfg = {} + for k in other_options.keys(): + options_cfg[k] = config[k] + + trans = transform=transforms.Compose([ + transforms.ToTensor(), + transforms.Normalize((0.1307,), (0.3081,)), + transforms.Lambda(partial(torch.reshape, shape=(-1,))) + ]) + + # Fetch the test set + dataset = {} + dataset[args.dataset_split] = MNIST('./data', train=args.dataset_split == "train", download=True, transform=trans) + test_loader = DataLoader(dataset[args.dataset_split], batch_size=1, shuffle=False) + + # Instantiate the PyTorch model + x, y = dataset[args.dataset_split][0] + model_cfg['input_length'] = len(x) + model_cfg['output_length'] = 10 + model = MnistNeqModel(model_cfg) + + abc_project_root = options_cfg['output_directory'] + veropt_dir = options_cfg['output_directory'] + input_blif = "layers_full_opt.blif" + verbose = False + + if len(options_cfg['input_blifs']) > 1: + nodes, out, err = putontop_blif([os.path.realpath(blif) for blif in options_cfg['input_blifs']], input_blif, working_dir=abc_project_root, verbose=verbose) + else: + shutil.copy(os.path.realpath(options_cfg['input_blifs'][0]), f"{abc_project_root}/{input_blif}") + + if options_cfg['num_registers'] == 0: + nodes, out, err = tech_map_to_verilog(circuit_file=input_blif, output_verilog=f"layers_full_opt.v", working_dir=abc_project_root, verbose=verbose) + else: + nodes, out, err = pipeline_tech_mapped_circuit(circuit_file=input_blif, output_verilog=f"layers_full_opt.v", num_registers=options_cfg['num_registers'], working_dir=abc_project_root, verbose=verbose) + + # Fix the resultant verilog file so that it can be simulated + fix_abc_module_name(f"{veropt_dir}/layers_full_opt.v", f"{veropt_dir}/layers_full_opt.v", options_cfg["generated_module_name_prefix"], "layers_full_opt", add_timescale=True) + + # Generate top-level entity wrapper + module_list = model.module_list + _, input_bitwidth = module_list[0].input_quant.get_scale_factor_bits() + _, output_bitwidth = module_list[-1].output_quant.get_scale_factor_bits() + input_bitwidth, output_bitwidth = int(input_bitwidth), int(output_bitwidth) + total_input_bits = module_list[0].in_features*input_bitwidth + total_output_bits = module_list[-1].out_features*output_bitwidth + module_name="logicnet" + veropt_wrapper_str = generate_abc_verilog_wrapper(module_name=module_name, input_name="M0", input_bits=total_input_bits, output_name=f"M{len(module_list)}", output_bits=total_output_bits, submodule_name="layers_full_opt", num_registers=options_cfg['num_registers']) + with open(f"{veropt_dir}/{module_name}.v", "w") as f: + f.write(veropt_wrapper_str) + + 
print(f"Adding Nitro-Parts-Lib to {veropt_dir}") + source_files = glob.glob(f"{os.environ['NITROPARTSLIB']}/*.v") + for f in source_files: + shutil.copy(f, f"{veropt_dir}") + diff --git a/examples/mnist/simulate_verilog.py b/examples/mnist/simulate_verilog.py new file mode 100644 index 000000000..0478e6d86 --- /dev/null +++ b/examples/mnist/simulate_verilog.py @@ -0,0 +1,118 @@ +# Copyright (C) 2021 Xilinx, Inc +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +import os +from argparse import ArgumentParser +from functools import partial + +import torch +from torch.utils.data import DataLoader +from torchvision.datasets import MNIST +from torchvision import transforms + +from models import MnistNeqModel +from train import configs, model_config, test + +other_options = { + "checkpoint": None, + "input_verilog": None, + "num_registers": None, +} + +if __name__ == "__main__": + parser = ArgumentParser(description="Synthesize convert a PyTorch trained model into verilog") + parser.add_argument('--arch', type=str, choices=configs.keys(), default="mnist-s", + help="Specific the neural network model to use (default: %(default)s)") + parser.add_argument('--batch-size', type=int, default=None, metavar='N', + help="Batch size for evaluation (default: %(default)s)") + parser.add_argument('--input-bitwidth', type=int, default=None, + help="Bitwidth to use at the input (default: %(default)s)") + parser.add_argument('--hidden-bitwidth', type=int, default=None, + help="Bitwidth to use for activations in hidden layers (default: %(default)s)") + parser.add_argument('--output-bitwidth', type=int, default=None, + help="Bitwidth to use at the output (default: %(default)s)") + parser.add_argument('--input-fanin', type=int, default=None, + help="Fanin to use at the input (default: %(default)s)") + parser.add_argument('--hidden-fanin', type=int, default=None, + help="Fanin to use for the hidden layers (default: %(default)s)") + parser.add_argument('--output-fanin', type=int, default=None, + help="Fanin to use at the output (default: %(default)s)") + parser.add_argument('--hidden-layers', nargs='+', type=int, default=None, + help="A list of hidden layer neuron sizes (default: %(default)s)") + parser.add_argument('--input-dropout', type=float, default=None, + help="The amount of dropout to apply at the model input (default: %(default)s)") + parser.add_argument('--dataset-split', type=str, default='test', choices=['train', 'test'], + help="Dataset to use for evaluation (default: %(default)s)") + parser.add_argument('--checkpoint', type=str, required=True, + help="The checkpoint file which contains the model weights") + parser.add_argument('--input-verilog', type=str, required=True, + help="The input verilog file to simulate") + parser.add_argument('--num-registers', type=int, default=0, + help="The number of pipeline registers in the verilog (default: %(default)s)") + args = parser.parse_args() + defaults = configs[args.arch] + options = vars(args) + del options['arch'] + config = {} + for k in options.keys(): + 
config[k] = options[k] if options[k] is not None else defaults[k] # Override defaults, if specified. + + # Split up configuration options to be more understandable + model_cfg = {} + for k in model_config.keys(): + model_cfg[k] = config[k] + dataset_cfg = {} + for k in dataset_config.keys(): + dataset_cfg[k] = config[k] + options_cfg = {} + for k in other_options.keys(): + if k == 'cuda': + continue + options_cfg[k] = config[k] + + trans = transform=transforms.Compose([ + transforms.ToTensor(), + transforms.Normalize((0.1307,), (0.3081,)), + transforms.Lambda(partial(torch.reshape, shape=(-1,))) + ]) + + # Fetch the test set + dataset = {} + dataset[args.dataset_split] = MNIST('./data', train=args.dataset_split == "train", download=True, transform=trans) + test_loader = DataLoader(dataset[args.dataset_split], batch_size=config['batch_size'], shuffle=False) + + # Instantiate the PyTorch model + x, y = dataset[args.dataset_split][0] + model_cfg['input_length'] = len(x) + model_cfg['output_length'] = 10 + model = MnistNeqModel(model_cfg) + + # Load the model weights + checkpoint = torch.load(options_cfg['checkpoint'], map_location='cpu') + model.load_state_dict(checkpoint['model_dict']) + + # Test the PyTorch model + print("Running inference on baseline model...") + model.eval() + baseline_accuracy = test(model, test_loader, cuda=False) + print("Baseline accuracy: %f" % (baseline_accuracy)) + + verilog_dir = os.path.dirname(options_cfg["input_verilog"]) + filename = os.path.split(options_cfg["input_verilog"])[-1] + print(f"Running inference simulation of Verilog-based model ({filename})") + model.verilog_inference(verilog_dir, filename, logfile=None, add_registers=options_cfg["num_registers"] != 0, verify=False) + model.latency = options_cfg["num_registers"] + verilog_accuracy = test(model, test_loader, cuda=False) + print("Verilog-Based Model accuracy: %f" % (verilog_accuracy)) + diff --git a/examples/mnist/verilog2bitfile.py b/examples/mnist/verilog2bitfile.py new file mode 100644 index 000000000..3dfb7b226 --- /dev/null +++ b/examples/mnist/verilog2bitfile.py @@ -0,0 +1,28 @@ +# Copyright (C) 2021 Xilinx, Inc +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
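# verilog2bitfile.py closes the MNIST ABC flow added by this patch series:
# neq2lut_abc.py optimizes the network and reports accuracy, blif2verilog.py
# stitches the technology-mapped BLIFs back into verilog, simulate_verilog.py
# replays the dataset through Verilator, and this script hands the result to
# out-of-context Vivado synthesis. A sketch of driving the chain end to end
# (the flags are the ones these scripts define; the checkpoint and BLIF paths
# are placeholders):
#
#     import subprocess
#
#     log_dir = "./log/mnist-s"  # placeholder
#     for cmd in [
#         ["python", "neq2lut_abc.py", "--arch", "mnist-s",
#          "--checkpoint", f"{log_dir}/model.pth", "--log-dir", log_dir],
#         ["python", "blif2verilog.py", "--arch", "mnist-s",
#          "--input-blifs", f"{log_dir}/opt.blif",  # placeholder BLIF
#          "--output-directory", log_dir],
#         ["python", "simulate_verilog.py", "--arch", "mnist-s",
#          "--checkpoint", f"{log_dir}/model.pth",
#          "--input-verilog", f"{log_dir}/logicnet.v"],
#         ["python", "verilog2bitfile.py", "--log-dir", log_dir,
#          "--clock-period", "1.0"],
#     ]:
#         subprocess.run(cmd, check=True)  # stop at the first failing stage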
+ +from argparse import ArgumentParser + +from logicnets.synthesis import synthesize_and_get_resource_counts + +if __name__ == "__main__": + parser = ArgumentParser(description="Synthesize convert a PyTorch trained model into verilog") + parser.add_argument('--log-dir', type=str, default='./log', required=True, + help="A location to store the log output of the training run and the output model (default: %(default)s)") + parser.add_argument('--clock-period', type=float, default=1.0, + help="Target clock frequency to use during Vivado synthesis (default: %(default)s)") + args = parser.parse_args() + print("Running out-of-context synthesis") + ret = synthesize_and_get_resource_counts(args.log_dir, "logicnet", fpga_part="xcu280-fsvh2892-2L-e", clk_period_ns=args.clock_period, post_synthesis = 1) + From e1b3d16823c1b5f7920ecdc108fdd4e6116bc8a1 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Mon, 6 Mar 2023 13:53:53 +0000 Subject: [PATCH 59/64] [ex/mnist] Bugfix in dataset loader --- examples/mnist/blif2verilog.py | 3 --- examples/mnist/neq2lut_abc.py | 3 --- 2 files changed, 6 deletions(-) diff --git a/examples/mnist/blif2verilog.py b/examples/mnist/blif2verilog.py index 3acabdaa4..1c5feda7d 100644 --- a/examples/mnist/blif2verilog.py +++ b/examples/mnist/blif2verilog.py @@ -86,9 +86,6 @@ model_cfg = {} for k in model_config.keys(): model_cfg[k] = config[k] - dataset_cfg = {} - for k in dataset_config.keys(): - dataset_cfg[k] = config[k] options_cfg = {} for k in other_options.keys(): options_cfg[k] = config[k] diff --git a/examples/mnist/neq2lut_abc.py b/examples/mnist/neq2lut_abc.py index 69fe9623e..9ab762f8c 100644 --- a/examples/mnist/neq2lut_abc.py +++ b/examples/mnist/neq2lut_abc.py @@ -90,9 +90,6 @@ model_cfg = {} for k in model_config.keys(): model_cfg[k] = config[k] - dataset_cfg = {} - for k in dataset_config.keys(): - dataset_cfg[k] = config[k] options_cfg = {} for k in other_options.keys(): if k == 'cuda': From c3b33a9d8e650349f87cc490cca142faf00259fa Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Mon, 6 Mar 2023 13:57:18 +0000 Subject: [PATCH 60/64] [ex/mnist] Bugfix in dataset configuration --- examples/mnist/simulate_verilog.py | 3 --- 1 file changed, 3 deletions(-) diff --git a/examples/mnist/simulate_verilog.py b/examples/mnist/simulate_verilog.py index 0478e6d86..bfcbb8056 100644 --- a/examples/mnist/simulate_verilog.py +++ b/examples/mnist/simulate_verilog.py @@ -72,9 +72,6 @@ model_cfg = {} for k in model_config.keys(): model_cfg[k] = config[k] - dataset_cfg = {} - for k in dataset_config.keys(): - dataset_cfg[k] = config[k] options_cfg = {} for k in other_options.keys(): if k == 'cuda': From 3bf4be70b5afa72588a7c436fabe1d4bfae4f47a Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Thu, 12 Sep 2024 18:14:18 +0100 Subject: [PATCH 61/64] [abc] Added patch for ABC when input bits>1000 --- examples/mnist/abc.patch | 49 ++++++++++++++++++++++++++++++++++++++++ 1 file changed, 49 insertions(+) create mode 100644 examples/mnist/abc.patch diff --git a/examples/mnist/abc.patch b/examples/mnist/abc.patch new file mode 100644 index 000000000..8de1ebdbc --- /dev/null +++ b/examples/mnist/abc.patch @@ -0,0 +1,49 @@ +diff --git a/src/aig/gia/giaMinLut.c b/src/aig/gia/giaMinLut.c +index 5304486d..e08ebec5 100644 +--- a/src/aig/gia/giaMinLut.c ++++ b/src/aig/gia/giaMinLut.c +@@ -193,7 +193,7 @@ Gia_Man_t * Vec_WrdReadTest( char * pFileName ) + void Vec_WrdReadText( char * pFileName, Vec_Wrd_t ** pvSimI, Vec_Wrd_t ** pvSimO, int nIns, int nOuts ) + { + int i, nSize, iLine, nLines, nWords; 
+-    char pLine[1000];
++    char pLine[2000];
+     Vec_Wrd_t * vSimI, * vSimO;
+     FILE * pFile = fopen( pFileName, "rb" );
+     if ( pFile == NULL )
+@@ -214,7 +214,7 @@ void Vec_WrdReadText( char * pFileName, Vec_Wrd_t ** pvSimI, Vec_Wrd_t ** pvSimO
+     nWords = (nLines + 63)/64;
+     vSimI = Vec_WrdStart( nIns *nWords );
+     vSimO = Vec_WrdStart( nOuts*nWords );
+-    for ( iLine = 0; fgets( pLine, 1000, pFile ); iLine++ )
++    for ( iLine = 0; fgets( pLine, 2000, pFile ); iLine++ )
+     {
+         for ( i = 0; i < nIns; i++ )
+             if ( pLine[nIns-1-i] == '1' )
+@@ -233,7 +233,7 @@ void Vec_WrdReadText( char * pFileName, Vec_Wrd_t ** pvSimI, Vec_Wrd_t ** pvSimO
+ int Vec_WrdReadText2( char * pFileName, Vec_Wrd_t ** pvSimI )
+ {
+     int i, nSize, iLine, nLines, nWords, nIns;
+-    char pLine[1000];
++    char pLine[2000];
+     Vec_Wrd_t * vSimI;
+     FILE * pFile = fopen( pFileName, "rb" );
+     if ( pFile == NULL )
+@@ -241,7 +241,7 @@ int Vec_WrdReadText2( char * pFileName, Vec_Wrd_t ** pvSimI )
+         printf( "Cannot open file \"%s\" for reading.\n", pFileName );
+         return 0;
+     }
+-    if ( !fgets(pLine, 1000, pFile) || (nIns = strlen(pLine)-1) < 1 )
++    if ( !fgets(pLine, 2000, pFile) || (nIns = strlen(pLine)-1) < 1 )
+     {
+         printf( "Cannot find the number of inputs in file \"%s\".\n", pFileName );
+         fclose( pFile );
+@@ -259,7 +259,7 @@ int Vec_WrdReadText2( char * pFileName, Vec_Wrd_t ** pvSimI )
+     nLines = nSize / (nIns + 1);
+     nWords = (nLines + 63)/64;
+     vSimI = Vec_WrdStart( nIns *nWords );
+-    for ( iLine = 0; fgets( pLine, 1000, pFile ); iLine++ )
++    for ( iLine = 0; fgets( pLine, 2000, pFile ); iLine++ )
+     {
+         for ( i = 0; i < nIns; i++ )
+             if ( pLine[nIns-1-i] == '1' )

From 3713b6dbdd8100dbd9fa888075e00be2bb1d144d Mon Sep 17 00:00:00 2001
From: Nick Fraser
Date: Mon, 18 Nov 2024 14:21:05 +0000
Subject: [PATCH 62/64] [example/jsc] Bugfix: run dump_luts.py inference on the
 training set

---
 examples/jet_substructure/dump_luts.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/examples/jet_substructure/dump_luts.py b/examples/jet_substructure/dump_luts.py
index f99d21651..c5acfb8b2 100644
--- a/examples/jet_substructure/dump_luts.py
+++ b/examples/jet_substructure/dump_luts.py
@@ -99,7 +99,7 @@
     # Test the PyTorch model
     print("Running inference of baseline model on training set (%d examples)..." % (dataset_length))
     model.eval()
-    baseline_accuracy, baseline_avg_roc_auc = test(model, test_loader, cuda=False)
+    baseline_accuracy, baseline_avg_roc_auc = test(model, train_loader, cuda=False)
     print("Baseline accuracy: %f" % (baseline_accuracy))
     print("Baseline AVG ROC AUC: %f" % (baseline_avg_roc_auc))

@@ -115,7 +115,7 @@
     print("Running inference of LUT-based model on training set (%d examples)..." % (dataset_length))
     lut_inference(lut_model, track_used_luts=True)
     lut_model.eval()
-    lut_accuracy, lut_avg_roc_auc = test(lut_model, test_loader, cuda=False)
+    lut_accuracy, lut_avg_roc_auc = test(lut_model, train_loader, cuda=False)
     print("LUT-Based Model accuracy: %f" % (lut_accuracy))
     print("LUT-Based AVG ROC AUC: %f" % (lut_avg_roc_auc))
     print("Saving LUTs to %s..." % (options_cfg["log_dir"] + "/luts.pth"))
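
The two-line fix above matters because the LUT-usage histograms written to luts.pth are only meaningful for the dataset that is actually pushed through the LUT model; the script already announced the training set, so the loader now matches. As a quick consumer of the dumped file, here is a minimal sketch of how the statistics might be inspected afterwards. The dict layout and the 'histogram' key are assumptions about the saved format, not something this patch defines:

import torch

# Sketch only: assumes luts.pth maps layer names to entries holding a
# per-neuron 'histogram' list of int64 lookup-count tensors.
lut_dict = torch.load("log/luts.pth")
for layer_name, entry in lut_dict.items():
    histograms = entry["histogram"]
    lookups = sum(int(h.sum()) for h in histograms)
    entries = sum(h.numel() for h in histograms)
    unused = sum(int((h == 0).sum()) for h in histograms)
    print("%s: %d lookups, %d/%d LUT entries never hit" % (layer_name, lookups, unused, entries))

A high never-hit count flags truth-table entries that were never exercised on the training set, which downstream logic optimization could plausibly treat as don't-cares.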
" % (options_cfg["log_dir"] + "/luts.pth")) From 0165476cc4b8d29fed7aaeb436322b4a0184106c Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Mon, 18 Nov 2024 14:23:14 +0000 Subject: [PATCH 63/64] [example/jsc] Only insert timescale if registers --- examples/jet_substructure/blif2verilog.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/examples/jet_substructure/blif2verilog.py b/examples/jet_substructure/blif2verilog.py index dc55f1afa..929de9610 100644 --- a/examples/jet_substructure/blif2verilog.py +++ b/examples/jet_substructure/blif2verilog.py @@ -120,7 +120,7 @@ nodes, out, err = pipeline_tech_mapped_circuit(circuit_file=input_blif, output_verilog=f"layers_full_opt.v", num_registers=options_cfg['num_registers'], working_dir=abc_project_root, verbose=verbose) # Fix the resultant verilog file so that it can be simulated - fix_abc_module_name(f"{veropt_dir}/layers_full_opt.v", f"{veropt_dir}/layers_full_opt.v", options_cfg["generated_module_name_prefix"], "layers_full_opt", add_timescale=True) + fix_abc_module_name(f"{veropt_dir}/layers_full_opt.v", f"{veropt_dir}/layers_full_opt.v", options_cfg["generated_module_name_prefix"], "layers_full_opt", add_timescale=options_cfg['num_registers'] != 0) # Generate top-level entity wrapper module_list = model.module_list From fec8657b502316d466c31f1afb97e9300a210679 Mon Sep 17 00:00:00 2001 From: Nick Fraser Date: Mon, 18 Nov 2024 14:18:54 +0000 Subject: [PATCH 64/64] [docker] Bugfixes to ABC build --- docker/Dockerfile.cpu | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/docker/Dockerfile.cpu b/docker/Dockerfile.cpu index b42e49317..0467a8fa4 100644 --- a/docker/Dockerfile.cpu +++ b/docker/Dockerfile.cpu @@ -29,7 +29,7 @@ RUN apt-get -qq update && apt-get -qq -y install curl bzip2 \ && rm -rf /var/lib/apt/lists/* /var/log/dpkg.log # Install LogicNets system prerequisites -RUN apt-get -qq update && apt-get -qq -y install verilator build-essential libx11-6 git \ +RUN apt-get -qq update && apt-get -qq -y install verilator build-essential libx11-6 git libreadline-dev \ && apt-get autoclean \ && rm -rf /var/lib/apt/lists/* /var/log/dpkg.log @@ -42,11 +42,14 @@ RUN git clone https://github.com/dirjud/Nitro-Parts-lib-Xilinx.git ENV NITROPARTSLIB=/workspace/Nitro-Parts-lib-Xilinx # Adding LogicNets dependency on ABC +COPY examples/mnist/abc.patch /workspace/ RUN git clone https://github.com/berkeley-abc/abc.git \ && cd abc \ && git checkout 813a0f1ff1ae7512cb7947f54cd3f2ab252848c8 \ + && git apply /workspace/abc.patch \ + && rm -f /workspace/abc.patch \ && make -j`nproc` -ENV ABC_ROOT=/workspace/ABC +ENV ABC_ROOT=/workspace/abc # Create the user account to run LogicNets RUN groupadd -g $GID $GNAME