sandialabs
diff --git a/‎applications/dnn/calibration.py‎
Lines changed: 4 additions & 1 deletion b/‎applications/dnn/calibration.py‎
Lines changed: 4 additions & 1 deletion
diff --git a/‎applications/dnn/dnn_inference_params.py‎
Lines changed: 18 additions & 39 deletions b/‎applications/dnn/dnn_inference_params.py‎
Lines changed: 18 additions & 39 deletions
diff --git a/‎applications/dnn/inference/interface/inference_net.py‎
Lines changed: 0 additions & 3 deletions b/‎applications/dnn/inference/interface/inference_net.py‎
Lines changed: 0 additions & 3 deletions
diff --git a/‎applications/dnn/inference/readme.md‎
Lines changed: 1 addition & 1 deletion b/‎applications/dnn/inference/readme.md‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎applications/dnn/keras/cifar10_resnet/calibrate_adcs.py‎
Lines changed: 3 additions & 3 deletions b/‎applications/dnn/keras/cifar10_resnet/calibrate_adcs.py‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎applications/dnn/keras/cifar10_resnet/calibrate_inputs.py‎
Lines changed: 6 additions & 3 deletions b/‎applications/dnn/keras/cifar10_resnet/calibrate_inputs.py‎
Lines changed: 6 additions & 3 deletions
diff --git a/‎applications/dnn/keras/cifar10_resnet/inference_cifar10_resnet.py‎
Lines changed: 1 addition & 8 deletions b/‎applications/dnn/keras/cifar10_resnet/inference_cifar10_resnet.py‎
Lines changed: 1 addition & 8 deletions
@@ -16,7 +16,7 @@
 import numpy.typing as npt
 import numpy as np
 from scipy.optimize import minimize
-from simulator.parameters.core_parameters import CoreStyle
+from simulator.parameters.core_parameters import CoreStyle, BitSlicedCoreStyle
 from simulator.backend import ComputeBackend
 xp = ComputeBackend()
 
@@ -30,6 +30,9 @@ def calibrate_input_limits(
     input values. This function is intended for use with ResNet CNNs where
     all but the first layer is preceded by a ReLU, so inputs are strictly positive.
 
+    Note that this method may not work well for the first layer, which has a different
+    value distribution from the other layers!
+
     Args:
         all_xbar_inputs: list of arrays, each array contains profiled input
             values for a layer
 
@@ -35,6 +35,8 @@ def dnn_inference_params(**kwargs):
 
     Rp_row = kwargs.get("Rp_row",0)
     Rp_col = kwargs.get("Rp_col",0)
+    Rp_row_terminal = kwargs.get("Rp_row_terminal",0)
+    Rp_col_terminal = kwargs.get("Rp_col_terminal",0)
     NrowsMax = kwargs.get("NrowsMax",None)
     NcolsMax = kwargs.get("NcolsMax",None)
     weight_bits = kwargs.get("weight_bits",0)
@@ -47,13 +49,14 @@ def dnn_inference_params(**kwargs):
     adc_type = kwargs.get("adc_type","generic")
     positiveInputsOnly = kwargs.get("positiveInputsOnly",False)
     interleaved_posneg = kwargs.get("interleaved_posneg",False)
+    current_from_input = kwargs.get("current_from_input",True)
+    selected_rows = kwargs.get("selected_rows","top")
     subtract_current_in_xbar = kwargs.get("subtract_current_in_xbar",True)
     Rmin = kwargs.get("Rmin", 1000)
     Rmax = kwargs.get("Rmax", 10000)
     Vread = kwargs.get("Vread",0.1)
     infinite_on_off_ratio = kwargs.get("infinite_on_off_ratio", True)
-    gate_input = kwargs.get("gate_input",True)
-
+    
     Nslices = kwargs.get("Nslices",1)    
     digital_offset = kwargs.get("digital_offset",True)
     adc_range_option = kwargs.get("adc_range_option","CALIBRATED")
@@ -64,19 +67,16 @@ def dnn_inference_params(**kwargs):
     y_par = kwargs.get("y_par",1)
     useGPU = kwargs.get("useGPU",False)
     gpu_id = kwargs.get("gpu_id",0)
-    disable_fast_balanced = kwargs.get("disable_fast_balanced",False)
 
     profile_xbar_inputs = kwargs.get("profile_xbar_inputs",False)
     profile_adc_inputs = kwargs.get("profile_adc_inputs",False)
-    profile_adc_reluAware = kwargs.get("profile_adc_reluAware",False)
     ntest = kwargs.get("ntest",1)
 
     balanced_style = kwargs.get("balanced_style","ONE_SIDED")
     input_bitslicing = kwargs.get("input_bitslicing",False)
     input_slice_size = kwargs.get("input_slice_size",1)
     adc_per_ibit = kwargs.get("adc_per_ibit",False)
-    disable_parasitics_slices = kwargs.get("disable_parasitics_slices",None)
-
+    
     ################  create parameter objects with all core settings
     params = CrossSimParameters()
 
@@ -85,27 +85,9 @@ def dnn_inference_params(**kwargs):
     if useGPU:
         params.simulation.gpu_id = gpu_id
 
-    # Enable conv matmul?
-    # These cases cannot be realistically modeled with matmul
-    noCM_cond1 = (Rp_col > 0)
-    noCM_cond2 = (Rp_row > 0 and not gate_input)
-    noCM_cond3 = (noise_model == "generic" and alpha_noise > 0)
-    noCM_cond4 = (noise_model != "none" and noise_model != "generic")
-    if not ideal and any([noCM_cond1, noCM_cond2, noCM_cond3, noCM_cond4]):
-        params.simulation.disable_fast_matmul = True
-    else:
-        params.simulation.disable_fast_matmul = False
-        x_par, y_par = 1, 1
-
-    if profile_adc_inputs:
-        x_par, y_par = 1, 1
-
-    # Multiple convolutional MVMs in parallel? (only used if disable_fast_matmul = True)
-    params.simulation.convolution.x_par = int(x_par) # Number of sliding window steps to do in parallel (x)
-    params.simulation.convolution.y_par = int(y_par) # Number of sliding window steps to do in parallel (y)
-    
-    if core_style == "BALANCED":
-        params.simulation.disable_fast_balanced = disable_fast_balanced
+    # Parameters for sliding-window (SW) packing mode (only used if simulation.disable_fast_matmul = True)
+    params.simulation.convolution.x_par = int(x_par)
+    params.simulation.convolution.y_par = int(y_par)
 
     if ideal:
         return params
@@ -170,20 +152,21 @@ def dnn_inference_params(**kwargs):
 
     ############### Parasitic resistance
 
-    if Rp_col > 0 or Rp_row > 0:
+    if Rp_col > 0 or Rp_row > 0 or Rp_col_terminal > 0 and Rp_row_terminal > 0:
         # Bit line parasitic resistance
         params.xbar.array.parasitics.enable = True
-        params.xbar.array.parasitics.Rp_col = Rp_col/Rmin
-        params.xbar.array.parasitics.Rp_row = Rp_row/Rmin
-        params.xbar.array.parasitics.gate_input = gate_input
-
-        if gate_input and Rp_col == 0:
-            params.xbar.array.parasitics.enable = False
+        params.xbar.array.parasitics.Rp_col = Rp_col
+        params.xbar.array.parasitics.Rp_row = Rp_row
+        params.xbar.array.parasitics.Rp_col_terminal = Rp_col_terminal
+        params.xbar.array.parasitics.Rp_row_terminal = Rp_row_terminal
+        params.xbar.array.parasitics.current_from_input = current_from_input
+        params.xbar.array.parasitics.selected_rows = selected_rows
 
         # Numeric params related to parasitic resistance simulation
         params.simulation.Niters_max_parasitics = 100
         params.simulation.Verr_th_mvm = 2e-4
         params.simulation.relaxation_gamma = 0.9 # under-relaxation
+        params.simulation.Verr_matmul_criterion = "max_mean" # max over array, mean over MVMs
 
     ############### Weight bit slicing
 
@@ -202,10 +185,6 @@ def dnn_inference_params(**kwargs):
         else:
             cell_bits = int(np.ceil(weight_bits/Nslices))
         params.core.bit_sliced.num_slices = Nslices
-        if disable_parasitics_slices is not None:
-            params.xbar.array.parasitics.disable_slices = disable_parasitics_slices
-        else:
-            params.xbar.array.parasitics.disable_slices = [False]*Nslices
 
     # Weights
     params.core.weight_bits = int(weight_bits)
@@ -220,7 +199,7 @@ def dnn_inference_params(**kwargs):
     ###################### Analytics
 
     params.simulation.analytics.profile_xbar_inputs = profile_xbar_inputs
-    params.simulation.analytics.profile_adc_inputs = (profile_adc_inputs and not profile_adc_reluAware)
+    params.simulation.analytics.profile_adc_inputs = profile_adc_inputs
     params.simulation.analytics.ntest = ntest
 
     ###################### DAC settings
 
@@ -105,9 +105,6 @@ def set_params(**kwargs):
     params.simulation.convolution.x_par = int(x_par) # Number of sliding window steps to do in parallel (x)
     params.simulation.convolution.y_par = int(y_par) # Number of sliding window steps to do in parallel (y)
 
-    if export_conductances:
-        params.simulation.disable_fast_balanced = True
-
     if export_conductances:
         params.simulation.disable_fast_balanced = True
 
 
@@ -49,4 +49,4 @@ More details on this process can be found in Section 9.4 of the manual.
 
 The optimized ADC limits are only valid for a specific combination of neural network and hardware settings. The ``adc_limits`` directory contains calibrated ADC limits for a number of neural networks that are part of the ``cross-sim-models`` submodule, but does not account for every possible simulation configuration with these models. The most extensive set of ADC limits we have generated are for the ResNet50-v1.5 network (part of the MLPerf Inference benchmark). These can be found inside the ``adc_limits/imagenet`` and ``adc_limits/imagenet_bitslicing`` folders. See ``interface/dnn_setup.py`` to see the simulation settings that are matched to these different calibrated ADC limits.
 
-[1] T. P. Xiao, B. Feinberg, C. H. Bennett, V. Prabhakar, P. Saxena, V. Agrawal, S. Agarwal, and M. J. Marinella, "On the accuracy of analog neural network inference accelerators," _IEEE Circuits and Systems Magazine_, 22(4), pp. 26-48, 2022.
+[1] T. P. Xiao, B. Feinberg, C. H. Bennett, V. Prabhakar, P. Saxena, V. Agrawal, S. Agarwal, and M. J. Marinella, "On the accuracy of analog neural network inference accelerators," _IEEE Circuits and Systems Magazine_, 22(4), pp. 26-48, 2022.
@@ -31,10 +31,10 @@
 # n = 3 : ResNet-20 (272K weights)
 # n = 5 : ResNet-32 (467K weights)
 # n = 9 : ResNet-56 (856K weights)
-n = 9
+n = 3
 
 useGPU = True # use GPU?
-N = 1000 # number of images
+N = 500 # number of images
 batch_size = 32
 Nruns = 1
 print_progress = True
@@ -84,7 +84,7 @@
     'Rp_col' : 0, # ohms
     'interleaved_posneg' : False,
     'subtract_current_in_xbar' : True,
-    'gate_input' : False,
+    'current_from_input' : True,
     ## Input quantization
     'input_bits' : 8,
     'input_bitslicing' : False,
 
@@ -31,10 +31,10 @@
 # n = 3 : ResNet-20 (272K weights)
 # n = 5 : ResNet-32 (467K weights)
 # n = 9 : ResNet-56 (856K weights)
-n = 9
+n = 3
 
 useGPU = True # use GPU?
-N = 1000 # number of images
+N = 500 # number of images
 batch_size = 32
 Nruns = 1
 print_progress = True
@@ -84,7 +84,7 @@
     'Rp_col' : 0, # ohms
     'interleaved_posneg' : False,
     'subtract_current_in_xbar' : True,
-    'gate_input' : False,
+    'current_from_input' : True,
     ## Input quantization
     'input_bits' : 0,
     'input_bitslicing' : False,
@@ -149,5 +149,8 @@
 print("Optimizing input limits")
 calibrated_ranges = calibrate_input_limits(profiled_inputs, Nbits=8)
 
+# Manually calibrate first layer's limits based on value range of CIFAR-10 images
+calibrated_ranges[0,:] = np.array([-2.64, 2.64])
+
 np.save("./calibrated_config/input_limits_ResNet{:d}.npy".format(depth),
     calibrated_ranges)
@@ -77,7 +77,7 @@
     'Rp_col' : 0, # ohms
     'interleaved_posneg' : False,
     'subtract_current_in_xbar' : True,
-    'gate_input' : False,
+    'current_from_input' : True,
     ## Input quantization
     'input_bits' : 8,
     'input_bitslicing' : False,
@@ -97,19 +97,12 @@
 ### Load ADC limits
 adc_ranges = find_adc_range(base_params_args, n_layers, depth)
 
-### Load (x_par, y_par) values
-xy_pars = np.load("./calibrated_config/resnet{:d}_xy.npy".format(depth))
-if base_params_args['Rp_row'] > 0 or base_params_args['Rp_col'] > 0:
-    xy_pars = np.load("./calibrated_config/resnet{:d}_xy_parasitics.npy".format(depth))
-
 ### Set the parameters
 for k in range(n_layers):
     params_args_k = base_params_args.copy()
     params_args_k['positiveInputsOnly'] = (False if k == 0 else True)
     params_args_k['input_range'] = input_ranges[k]
     params_args_k['adc_range'] = adc_ranges[k]
-    params_args_k['x_par'] = xy_pars[k,0]
-    params_args_k['y_par'] = xy_pars[k,1]
     params_list[k] = dnn_inference_params(**params_args_k)
 
 # Convert Keras layers to analog layers
Original file line number	Diff line number	Diff line change
`@@ -49,4 +49,4 @@ More details on this process can be found in Section 9.4 of the manual.`
`49`	`49`
`50`	`50`	The optimized ADC limits are only valid for a specific combination of neural network and hardware settings. The ``adc_limits`` directory contains calibrated ADC limits for a number of neural networks that are part of the ``cross-sim-models`` submodule, but does not account for every possible simulation configuration with these models. The most extensive set of ADC limits we have generated are for the ResNet50-v1.5 network (part of the MLPerf Inference benchmark). These can be found inside the ``adc_limits/imagenet`` and ``adc_limits/imagenet_bitslicing`` folders. See ``interface/dnn_setup.py`` to see the simulation settings that are matched to these different calibrated ADC limits.
`51`	`51`
`52`		`-[1] T. P. Xiao, B. Feinberg, C. H. Bennett, V. Prabhakar, P. Saxena, V. Agrawal, S. Agarwal, and M. J. Marinella, "On the accuracy of analog neural network inference accelerators," _IEEE Circuits and Systems Magazine_, 22(4), pp. 26-48, 2022.`
	`52`	`+[1] T. P. Xiao, B. Feinberg, C. H. Bennett, V. Prabhakar, P. Saxena, V. Agrawal, S. Agarwal, and M. J. Marinella, "On the accuracy of analog neural network inference accelerators," _IEEE Circuits and Systems Magazine_, 22(4), pp. 26-48, 2022.`