From 788fe406b5e6cbc76c1c32a750aa12c10f88d512 Mon Sep 17 00:00:00 2001
From: David Harris <david_harris@hmc.edu>
Date: Tue, 31 May 2022 14:58:11 +0000
Subject: [PATCH 01/14] Moved delegation logic from privmode to trap to
 simplify interface

---
 pipelined/src/privileged/privileged.sv |  9 +++++----
 pipelined/src/privileged/privmode.sv   | 13 +++----------
 pipelined/src/privileged/trap.sv       |  7 +++++--
 3 files changed, 13 insertions(+), 16 deletions(-)

diff --git a/pipelined/src/privileged/privileged.sv b/pipelined/src/privileged/privileged.sv
index 43e2f8f0..a65039bf 100644
--- a/pipelined/src/privileged/privileged.sv
+++ b/pipelined/src/privileged/privileged.sv
@@ -99,13 +99,14 @@ module privileged (
   logic       STATUS_MIE, STATUS_SIE;
   logic [11:0] MIP_REGW, MIE_REGW;
   logic [1:0] NextPrivilegeModeM;
+  logic       DelegateM;
 
   ///////////////////////////////////////////
   // track the current privilege level
   ///////////////////////////////////////////
 
-  privmode privmode(.clk, .reset, .StallW, .TrapM, .mretM, .sretM, .InterruptM, .CauseM, 
-                    .MEDELEG_REGW, .MIDELEG_REGW, .STATUS_MPP, .STATUS_SPP, .NextPrivilegeModeM, .PrivilegeModeW);
+  privmode privmode(.clk, .reset, .StallW, .TrapM, .mretM, .sretM, .DelegateM,
+                    .STATUS_MPP, .STATUS_SPP, .NextPrivilegeModeM, .PrivilegeModeW);
 
   ///////////////////////////////////////////
   // decode privileged instructions
@@ -158,11 +159,11 @@ module privileged (
             .LoadPageFaultM, .StoreAmoPageFaultM,
             .mretM, .sretM, 
             .PrivilegeModeW, 
-            .MIP_REGW, .MIE_REGW, .MIDELEG_REGW,
+            .MIP_REGW, .MIE_REGW, .MIDELEG_REGW, .MEDELEG_REGW,
             .STATUS_MIE, .STATUS_SIE,
             .InstrValidM, .CommittedM,  
             .TrapM, .RetM,
-            .InterruptM, .IntPendingM,
+            .InterruptM, .IntPendingM, .DelegateM,
             .CauseM);
 endmodule
 
diff --git a/pipelined/src/privileged/privmode.sv b/pipelined/src/privileged/privmode.sv
index 9446c08c..768d8a36 100644
--- a/pipelined/src/privileged/privmode.sv
+++ b/pipelined/src/privileged/privmode.sv
@@ -33,25 +33,18 @@
 
 module privmode (
   input  logic             clk, reset,
-  input  logic             StallW, TrapM, mretM, sretM, InterruptM,
-  input  logic [`LOG_XLEN-1:0] CauseM, 
-  input  logic [`XLEN-1:0] MEDELEG_REGW,
-  input  logic [11:0]      MIDELEG_REGW,
+  input  logic             StallW, TrapM, mretM, sretM,
+  input  logic             DelegateM,
   input  logic [1:0]       STATUS_MPP,
   input  logic             STATUS_SPP,
   output logic [1:0]       NextPrivilegeModeM, PrivilegeModeW
 ); 
   
   if (`U_SUPPORTED) begin:privmode
-    logic       md;
-
-    // get bits of DELEG registers based on CAUSE
-    assign md = InterruptM ? MIDELEG_REGW[CauseM[3:0]] : MEDELEG_REGW[CauseM];
-    
     // PrivilegeMode FSM
     always_comb begin
       if (TrapM) begin // Change privilege based on DELEG registers (see 3.1.8)
-        if (`S_SUPPORTED & md & (PrivilegeModeW == `U_MODE | PrivilegeModeW == `S_MODE))
+        if (`S_SUPPORTED & DelegateM)
                           NextPrivilegeModeM = `S_MODE;
         else              NextPrivilegeModeM = `M_MODE;
       end else if (mretM) NextPrivilegeModeM = STATUS_MPP;
diff --git a/pipelined/src/privileged/trap.sv b/pipelined/src/privileged/trap.sv
index 6225b9c0..7bee52a0 100644
--- a/pipelined/src/privileged/trap.sv
+++ b/pipelined/src/privileged/trap.sv
@@ -39,11 +39,12 @@ module trap (
   (* mark_debug = "true" *) input logic 		   LoadPageFaultM, StoreAmoPageFaultM,
   (* mark_debug = "true" *) input logic 		   mretM, sretM, 
   input logic [1:0] 	   PrivilegeModeW, 
-  (* mark_debug = "true" *) input logic [11:0] 	   MIP_REGW, MIE_REGW, MIDELEG_REGW,
+  (* mark_debug = "true" *) input logic [11:0] 	   MIP_REGW, MIE_REGW, MIDELEG_REGW, 
+  input logic [`XLEN-1:0] MEDELEG_REGW,
   input logic 		   STATUS_MIE, STATUS_SIE,
   input logic 		   InstrValidM, CommittedM, 
   output logic 		   TrapM, RetM,
-  output logic 		   InterruptM, IntPendingM,
+  output logic 		   InterruptM, IntPendingM, DelegateM,
   output logic [`LOG_XLEN-1:0] CauseM 
 );
 
@@ -63,6 +64,8 @@ module trap (
   assign IntPendingM = |PendingIntsM;
   assign ValidIntsM = {12{MIntGlobalEnM}} & PendingIntsM & ~MIDELEG_REGW | {12{SIntGlobalEnM}} & PendingIntsM & MIDELEG_REGW; 
   assign InterruptM = (|ValidIntsM) && InstrValidM && ~(CommittedM);  // *** RT. CommittedM is a temporary hack to prevent integer division from having an interrupt during divide.
+  assign DelegateM = (InterruptM ? MIDELEG_REGW[CauseM[3:0]] : MEDELEG_REGW[CauseM]) & 
+                     (PrivilegeModeW == `U_MODE | PrivilegeModeW == `S_MODE);
 
   ///////////////////////////////////////////
   // Trigger Traps and RET

From 4ed7933aa3de3821b4829d50d5cff2f0cbe1c954 Mon Sep 17 00:00:00 2001
From: Katherine Parry <kparry4@gmail.com>
Date: Tue, 31 May 2022 16:18:50 +0000
Subject: [PATCH 02/14] added unpackinput.sv

---
 addins/riscv-arch-test            |   2 +-
 pipelined/regression/sim-fp-batch |   2 +-
 pipelined/src/fpu/fcvt.sv         |  14 +-
 pipelined/src/fpu/unpack.sv       | 538 +-----------------------------
 pipelined/src/fpu/unpackinput.sv  | 402 ++++++++++++++++++++++
 pipelined/src/generic/lzc.sv      |   6 +-
 6 files changed, 424 insertions(+), 540 deletions(-)
 create mode 100644 pipelined/src/fpu/unpackinput.sv

diff --git a/addins/riscv-arch-test b/addins/riscv-arch-test
index 307c77b2..be67c99b 160000
--- a/addins/riscv-arch-test
+++ b/addins/riscv-arch-test
@@ -1 +1 @@
-Subproject commit 307c77b26e070ae85ffea665ad9b642b40e33c86
+Subproject commit be67c99bd461742aa1c100bcc0732657faae2230
diff --git a/pipelined/regression/sim-fp-batch b/pipelined/regression/sim-fp-batch
index 7e2c6a34..ca0ba3d3 100755
--- a/pipelined/regression/sim-fp-batch
+++ b/pipelined/regression/sim-fp-batch
@@ -7,4 +7,4 @@
 # sqrt   - test square root
 # all    - test everything
 
-vsim -c -do "do fp.do rv64fp fma"
\ No newline at end of file
+vsim -c -do "do fp.do rv64fp cvtfp"
\ No newline at end of file
diff --git a/pipelined/src/fpu/fcvt.sv b/pipelined/src/fpu/fcvt.sv
index bebd0ef1..227b0098 100644
--- a/pipelined/src/fpu/fcvt.sv
+++ b/pipelined/src/fpu/fcvt.sv
@@ -42,7 +42,7 @@ module fcvt (
     logic [`XLEN-1:0]       TrimInt;    // integer trimmed to the correct size
     logic [`LGLEN-1:0]      LzcIn;      // input to the Leading Zero Counter (priority encoder)
     logic [`NE:0]           CalcExp;    // the calculated expoent
-	logic [$clog2(`LGLEN)-1:0] ShiftAmt;  // how much to shift by
+	logic [$clog2(`LGLEN+1)-1:0] ShiftAmt;  // how much to shift by
     logic [`LGLEN+`NF:0]    ShiftIn;    // number to be shifted
     logic                   ResDenormUf;// does the result underflow or is denormalized
     logic                   ResUf;      // does the result underflow
@@ -72,7 +72,7 @@ module fcvt (
     logic                   Int64;      // is the integer 64 bits?
     logic                   IntToFp;       // is the opperation an int->fp conversion?
     logic                   ToInt;      // is the opperation an fp->int conversion?
-    logic [$clog2(`LGLEN)-1:0] ZeroCnt; // output from the LZC
+    logic [$clog2(`LGLEN+1)-1:0] ZeroCnt; // output from the LZC
 
 
     // seperate OpCtrl for code readability
@@ -143,9 +143,9 @@ module fcvt (
     //              - only shift fp -> fp if the intital value is denormalized
     //                  - this is a problem because the input to the lzc was the fraction rather than the mantissa
     //                  - rather have a few and-gates than an extra bit in the priority encoder??? *** is this true?
-    assign ShiftAmt = ToInt ? CalcExp[$clog2(`LGLEN)-1:0]&{$clog2(`LGLEN){~CalcExp[`NE]}} :
-                    ResDenormUf&~IntToFp ? ($clog2(`LGLEN))'(`NF-1)+CalcExp[$clog2(`LGLEN)-1:0] : 
-                              (ZeroCnt+1)&{$clog2(`LGLEN){XDenormE|IntToFp}};
+    assign ShiftAmt = ToInt ? CalcExp[$clog2(`LGLEN+1)-1:0]&{$clog2(`LGLEN+1){~CalcExp[`NE]}} :
+                    ResDenormUf&~IntToFp ? ($clog2(`LGLEN+1))'(`NF-1)+CalcExp[$clog2(`LGLEN+1)-1:0] : 
+                              (ZeroCnt+1)&{$clog2(`LGLEN+1){XDenormE|IntToFp}};
     
     // shift
     //      fp -> int: |  `XLEN  zeros |     Mantissa      | 0's if nessisary | << CalcExp
@@ -255,13 +255,13 @@ module fcvt (
     //                  |     keep        |
     //
     //              - if the input is denormalized then we dont shift... so the  "- (ZeroCnt+1)" is just leftovers from other options
-    //      int -> fp : largest bias  XLEN - Largest bias + new bias - 1 - ZeroCnt = XLEN + NewBias - 1 - ZeroCnt
+    //      int -> fp : largest bias +  XLEN - Largest bias + new bias - 1 - ZeroCnt = XLEN + NewBias - 1 - ZeroCnt
     //              Process:
     //                  - shifted right by XLEN (XLEN)
     //                  - shift left to normilize (-1-ZeroCnt)
     //                  - newBias to make the biased exponent
     //          
-    assign CalcExp = {1'b0, OldExp} - (`NE+1)'(`BIAS) + {2'b0, NewBias} - {{`NE{1'b0}}, XDenormE|IntToFp} - {{`NE-$clog2(`LGLEN)+1{1'b0}}, (ZeroCnt&{$clog2(`LGLEN){XDenormE|IntToFp}})};
+    assign CalcExp = {1'b0, OldExp} - (`NE+1)'(`BIAS) + {2'b0, NewBias} - {{`NE{1'b0}}, XDenormE|IntToFp} - {{`NE-$clog2(`LGLEN+1)+1{1'b0}}, (ZeroCnt&{$clog2(`LGLEN+1){XDenormE|IntToFp}})};
     // find if the result is dnormal or underflows
     //      - if Calculated expoenent is 0 or negitive (and the input/result is not exactaly 0)
     //      - can't underflow an integer to Fp conversion
diff --git a/pipelined/src/fpu/unpack.sv b/pipelined/src/fpu/unpack.sv
index a10d1f8c..9e691e27 100644
--- a/pipelined/src/fpu/unpack.sv
+++ b/pipelined/src/fpu/unpack.sv
@@ -21,538 +21,20 @@ module unpack (
     logic           XExpZero, YExpZero, ZExpZero; // is the exponent zero
     logic           YExpMaxE, ZExpMaxE;  // is the exponent all 1s
     
-    if (`FPSIZES == 1) begin        // if there is only one floating point format supported
+    unpackinput unpackinputX (.In(X), .FmtE, .Sgn(XSgnE), .Exp(XExpE), .Man(XManE), 
+                            .NaN(XNaNE), .SNaN(XSNaNE), .Denorm(XDenormE), 
+                            .Zero(XZeroE), .Inf(XInfE), .ExpMax(XExpMaxE), .ExpZero(XExpZero));
 
-        // sign bit
-        assign XSgnE = X[`FLEN-1];
-        assign YSgnE = Y[`FLEN-1];
-        assign ZSgnE = Z[`FLEN-1];
+    unpackinput unpackinputY (.In(Y), .FmtE, .Sgn(YSgnE), .Exp(YExpE), .Man(YManE), 
+                            .NaN(YNaNE), .SNaN(YSNaNE), .Denorm(YDenormE), 
+                            .Zero(YZeroE), .Inf(YInfE), .ExpMax(YExpMaxE), .ExpZero(YExpZero));
 
-        // exponent
-        assign XExpE = {X[`FLEN-2:`NF+1], X[`NF]|XDenormE};
-        assign YExpE = {Y[`FLEN-2:`NF+1], Y[`NF]|YDenormE};
-        assign ZExpE = {Z[`FLEN-2:`NF+1], Z[`NF]|ZDenormE};
-
-        // fraction (no assumed 1)
-        assign XFracE = X[`NF-1:0];
-        assign YFracE = Y[`NF-1:0];
-        assign ZFracE = Z[`NF-1:0];
-
-        // is the exponent non-zero
-        assign XExpNonzero = |XExpE; 
-        assign YExpNonzero = |YExpE;
-        assign ZExpNonzero = |ZExpE;
-
-        // is the exponent all 1's
-        assign XExpMaxE = &XExpE;
-        assign YExpMaxE = &YExpE;
-        assign ZExpMaxE = &ZExpE;
-
-
-        // is the input (in it's original format) denormalized
-        assign XDenormE = ~|X[`FLEN-2:`NF] & ~XFracZero; 
-        assign YDenormE = ~|Y[`FLEN-2:`NF] & ~YFracZero; 
-        assign ZDenormE = ~|Z[`FLEN-2:`NF] & ~ZFracZero; 
-    
-
-    end else if (`FPSIZES == 2) begin   // if there are 2 floating point formats supported
-        //***need better names for these constants
-        // largest format | smaller format
-        //----------------------------------
-        //      `FLEN     |     `LEN1       length of floating point number
-        //      `NE       |     `NE1        length of exponent
-        //      `NF       |     `NF1        length of fraction
-        //      `BIAS     |     `BIAS1      exponent's bias value
-        //      `FMT      |     `FMT1       precision's format value - Q=11 D=01 S=00 H=10
-
-        // Possible combinantions specified by spec:
-        //      double and single
-        //      single and half
-
-        // Not needed but can also handle:
-        //      quad   and double
-        //      quad   and single
-        //      quad   and half
-        //      double and half
-
-        logic  [`LEN1-1:0]  XLen1, YLen1, ZLen1; // Remove NaN boxing or NaN, if not properly NaN boxed
-
-        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN
-        assign XLen1 = &X[`FLEN-1:`LEN1] ? X[`LEN1-1:0] : {1'b0, {`NE1+1{1'b1}}, (`NF1-1)'(0)};
-        assign YLen1 = &Y[`FLEN-1:`LEN1] ? Y[`LEN1-1:0] : {1'b0, {`NE1+1{1'b1}}, (`NF1-1)'(0)};
-        assign ZLen1 = &Z[`FLEN-1:`LEN1] ? Z[`LEN1-1:0] : {1'b0, {`NE1+1{1'b1}}, (`NF1-1)'(0)};  
-
-        // choose sign bit depending on format - 1=larger precsion 0=smaller precision
-        assign XSgnE = FmtE ? X[`FLEN-1] : XLen1[`LEN1-1];
-        assign YSgnE = FmtE ? Y[`FLEN-1] : YLen1[`LEN1-1];
-        assign ZSgnE = FmtE ? Z[`FLEN-1] : ZLen1[`LEN1-1];
-
-        // example double to single conversion:
-        // 1023 = 0011 1111 1111
-        // 127  = 0000 0111 1111 (subtract this)
-        // 896  = 0011 1000 0000
-        // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
-        // dexp = 0bdd dbbb bbbb 
-        // also need to take into account possible zero/denorm/inf/NaN values
-
-        // extract the exponent, converting the smaller exponent into the larger precision if nessisary
-        //      - if the original precision had a denormal number convert the exponent value 1
-        assign XExpE = FmtE ? {X[`FLEN-2:`NF+1], X[`NF]|XDenormE} : {XLen1[`LEN1-2], {`NE-`NE1{~XLen1[`LEN1-2]}}, XLen1[`LEN1-3:`NF1+1], XLen1[`NF1]|XDenormE}; 
-        assign YExpE = FmtE ? {Y[`FLEN-2:`NF+1], Y[`NF]|YDenormE} : {YLen1[`LEN1-2], {`NE-`NE1{~YLen1[`LEN1-2]}}, YLen1[`LEN1-3:`NF1+1], YLen1[`NF1]|YDenormE}; 
-        assign ZExpE = FmtE ? {Z[`FLEN-2:`NF+1], Z[`NF]|ZDenormE} : {ZLen1[`LEN1-2], {`NE-`NE1{~ZLen1[`LEN1-2]}}, ZLen1[`LEN1-3:`NF1+1], ZLen1[`NF1]|ZDenormE}; 
-
-        // is the input (in it's original format) denormalized
-
-                    // is the input (in it's original format) denormalized
-        assign XDenormE = (FmtE ? ~|X[`FLEN-2:`NF] : ~|XLen1[`LEN1-2:`NF1]) & ~XFracZero; 
-        assign YDenormE = (FmtE ? ~|Y[`FLEN-2:`NF] : ~|YLen1[`LEN1-2:`NF1]) & ~YFracZero; 
-        assign ZDenormE = (FmtE ? ~|Z[`FLEN-2:`NF] : ~|ZLen1[`LEN1-2:`NF1]) & ~ZFracZero; 
-
-        // extract the fraction, add trailing zeroes to the mantissa if nessisary
-        assign XFracE = FmtE ? X[`NF-1:0] : {XLen1[`NF1-1:0], (`NF-`NF1)'(0)};
-        assign YFracE = FmtE ? Y[`NF-1:0] : {YLen1[`NF1-1:0], (`NF-`NF1)'(0)};
-        assign ZFracE = FmtE ? Z[`NF-1:0] : {ZLen1[`NF1-1:0], (`NF-`NF1)'(0)};
-
-        // is the exponent non-zero
-        assign XExpNonzero = FmtE ? |X[`FLEN-2:`NF] : |XLen1[`LEN1-2:`NF1]; 
-        assign YExpNonzero = FmtE ? |Y[`FLEN-2:`NF] : |YLen1[`LEN1-2:`NF1];
-        assign ZExpNonzero = FmtE ? |Z[`FLEN-2:`NF] : |ZLen1[`LEN1-2:`NF1];
-
-        // is the exponent all 1's
-        assign XExpMaxE = FmtE ? &X[`FLEN-2:`NF] : &XLen1[`LEN1-2:`NF1];
-        assign YExpMaxE = FmtE ? &Y[`FLEN-2:`NF] : &YLen1[`LEN1-2:`NF1];
-        assign ZExpMaxE = FmtE ? &Z[`FLEN-2:`NF] : &ZLen1[`LEN1-2:`NF1];
-    
-
-    end else if (`FPSIZES == 3) begin       // three floating point precsions supported
-
-        //***need better names for these constants
-        // largest format | larger format  | smallest format
-        //---------------------------------------------------
-        //      `FLEN     |     `LEN1      |    `LEN2       length of floating point number
-        //      `NE       |     `NE1       |    `NE2        length of exponent
-        //      `NF       |     `NF1       |    `NF2        length of fraction
-        //      `BIAS     |     `BIAS1     |    `BIAS2      exponent's bias value
-        //      `FMT      |     `FMT1      |    `FMT2       precision's format value - Q=11 D=01 S=00 H=10
-
-        // Possible combinantions specified by spec:
-        //      quad   and double and single
-        //      double and single and half
-
-        // Not needed but can also handle:
-        //      quad   and double and half
-        //      quad   and single and half
-
-        logic  [`LEN1-1:0]  XLen1, YLen1, ZLen1; // Remove NaN boxing or NaN, if not properly NaN boxed for larger percision
-        logic  [`LEN2-1:0]  XLen2, YLen2, ZLen2; // Remove NaN boxing or NaN, if not properly NaN boxed for smallest precision
-        
-        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for larger precision
-        assign XLen1 = &X[`FLEN-1:`LEN1] ? X[`LEN1-1:0] : {1'b0, {`NE1+1{1'b1}}, (`NF1-1)'(0)};
-        assign YLen1 = &Y[`FLEN-1:`LEN1] ? Y[`LEN1-1:0] : {1'b0, {`NE1+1{1'b1}}, (`NF1-1)'(0)};
-        assign ZLen1 = &Z[`FLEN-1:`LEN1] ? Z[`LEN1-1:0] : {1'b0, {`NE1+1{1'b1}}, (`NF1-1)'(0)}; 
-
-        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for smaller precision
-        assign XLen2 = &X[`FLEN-1:`LEN2] ? X[`LEN2-1:0] : {1'b0, {`NE2+1{1'b1}}, (`NF2-1)'(0)};
-        assign YLen2 = &Y[`FLEN-1:`LEN2] ? Y[`LEN2-1:0] : {1'b0, {`NE2+1{1'b1}}, (`NF2-1)'(0)};
-        assign ZLen2 = &Z[`FLEN-1:`LEN2] ? Z[`LEN2-1:0] : {1'b0, {`NE2+1{1'b1}}, (`NF2-1)'(0)}; 
-
-        // There are 2 case statements
-        //      - one for other singals and one for sgn/exp/frac
-        //      - need two for the dependencies in the expoenent calculation
-        //*** pull out the ~FracZero and and it at the end
-        always_comb begin
-            case (FmtE)
-                `FMT: begin // if input is largest precision (`FLEN - ie quad or double)
-
-                    // This is the original format so set OrigDenorm to 0
-                    XDenormE = ~|X[`FLEN-2:`NF] & ~XFracZero; 
-                    YDenormE = ~|Y[`FLEN-2:`NF] & ~YFracZero; 
-                    ZDenormE = ~|Z[`FLEN-2:`NF] & ~ZFracZero; 
-
-                    // is the exponent non-zero
-                    XExpNonzero = |X[`FLEN-2:`NF]; 
-                    YExpNonzero = |Y[`FLEN-2:`NF];
-                    ZExpNonzero = |Z[`FLEN-2:`NF];
-
-                    // is the exponent all 1's
-                    XExpMaxE = &X[`FLEN-2:`NF];
-                    YExpMaxE = &Y[`FLEN-2:`NF];
-                    ZExpMaxE = &Z[`FLEN-2:`NF];
-                end
-                `FMT1: begin    // if input is larger precsion (`LEN1 - double or single)
-
-                    // is the input (in it's original format) denormalized
-                    XDenormE = ~|XLen1[`LEN1-2:`NF1] & ~XFracZero; 
-                    YDenormE = ~|YLen1[`LEN1-2:`NF1] & ~YFracZero; 
-                    ZDenormE = ~|ZLen1[`LEN1-2:`NF1] & ~ZFracZero; 
-
-                    // is the exponent non-zero
-                    XExpNonzero = |XLen1[`LEN1-2:`NF1]; 
-                    YExpNonzero = |YLen1[`LEN1-2:`NF1];
-                    ZExpNonzero = |ZLen1[`LEN1-2:`NF1];
-
-                    // is the exponent all 1's
-                    XExpMaxE = &XLen1[`LEN1-2:`NF1];
-                    YExpMaxE = &YLen1[`LEN1-2:`NF1];
-                    ZExpMaxE = &ZLen1[`LEN1-2:`NF1];
-                end
-                `FMT2: begin        // if input is smallest precsion (`LEN2 - single or half)
-
-                    // is the input (in it's original format) denormalized
-                    XDenormE = ~|XLen2[`LEN2-2:`NF2] & ~XFracZero; 
-                    YDenormE = ~|YLen2[`LEN2-2:`NF2] & ~YFracZero; 
-                    ZDenormE = ~|ZLen2[`LEN2-2:`NF2] & ~ZFracZero; 
-
-                    // is the exponent non-zero
-                    XExpNonzero = |XLen2[`LEN2-2:`NF2]; 
-                    YExpNonzero = |YLen2[`LEN2-2:`NF2];
-                    ZExpNonzero = |ZLen2[`LEN2-2:`NF2];
-
-                    // is the exponent all 1's
-                    XExpMaxE = &XLen2[`LEN2-2:`NF2];
-                    YExpMaxE = &YLen2[`LEN2-2:`NF2];
-                    ZExpMaxE = &ZLen2[`LEN2-2:`NF2];
-                end
-                default: begin
-                    XDenormE = 0; 
-                    YDenormE = 0; 
-                    ZDenormE = 0; 
-                    XExpNonzero = 0; 
-                    YExpNonzero = 0;
-                    ZExpNonzero = 0;
-                    XExpMaxE = 0;
-                    YExpMaxE = 0;
-                    ZExpMaxE = 0;
-                end
-            endcase
-        end
-        always_comb begin
-            case (FmtE)
-                `FMT: begin // if input is largest precision (`FLEN - ie quad or double)
-                    // extract the sign bit
-                    XSgnE = X[`FLEN-1];
-                    YSgnE = Y[`FLEN-1];
-                    ZSgnE = Z[`FLEN-1];
-
-                    // extract the exponent
-                    XExpE = {X[`FLEN-2:`NF+1], X[`NF]|XDenormE};
-                    YExpE = {Y[`FLEN-2:`NF+1], Y[`NF]|YDenormE};
-                    ZExpE = {Z[`FLEN-2:`NF+1], Z[`NF]|ZDenormE};
-
-                    // extract the fraction
-                    XFracE = X[`NF-1:0];
-                    YFracE = Y[`NF-1:0];
-                    ZFracE = Z[`NF-1:0];
-                end
-                `FMT1: begin    // if input is larger precsion (`LEN1 - double or single)
-
-                    // extract the sign bit
-                    XSgnE = XLen1[`LEN1-1];
-                    YSgnE = YLen1[`LEN1-1];
-                    ZSgnE = ZLen1[`LEN1-1];
-
-                    // example double to single conversion:
-                    // 1023 = 0011 1111 1111
-                    // 127  = 0000 0111 1111 (subtract this)
-                    // 896  = 0011 1000 0000
-                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
-                    // dexp = 0bdd dbbb bbbb 
-                    // also need to take into account possible zero/denorm/inf/NaN values
-
-                    // convert the larger precision's exponent to use the largest precision's bias
-                    XExpE = {XLen1[`LEN1-2], {`NE-`NE1{~XLen1[`LEN1-2]}}, XLen1[`LEN1-3:`NF1+1], XLen1[`NF1]|XDenormE}; 
-                    YExpE = {YLen1[`LEN1-2], {`NE-`NE1{~YLen1[`LEN1-2]}}, YLen1[`LEN1-3:`NF1+1], YLen1[`NF1]|YDenormE}; 
-                    ZExpE = {ZLen1[`LEN1-2], {`NE-`NE1{~ZLen1[`LEN1-2]}}, ZLen1[`LEN1-3:`NF1+1], ZLen1[`NF1]|ZDenormE}; 
-
-                    // extract the fraction and add the nessesary trailing zeros
-                    XFracE = {XLen1[`NF1-1:0], (`NF-`NF1)'(0)};
-                    YFracE = {YLen1[`NF1-1:0], (`NF-`NF1)'(0)};
-                    ZFracE = {ZLen1[`NF1-1:0], (`NF-`NF1)'(0)};
-                end
-                `FMT2: begin        // if input is smallest precsion (`LEN2 - single or half)
-
-                    // exctract the sign bit
-                    XSgnE = XLen2[`LEN2-1];
-                    YSgnE = YLen2[`LEN2-1];
-                    ZSgnE = ZLen2[`LEN2-1];
-
-                    // example double to single conversion:
-                    // 1023 = 0011 1111 1111
-                    // 127  = 0000 0111 1111 (subtract this)
-                    // 896  = 0011 1000 0000
-                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
-                    // dexp = 0bdd dbbb bbbb 
-                    // also need to take into account possible zero/denorm/inf/NaN values
-                    
-                    // convert the smallest precision's exponent to use the largest precision's bias
-                    XExpE = XDenormE ? {1'b0, {`NE-`NE2{1'b1}}, (`NE2-1)'(1)} : {XLen2[`LEN2-2], {`NE-`NE2{~XLen2[`LEN2-2]}}, XLen2[`LEN2-3:`NF2]}; 
-                    YExpE = YDenormE ? {1'b0, {`NE-`NE2{1'b1}}, (`NE2-1)'(1)} : {YLen2[`LEN2-2], {`NE-`NE2{~YLen2[`LEN2-2]}}, YLen2[`LEN2-3:`NF2]}; 
-                    ZExpE = ZDenormE ? {1'b0, {`NE-`NE2{1'b1}}, (`NE2-1)'(1)} : {ZLen2[`LEN2-2], {`NE-`NE2{~ZLen2[`LEN2-2]}}, ZLen2[`LEN2-3:`NF2]}; 
-
-                    // extract the fraction and add the nessesary trailing zeros
-                    XFracE = {XLen2[`NF2-1:0], (`NF-`NF2)'(0)};
-                    YFracE = {YLen2[`NF2-1:0], (`NF-`NF2)'(0)};
-                    ZFracE = {ZLen2[`NF2-1:0], (`NF-`NF2)'(0)};
-                end
-                default: begin
-                    XSgnE = 0;
-                    YSgnE = 0;
-                    ZSgnE = 0;
-                    XExpE = 0; 
-                    YExpE = 0;
-                    ZExpE = 0; 
-                    XFracE = 0;
-                    YFracE = 0;
-                    ZFracE = 0;
-                end
-            endcase
-        end
-
-    end else if (`FPSIZES == 4) begin      // if all precsisons are supported - quad, double, single, and half
-    
-        //    quad   |  double  |  single  |  half    
-        //-------------------------------------------------------------------
-        //   `Q_LEN  |  `D_LEN  |  `S_LEN  |  `H_LEN     length of floating point number
-        //   `Q_NE   |  `D_NE   |  `S_NE   |  `H_NE      length of exponent
-        //   `Q_NF   |  `D_NF   |  `S_NF   |  `H_NF      length of fraction
-        //   `Q_BIAS |  `D_BIAS |  `S_BIAS |  `H_BIAS    exponent's bias value
-        //   `Q_FMT  |  `D_FMT  |  `S_FMT  |  `H_FMT     precision's format value - Q=11 D=01 S=00 H=10
-
-
-        logic  [`D_LEN-1:0]  XLen1, YLen1, ZLen1; // Remove NaN boxing or NaN, if not properly NaN boxed for double percision
-        logic  [`S_LEN-1:0]  XLen2, YLen2, ZLen2; // Remove NaN boxing or NaN, if not properly NaN boxed for single percision
-        logic  [`H_LEN-1:0]  XLen3, YLen3, ZLen3; // Remove NaN boxing or NaN, if not properly NaN boxed for half percision
-        
-        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for double precision
-        assign XLen1 = &X[`Q_LEN-1:`D_LEN] ? X[`D_LEN-1:0] : {1'b0, {`D_NE+1{1'b1}}, (`D_NF-1)'(0)};
-        assign YLen1 = &Y[`Q_LEN-1:`D_LEN] ? Y[`D_LEN-1:0] : {1'b0, {`D_NE+1{1'b1}}, (`D_NF-1)'(0)};
-        assign ZLen1 = &Z[`Q_LEN-1:`D_LEN] ? Z[`D_LEN-1:0] : {1'b0, {`D_NE+1{1'b1}}, (`D_NF-1)'(0)}; 
-
-        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for single precision
-        assign XLen2 = &X[`Q_LEN-1:`S_LEN] ? X[`S_LEN-1:0] : {1'b0, {`S_NE+1{1'b1}}, (`S_NF-1)'(0)};
-        assign YLen2 = &Y[`Q_LEN-1:`S_LEN] ? Y[`S_LEN-1:0] : {1'b0, {`S_NE+1{1'b1}}, (`S_NF-1)'(0)};
-        assign ZLen2 = &Z[`Q_LEN-1:`S_LEN] ? Z[`S_LEN-1:0] : {1'b0, {`S_NE+1{1'b1}}, (`S_NF-1)'(0)}; 
-
-        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for half precision
-        assign XLen3 = &X[`Q_LEN-1:`H_LEN] ? X[`H_LEN-1:0] : {1'b0, {`H_NE+1{1'b1}}, (`H_NF-1)'(0)};
-        assign YLen3 = &Y[`Q_LEN-1:`H_LEN] ? Y[`H_LEN-1:0] : {1'b0, {`H_NE+1{1'b1}}, (`H_NF-1)'(0)};
-        assign ZLen3 = &Z[`Q_LEN-1:`H_LEN] ? Z[`H_LEN-1:0] : {1'b0, {`H_NE+1{1'b1}}, (`H_NF-1)'(0)}; 
-
-
-        // There are 2 case statements
-        //      - one for other singals and one for sgn/exp/frac
-        //      - need two for the dependencies in the expoenent calculation
-        always_comb begin
-            case (FmtE)
-                2'b11: begin  // if input is quad percision
-
-                    // is the input (in it's original format) denormalized
-                    XDenormE = ~|X[`Q_LEN-2:`Q_NF] & ~XFracZero; 
-                    YDenormE = ~|Y[`Q_LEN-2:`Q_NF] & ~YFracZero; 
-                    ZDenormE = ~|Z[`Q_LEN-2:`Q_NF] & ~ZFracZero; 
-
-                    // is the exponent non-zero
-                    XExpNonzero = |X[`Q_LEN-2:`Q_NF]; 
-                    YExpNonzero = |Y[`Q_LEN-2:`Q_NF];
-                    ZExpNonzero = |Z[`Q_LEN-2:`Q_NF];
-
-                    // is the exponent all 1's
-                    XExpMaxE = &X[`Q_LEN-2:`Q_NF];
-                    YExpMaxE = &Y[`Q_LEN-2:`Q_NF];
-                    ZExpMaxE = &Z[`Q_LEN-2:`Q_NF];
-                end
-                2'b01: begin  // if input is double percision
-
-                    // is the exponent all 1's
-                    XExpMaxE = &XLen1[`D_LEN-2:`D_NF];
-                    YExpMaxE = &YLen1[`D_LEN-2:`D_NF];
-                    ZExpMaxE = &ZLen1[`D_LEN-2:`D_NF];
-
-                    // is the input (in it's original format) denormalized
-                    XDenormE = ~|XLen1[`D_LEN-2:`D_NF] & ~XFracZero; 
-                    YDenormE = ~|YLen1[`D_LEN-2:`D_NF] & ~YFracZero; 
-                    ZDenormE = ~|ZLen1[`D_LEN-2:`D_NF] & ~ZFracZero; 
-
-                    // is the exponent non-zero
-                    XExpNonzero = |XLen1[`D_LEN-2:`D_NF]; 
-                    YExpNonzero = |YLen1[`D_LEN-2:`D_NF];
-                    ZExpNonzero = |ZLen1[`D_LEN-2:`D_NF];
-                end
-                2'b00: begin      // if input is single percision
-
-                    // is the exponent all 1's
-                    XExpMaxE = &XLen2[`S_LEN-2:`S_NF];
-                    YExpMaxE = &YLen2[`S_LEN-2:`S_NF];
-                    ZExpMaxE = &ZLen2[`S_LEN-2:`S_NF];
-
-                    // is the input (in it's original format) denormalized
-                    XDenormE = ~|XLen2[`S_LEN-2:`S_NF] & ~XFracZero; 
-                    YDenormE = ~|YLen2[`S_LEN-2:`S_NF] & ~YFracZero; 
-                    ZDenormE = ~|ZLen2[`S_LEN-2:`S_NF] & ~ZFracZero; 
-
-                    // is the exponent non-zero
-                    XExpNonzero = |XLen2[`S_LEN-2:`S_NF]; 
-                    YExpNonzero = |YLen2[`S_LEN-2:`S_NF];
-                    ZExpNonzero = |ZLen2[`S_LEN-2:`S_NF];
-                end
-                2'b10: begin      // if input is half percision
-
-                    // is the exponent all 1's
-                    XExpMaxE = &XLen3[`H_LEN-2:`H_NF];
-                    YExpMaxE = &YLen3[`H_LEN-2:`H_NF];
-                    ZExpMaxE = &ZLen3[`H_LEN-2:`H_NF];
-
-                    // is the input (in it's original format) denormalized
-                    XDenormE = ~|XLen3[`H_LEN-2:`H_NF] & ~XFracZero; 
-                    YDenormE = ~|YLen3[`H_LEN-2:`H_NF] & ~YFracZero; 
-                    ZDenormE = ~|ZLen3[`H_LEN-2:`H_NF] & ~ZFracZero; 
-
-                    // is the exponent non-zero
-                    XExpNonzero = |XLen3[`H_LEN-2:`H_NF]; 
-                    YExpNonzero = |YLen3[`H_LEN-2:`H_NF];
-                    ZExpNonzero = |ZLen3[`H_LEN-2:`H_NF];
-                end
-            endcase
-        end
-
-        always_comb begin
-            case (FmtE)
-                2'b11: begin  // if input is quad percision
-                    // extract sign bit
-                    XSgnE = X[`Q_LEN-1];
-                    YSgnE = Y[`Q_LEN-1];
-                    ZSgnE = Z[`Q_LEN-1];
-
-                    // extract the exponent
-                    XExpE = {X[`Q_LEN-2:`Q_NF+1], X[`Q_NF]|XDenormE};
-                    YExpE = {Y[`Q_LEN-2:`Q_NF+1], Y[`Q_NF]|YDenormE};
-                    ZExpE = {Z[`Q_LEN-2:`Q_NF+1], Z[`Q_NF]|ZDenormE};
-
-                    // extract the fraction
-                    XFracE = X[`Q_NF-1:0];
-                    YFracE = Y[`Q_NF-1:0];
-                    ZFracE = Z[`Q_NF-1:0];
-                end
-                2'b01: begin  // if input is double percision
-                    // extract sign bit
-                    XSgnE = XLen1[`D_LEN-1];
-                    YSgnE = YLen1[`D_LEN-1];
-                    ZSgnE = ZLen1[`D_LEN-1];
-
-                    // example double to single conversion:
-                    // 1023 = 0011 1111 1111
-                    // 127  = 0000 0111 1111 (subtract this)
-                    // 896  = 0011 1000 0000
-                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
-                    // dexp = 0bdd dbbb bbbb 
-                    // also need to take into account possible zero/denorm/inf/NaN values
-                    
-                    // convert the double precsion exponent into quad precsion
-
-                    XExpE = {XLen1[`D_LEN-2], {`Q_NE-`D_NE{~XLen1[`D_LEN-2]}}, XLen1[`D_LEN-3:`D_NF+1], XLen1[`D_NF]|XDenormE}; 
-                    YExpE = {YLen1[`D_LEN-2], {`Q_NE-`D_NE{~YLen1[`D_LEN-2]}}, YLen1[`D_LEN-3:`D_NF+1], YLen1[`D_NF]|YDenormE}; 
-                    ZExpE = {ZLen1[`D_LEN-2], {`Q_NE-`D_NE{~ZLen1[`D_LEN-2]}}, ZLen1[`D_LEN-3:`D_NF+1], ZLen1[`D_NF]|ZDenormE}; 
-
-                    // extract the fraction and add the nessesary trailing zeros
-                    XFracE = {XLen1[`D_NF-1:0], (`Q_NF-`D_NF)'(0)};
-                    YFracE = {YLen1[`D_NF-1:0], (`Q_NF-`D_NF)'(0)};
-                    ZFracE = {ZLen1[`D_NF-1:0], (`Q_NF-`D_NF)'(0)};
-                end
-                2'b00: begin      // if input is single percision
-                    // extract sign bit
-                    XSgnE = XLen2[`S_LEN-1];
-                    YSgnE = YLen2[`S_LEN-1];
-                    ZSgnE = ZLen2[`S_LEN-1];
-
-                    // example double to single conversion:
-                    // 1023 = 0011 1111 1111
-                    // 127  = 0000 0111 1111 (subtract this)
-                    // 896  = 0011 1000 0000
-                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
-                    // dexp = 0bdd dbbb bbbb 
-                    // also need to take into account possible zero/denorm/inf/NaN values
-                    
-                    // convert the single precsion exponent into quad precsion
-                    XExpE = {XLen2[`S_LEN-2], {`Q_NE-`S_NE{~XLen2[`S_LEN-2]}}, XLen2[`S_LEN-3:`S_NF+1], XLen2[`S_NF]|XDenormE}; 
-                    YExpE = {YLen2[`S_LEN-2], {`Q_NE-`S_NE{~YLen2[`S_LEN-2]}}, YLen2[`S_LEN-3:`S_NF+1], YLen2[`S_NF]|YDenormE}; 
-                    ZExpE = {ZLen2[`S_LEN-2], {`Q_NE-`S_NE{~ZLen2[`S_LEN-2]}}, ZLen2[`S_LEN-3:`S_NF+1], ZLen2[`S_NF]|ZDenormE}; 
-
-                    // extract the fraction and add the nessesary trailing zeros
-                    XFracE = {XLen2[`S_NF-1:0], (`Q_NF-`S_NF)'(0)};
-                    YFracE = {YLen2[`S_NF-1:0], (`Q_NF-`S_NF)'(0)};
-                    ZFracE = {ZLen2[`S_NF-1:0], (`Q_NF-`S_NF)'(0)};
-                end
-                2'b10: begin      // if input is half percision
-                    // extract sign bit
-                    XSgnE = XLen3[`H_LEN-1];
-                    YSgnE = YLen3[`H_LEN-1];
-                    ZSgnE = ZLen3[`H_LEN-1];
-
-                    // example double to single conversion:
-                    // 1023 = 0011 1111 1111
-                    // 127  = 0000 0111 1111 (subtract this)
-                    // 896  = 0011 1000 0000
-                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
-                    // dexp = 0bdd dbbb bbbb 
-                    // also need to take into account possible zero/denorm/inf/NaN values
-
-                    // convert the half precsion exponent into quad precsion
-                    XExpE = {XLen3[`H_LEN-2], {`Q_NE-`H_NE{~XLen3[`H_LEN-2]}}, XLen3[`H_LEN-3:`H_NF+1], XLen3[`H_NF]|XDenormE}; 
-                    YExpE = {YLen3[`H_LEN-2], {`Q_NE-`H_NE{~YLen3[`H_LEN-2]}}, YLen3[`H_LEN-3:`H_NF+1], YLen3[`H_NF]|YDenormE}; 
-                    ZExpE = {ZLen3[`H_LEN-2], {`Q_NE-`H_NE{~ZLen3[`H_LEN-2]}}, ZLen3[`H_LEN-3:`H_NF+1], ZLen3[`H_NF]|ZDenormE}; 
-
-                    // extract the fraction and add the nessesary trailing zeros
-                    XFracE = {XLen3[`H_NF-1:0], (`Q_NF-`H_NF)'(0)};
-                    YFracE = {YLen3[`H_NF-1:0], (`Q_NF-`H_NF)'(0)};
-                    ZFracE = {ZLen3[`H_NF-1:0], (`Q_NF-`H_NF)'(0)};
-                end
-            endcase
-        end
-
-    end
-
-    // is the exponent all 0's
-    assign XExpZero = ~XExpNonzero;
-    assign YExpZero = ~YExpNonzero;
-    assign ZExpZero = ~ZExpNonzero;
-
-    // is the fraction zero
-    assign XFracZero = ~|XFracE;
-    assign YFracZero = ~|YFracE;
-    assign ZFracZero = ~|ZFracE;
-
-    // add the assumed one (or zero if denormal or zero) to create the mantissa
-    assign XManE = {XExpNonzero, XFracE};
-    assign YManE = {YExpNonzero, YFracE};
-    assign ZManE = {ZExpNonzero, ZFracE};
+    unpackinput unpackinputZ (.In(Z), .FmtE, .Sgn(ZSgnE), .Exp(ZExpE), .Man(ZManE), 
+                            .NaN(ZNaNE), .SNaN(ZSNaNE), .Denorm(ZDenormE), 
+                            .Zero(ZZeroE), .Inf(ZInfE), .ExpMax(ZExpMaxE), .ExpZero(ZExpZero));
 
+                            
     // is X normalized
     assign XNormE = ~(XExpMaxE|XExpZero);
     
-    // is the input a NaN
-    //     - force to be a NaN if it isn't properly Nan Boxed
-    assign XNaNE = XExpMaxE & ~XFracZero;
-    assign YNaNE = YExpMaxE & ~YFracZero;
-    assign ZNaNE = ZExpMaxE & ~ZFracZero;
-
-    // is the input a singnaling NaN
-    assign XSNaNE = XNaNE&~XFracE[`NF-1];
-    assign YSNaNE = YNaNE&~YFracE[`NF-1];
-    assign ZSNaNE = ZNaNE&~ZFracE[`NF-1];
-
-    // // is the input denormalized
-    // assign XDenormE = XExpZero & ~XFracZero;
-    // assign YDenormE = YExpZero & ~YFracZero;
-    // assign ZDenormE = ZExpZero & ~ZFracZero;
-
-    // is the input infinity
-    assign XInfE = XExpMaxE & XFracZero;
-    assign YInfE = YExpMaxE & YFracZero;
-    assign ZInfE = ZExpMaxE & ZFracZero;
-
-    // is the input zero
-    assign XZeroE = XExpZero & XFracZero;
-    assign YZeroE = YExpZero & YFracZero;
-    assign ZZeroE = ZExpZero & ZFracZero;
-    
 endmodule
\ No newline at end of file
diff --git a/pipelined/src/fpu/unpackinput.sv b/pipelined/src/fpu/unpackinput.sv
new file mode 100644
index 00000000..e8bd22fb
--- /dev/null
+++ b/pipelined/src/fpu/unpackinput.sv
@@ -0,0 +1,402 @@
+`include "wally-config.vh"
+
+module unpackinput ( 
+    input logic  [`FLEN-1:0]        In,    // inputs from register file
+    input logic  [`FPSIZES/3:0]     FmtE,       // format signal 00 - single 01 - double 11 - quad 10 - half
+    output logic                    Sgn,    // sign bits of XYZ
+    output logic [`NE-1:0]          Exp,    // exponents of XYZ (converted to largest supported precision)
+    output logic [`NF:0]            Man,    // mantissas of XYZ (converted to largest supported precision)
+    output logic                    NaN,    // is XYZ a NaN
+    output logic                    SNaN, // is XYZ a signaling NaN
+    output logic                    Denorm,   // is XYZ denormalized
+    output logic                    Zero,         // is XYZ zero
+    output logic                    Inf,            // is XYZ infinity
+    output logic                    ExpMax,                        // does In have the maximum exponent (NaN or Inf)
+    output logic                    ExpZero                        // is the exponent zero
+);
+ 
+    logic [`NF-1:0] Frac; //Fraction of XYZ
+    logic           ExpNonZero; // is the exponent of XYZ non-zero
+    logic           FracZero; // is the fraction zero
+    
+    if (`FPSIZES == 1) begin        // if there is only one floating point format supported
+
+        // sign bit
+        assign Sgn = In[`FLEN-1];
+
+        // exponent
+        assign Exp = {In[`FLEN-2:`NF+1], In[`NF]|Denorm};
+
+        // fraction (no assumed 1)
+        assign Frac = In[`NF-1:0];
+
+        // is the exponent non-zero
+        assign ExpNonZero = |Exp; 
+
+        // is the exponent all 1's
+        assign ExpMax = &Exp;
+
+
+        // is the input (in it's original format) denormalized
+        assign Denorm = ~|In[`FLEN-2:`NF] & ~FracZero; 
+    
+
+    end else if (`FPSIZES == 2) begin   // if there are 2 floating point formats supported
+        //***need better names for these constants
+        // largest format | smaller format
+        //----------------------------------
+        //      `FLEN     |     `LEN1       length of floating point number
+        //      `NE       |     `NE1        length of exponent
+        //      `NF       |     `NF1        length of fraction
+        //      `BIAS     |     `BIAS1      exponent's bias value
+        //      `FMT      |     `FMT1       precision's format value - Q=11 D=01 S=00 H=10
+
+        // Possible combinantions specified by spec:
+        //      double and single
+        //      single and half
+
+        // Not needed but can also handle:
+        //      quad   and double
+        //      quad   and single
+        //      quad   and half
+        //      double and half
+
+        logic  [`LEN1-1:0]  Len1; // Remove NaN boxing or NaN, if not properly NaN boxed
+
+        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN
+        assign Len1 = &In[`FLEN-1:`LEN1] ? In[`LEN1-1:0] : {1'b0, {`NE1+1{1'b1}}, (`NF1-1)'(0)};
+
+        // choose sign bit depending on format - 1=larger precsion 0=smaller precision
+        assign Sgn = FmtE ? In[`FLEN-1] : Len1[`LEN1-1];
+
+        // example double to single conversion:
+        // 1023 = 0011 1111 1111
+        // 127  = 0000 0111 1111 (subtract this)
+        // 896  = 0011 1000 0000
+        // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
+        // dexp = 0bdd dbbb bbbb 
+        // also need to take into account possible zero/denorm/inf/NaN values
+
+        // extract the exponent, converting the smaller exponent into the larger precision if nessisary
+        //      - if the original precision had a denormal number convert the exponent value 1
+        assign Exp = FmtE ? {In[`FLEN-2:`NF+1], In[`NF]|Denorm} : {Len1[`LEN1-2], {`NE-`NE1{~Len1[`LEN1-2]}}, Len1[`LEN1-3:`NF1+1], Len1[`NF1]|Denorm}; 
+
+        // is the input (in it's original format) denormalized
+
+                    // is the input (in it's original format) denormalized
+        assign Denorm = (FmtE ? ~|In[`FLEN-2:`NF] : ~|Len1[`LEN1-2:`NF1]) & ~FracZero; 
+
+        // extract the fraction, add trailing zeroes to the mantissa if nessisary
+        assign Frac = FmtE ? In[`NF-1:0] : {Len1[`NF1-1:0], (`NF-`NF1)'(0)};
+
+        // is the exponent non-zero
+        assign ExpNonZero = FmtE ? |In[`FLEN-2:`NF] : |Len1[`LEN1-2:`NF1]; 
+
+        // is the exponent all 1's
+        assign ExpMax = FmtE ? &In[`FLEN-2:`NF] : &Len1[`LEN1-2:`NF1];
+    
+
+    end else if (`FPSIZES == 3) begin       // three floating point precsions supported
+
+        //***need better names for these constants
+        // largest format | larger format  | smallest format
+        //---------------------------------------------------
+        //      `FLEN     |     `LEN1      |    `LEN2       length of floating point number
+        //      `NE       |     `NE1       |    `NE2        length of exponent
+        //      `NF       |     `NF1       |    `NF2        length of fraction
+        //      `BIAS     |     `BIAS1     |    `BIAS2      exponent's bias value
+        //      `FMT      |     `FMT1      |    `FMT2       precision's format value - Q=11 D=01 S=00 H=10
+
+        // Possible combinantions specified by spec:
+        //      quad   and double and single
+        //      double and single and half
+
+        // Not needed but can also handle:
+        //      quad   and double and half
+        //      quad   and single and half
+
+        logic  [`LEN1-1:0]  Len1; // Remove NaN boxing or NaN, if not properly NaN boxed for larger percision
+        logic  [`LEN2-1:0]  Len2; // Remove NaN boxing or NaN, if not properly NaN boxed for smallest precision
+        
+        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for larger precision
+        assign Len1 = &In[`FLEN-1:`LEN1] ? In[`LEN1-1:0] : {1'b0, {`NE1+1{1'b1}}, (`NF1-1)'(0)};
+
+        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for smaller precision
+        assign Len2 = &In[`FLEN-1:`LEN2] ? In[`LEN2-1:0] : {1'b0, {`NE2+1{1'b1}}, (`NF2-1)'(0)};
+
+        // There are 2 case statements
+        //      - one for other singals and one for sgn/exp/frac
+        //      - need two for the dependencies in the expoenent calculation
+        //*** pull out the ~FracZero and and it at the end
+        always_comb begin
+            case (FmtE)
+                `FMT: begin // if input is largest precision (`FLEN - ie quad or double)
+
+                    // This is the original format so set OrigDenorm to 0
+                    Denorm = ~|In[`FLEN-2:`NF] & ~FracZero; 
+
+                    // is the exponent non-zero
+                    ExpNonZero = |In[`FLEN-2:`NF]; 
+
+                    // is the exponent all 1's
+                    ExpMax = &In[`FLEN-2:`NF];
+                end
+                `FMT1: begin    // if input is larger precsion (`LEN1 - double or single)
+
+                    // is the input (in it's original format) denormalized
+                    Denorm = ~|Len1[`LEN1-2:`NF1] & ~FracZero; 
+
+                    // is the exponent non-zero
+                    ExpNonZero = |Len1[`LEN1-2:`NF1]; 
+
+                    // is the exponent all 1's
+                    ExpMax = &Len1[`LEN1-2:`NF1];
+                end
+                `FMT2: begin        // if input is smallest precsion (`LEN2 - single or half)
+
+                    // is the input (in it's original format) denormalized
+                    Denorm = ~|Len2[`LEN2-2:`NF2] & ~FracZero; 
+
+                    // is the exponent non-zero
+                    ExpNonZero = |Len2[`LEN2-2:`NF2]; 
+
+                    // is the exponent all 1's
+                    ExpMax = &Len2[`LEN2-2:`NF2];
+                end
+                default: begin
+                    Denorm = 0; 
+                    ExpNonZero = 0; 
+                    ExpMax = 0;
+                end
+            endcase
+        end
+        always_comb begin
+            case (FmtE)
+                `FMT: begin // if input is largest precision (`FLEN - ie quad or double)
+                    // extract the sign bit
+                    Sgn = In[`FLEN-1];
+
+                    // extract the exponent
+                    Exp = {In[`FLEN-2:`NF+1], In[`NF]|Denorm};
+
+                    // extract the fraction
+                    Frac = In[`NF-1:0];
+                end
+                `FMT1: begin    // if input is larger precsion (`LEN1 - double or single)
+
+                    // extract the sign bit
+                    Sgn = Len1[`LEN1-1];
+
+                    // example double to single conversion:
+                    // 1023 = 0011 1111 1111
+                    // 127  = 0000 0111 1111 (subtract this)
+                    // 896  = 0011 1000 0000
+                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
+                    // dexp = 0bdd dbbb bbbb 
+                    // also need to take into account possible zero/denorm/inf/NaN values
+
+                    // convert the larger precision's exponent to use the largest precision's bias
+                    Exp = {Len1[`LEN1-2], {`NE-`NE1{~Len1[`LEN1-2]}}, Len1[`LEN1-3:`NF1+1], Len1[`NF1]|Denorm}; 
+
+                    // extract the fraction and add the nessesary trailing zeros
+                    Frac = {Len1[`NF1-1:0], (`NF-`NF1)'(0)};
+                end
+                `FMT2: begin        // if input is smallest precsion (`LEN2 - single or half)
+
+                    // exctract the sign bit
+                    Sgn = Len2[`LEN2-1];
+
+                    // example double to single conversion:
+                    // 1023 = 0011 1111 1111
+                    // 127  = 0000 0111 1111 (subtract this)
+                    // 896  = 0011 1000 0000
+                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
+                    // dexp = 0bdd dbbb bbbb 
+                    // also need to take into account possible zero/denorm/inf/NaN values
+                    
+                    // convert the smallest precision's exponent to use the largest precision's bias
+                    Exp = Denorm ? {1'b0, {`NE-`NE2{1'b1}}, (`NE2-1)'(1)} : {Len2[`LEN2-2], {`NE-`NE2{~Len2[`LEN2-2]}}, Len2[`LEN2-3:`NF2]}; 
+
+                    // extract the fraction and add the nessesary trailing zeros
+                    Frac = {Len2[`NF2-1:0], (`NF-`NF2)'(0)};
+                end
+                default: begin
+                    Sgn = 0;
+                    Exp = 0; 
+                    Frac = 0;
+                end
+            endcase
+        end
+
+    end else if (`FPSIZES == 4) begin      // if all precsisons are supported - quad, double, single, and half
+    
+        //    quad   |  double  |  single  |  half    
+        //-------------------------------------------------------------------
+        //   `Q_LEN  |  `D_LEN  |  `S_LEN  |  `H_LEN     length of floating point number
+        //   `Q_NE   |  `D_NE   |  `S_NE   |  `H_NE      length of exponent
+        //   `Q_NF   |  `D_NF   |  `S_NF   |  `H_NF      length of fraction
+        //   `Q_BIAS |  `D_BIAS |  `S_BIAS |  `H_BIAS    exponent's bias value
+        //   `Q_FMT  |  `D_FMT  |  `S_FMT  |  `H_FMT     precision's format value - Q=11 D=01 S=00 H=10
+
+
+        logic  [`D_LEN-1:0]  Len1; // Remove NaN boxing or NaN, if not properly NaN boxed for double percision
+        logic  [`S_LEN-1:0]  Len2; // Remove NaN boxing or NaN, if not properly NaN boxed for single percision
+        logic  [`H_LEN-1:0]  Len3; // Remove NaN boxing or NaN, if not properly NaN boxed for half percision
+        
+        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for double precision
+        assign Len1 = &In[`Q_LEN-1:`D_LEN] ? In[`D_LEN-1:0] : {1'b0, {`D_NE+1{1'b1}}, (`D_NF-1)'(0)};
+
+        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for single precision
+        assign Len2 = &In[`Q_LEN-1:`S_LEN] ? In[`S_LEN-1:0] : {1'b0, {`S_NE+1{1'b1}}, (`S_NF-1)'(0)};
+
+        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for half precision
+        assign Len3 = &In[`Q_LEN-1:`H_LEN] ? In[`H_LEN-1:0] : {1'b0, {`H_NE+1{1'b1}}, (`H_NF-1)'(0)};
+
+
+        // There are 2 case statements
+        //      - one for other singals and one for sgn/exp/frac
+        //      - need two for the dependencies in the expoenent calculation
+        always_comb begin
+            case (FmtE)
+                2'b11: begin  // if input is quad percision
+
+                    // is the input (in it's original format) denormalized
+                    Denorm = ~|In[`Q_LEN-2:`Q_NF] & ~FracZero; 
+
+                    // is the exponent non-zero
+                    ExpNonZero = |In[`Q_LEN-2:`Q_NF]; 
+
+                    // is the exponent all 1's
+                    ExpMax = &In[`Q_LEN-2:`Q_NF];
+                end
+                2'b01: begin  // if input is double percision
+
+                    // is the exponent all 1's
+                    ExpMax = &Len1[`D_LEN-2:`D_NF];
+
+                    // is the input (in it's original format) denormalized
+                    Denorm = ~|Len1[`D_LEN-2:`D_NF] & ~FracZero; 
+
+                    // is the exponent non-zero
+                    ExpNonZero = |Len1[`D_LEN-2:`D_NF]; 
+                end
+                2'b00: begin      // if input is single percision
+
+                    // is the exponent all 1's
+                    ExpMax = &Len2[`S_LEN-2:`S_NF];
+
+                    // is the input (in it's original format) denormalized
+                    Denorm = ~|Len2[`S_LEN-2:`S_NF] & ~FracZero; 
+
+                    // is the exponent non-zero
+                    ExpNonZero = |Len2[`S_LEN-2:`S_NF]; 
+                end
+                2'b10: begin      // if input is half percision
+
+                    // is the exponent all 1's
+                    ExpMax = &Len3[`H_LEN-2:`H_NF];
+
+                    // is the input (in it's original format) denormalized
+                    Denorm = ~|Len3[`H_LEN-2:`H_NF] & ~FracZero; 
+
+                    // is the exponent non-zero
+                    ExpNonZero = |Len3[`H_LEN-2:`H_NF]; 
+                end
+            endcase
+        end
+
+        always_comb begin
+            case (FmtE)
+                2'b11: begin  // if input is quad percision
+                    // extract sign bit
+                    Sgn = In[`Q_LEN-1];
+
+                    // extract the exponent
+                    Exp = {In[`Q_LEN-2:`Q_NF+1], In[`Q_NF]|Denorm};
+
+                    // extract the fraction
+                    Frac = In[`Q_NF-1:0];
+                end
+                2'b01: begin  // if input is double percision
+                    // extract sign bit
+                    Sgn = Len1[`D_LEN-1];
+
+                    // example double to single conversion:
+                    // 1023 = 0011 1111 1111
+                    // 127  = 0000 0111 1111 (subtract this)
+                    // 896  = 0011 1000 0000
+                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
+                    // dexp = 0bdd dbbb bbbb 
+                    // also need to take into account possible zero/denorm/inf/NaN values
+                    
+                    // convert the double precsion exponent into quad precsion
+
+                    Exp = {Len1[`D_LEN-2], {`Q_NE-`D_NE{~Len1[`D_LEN-2]}}, Len1[`D_LEN-3:`D_NF+1], Len1[`D_NF]|Denorm}; 
+
+                    // extract the fraction and add the nessesary trailing zeros
+                    Frac = {Len1[`D_NF-1:0], (`Q_NF-`D_NF)'(0)};
+                end
+                2'b00: begin      // if input is single percision
+                    // extract sign bit
+                    Sgn = Len2[`S_LEN-1];
+
+                    // example double to single conversion:
+                    // 1023 = 0011 1111 1111
+                    // 127  = 0000 0111 1111 (subtract this)
+                    // 896  = 0011 1000 0000
+                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
+                    // dexp = 0bdd dbbb bbbb 
+                    // also need to take into account possible zero/denorm/inf/NaN values
+                    
+                    // convert the single precsion exponent into quad precsion
+                    Exp = {Len2[`S_LEN-2], {`Q_NE-`S_NE{~Len2[`S_LEN-2]}}, Len2[`S_LEN-3:`S_NF+1], Len2[`S_NF]|Denorm}; 
+
+                    // extract the fraction and add the nessesary trailing zeros
+                    Frac = {Len2[`S_NF-1:0], (`Q_NF-`S_NF)'(0)};
+                end
+                2'b10: begin      // if input is half percision
+                    // extract sign bit
+                    Sgn = Len3[`H_LEN-1];
+
+                    // example double to single conversion:
+                    // 1023 = 0011 1111 1111
+                    // 127  = 0000 0111 1111 (subtract this)
+                    // 896  = 0011 1000 0000
+                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
+                    // dexp = 0bdd dbbb bbbb 
+                    // also need to take into account possible zero/denorm/inf/NaN values
+
+                    // convert the half precsion exponent into quad precsion
+                    Exp = {Len3[`H_LEN-2], {`Q_NE-`H_NE{~Len3[`H_LEN-2]}}, Len3[`H_LEN-3:`H_NF+1], Len3[`H_NF]|Denorm}; 
+
+                    // extract the fraction and add the nessesary trailing zeros
+                    Frac = {Len3[`H_NF-1:0], (`Q_NF-`H_NF)'(0)};
+                end
+            endcase
+        end
+
+    end
+
+    // is the exponent all 0's
+    assign ExpZero = ~ExpNonZero;
+
+    // is the fraction zero
+    assign FracZero = ~|Frac;
+
+    // add the assumed one (or zero if denormal or zero) to create the mantissa
+    assign Man = {ExpNonZero, Frac};
+    
+    // is the input a NaN
+    //     - force to be a NaN if it isn't properly Nan Boxed
+    assign NaN = ExpMax & ~FracZero;
+
+    // is the input a singnaling NaN
+    assign SNaN = NaN&~Frac[`NF-1];
+
+    // is the input infinity
+    assign Inf = ExpMax & FracZero;
+
+    // is the input zero
+    assign Zero = ExpZero & FracZero;
+    
+endmodule
\ No newline at end of file
diff --git a/pipelined/src/generic/lzc.sv b/pipelined/src/generic/lzc.sv
index 5b1c22f9..1ce08247 100644
--- a/pipelined/src/generic/lzc.sv
+++ b/pipelined/src/generic/lzc.sv
@@ -1,14 +1,14 @@
 //leading zero counter i.e. priority encoder
 module lzc #(parameter WIDTH=1) (
     input logic  [WIDTH-1:0]            num,
-    output logic [$clog2(WIDTH)-1:0]  ZeroCnt
+    output logic [$clog2(WIDTH+1)-1:0]  ZeroCnt
 );
 /* verilator lint_off CMPCONST */
     
-    logic [$clog2(WIDTH)-1:0] i;
+    logic [$clog2(WIDTH+1)-1:0] i;
     always_comb begin
         i = 0;
-        while (~num[WIDTH-1-(32)'(i)] & $unsigned(i) <= $unsigned(($clog2(WIDTH))'(WIDTH-1))) i = i+1;  // search for leading one
+        while (~num[WIDTH-1-(32)'(i)] & $unsigned(i) <= $unsigned(($clog2(WIDTH+1))'(WIDTH-1))) i = i+1;  // search for leading one
         ZeroCnt = i;
     end
 /* verilator lint_on CMPCONST */

From f6ac33ce8a6f209dbf1907834461b1550e29d5d4 Mon Sep 17 00:00:00 2001
From: Katherine Parry <kparry4@gmail.com>
Date: Tue, 31 May 2022 17:40:34 +0000
Subject: [PATCH 03/14] reorginized unpackinput signals

---
 pipelined/src/fpu/unpackinput.sv | 371 +++++++++++--------------------
 1 file changed, 135 insertions(+), 236 deletions(-)

diff --git a/pipelined/src/fpu/unpackinput.sv b/pipelined/src/fpu/unpackinput.sv
index e8bd22fb..0b944b64 100644
--- a/pipelined/src/fpu/unpackinput.sv
+++ b/pipelined/src/fpu/unpackinput.sv
@@ -24,21 +24,24 @@ module unpackinput (
         // sign bit
         assign Sgn = In[`FLEN-1];
 
-        // exponent
-        assign Exp = {In[`FLEN-2:`NF+1], In[`NF]|Denorm};
-
         // fraction (no assumed 1)
         assign Frac = In[`NF-1:0];
+        
+        // is the fraction zero
+        assign FracZero = ~|Frac;
 
         // is the exponent non-zero
         assign ExpNonZero = |Exp; 
+        
+        // is the input (in it's original format) denormalized
+        assign Denorm = ~ExpNonZero & ~FracZero;
+
+        // exponent
+        assign Exp = {In[`FLEN-2:`NF+1], In[`NF]|Denorm};
+
 
         // is the exponent all 1's
         assign ExpMax = &Exp;
-
-
-        // is the input (in it's original format) denormalized
-        assign Denorm = ~|In[`FLEN-2:`NF] & ~FracZero; 
     
 
     end else if (`FPSIZES == 2) begin   // if there are 2 floating point formats supported
@@ -69,6 +72,18 @@ module unpackinput (
         // choose sign bit depending on format - 1=larger precsion 0=smaller precision
         assign Sgn = FmtE ? In[`FLEN-1] : Len1[`LEN1-1];
 
+        // extract the fraction, add trailing zeroes to the mantissa if nessisary
+        assign Frac = FmtE ? In[`NF-1:0] : {Len1[`NF1-1:0], (`NF-`NF1)'(0)};
+
+        // is the fraction zero
+        assign FracZero = ~|Frac;
+        
+        // is the exponent non-zero
+        assign ExpNonZero = FmtE ? |In[`FLEN-2:`NF] : |Len1[`LEN1-2:`NF1]; 
+
+        // is the input (in it's original format) denormalized
+        assign Denorm = ~ExpNonZero & ~FracZero;
+
         // example double to single conversion:
         // 1023 = 0011 1111 1111
         // 127  = 0000 0111 1111 (subtract this)
@@ -80,17 +95,8 @@ module unpackinput (
         // extract the exponent, converting the smaller exponent into the larger precision if nessisary
         //      - if the original precision had a denormal number convert the exponent value 1
         assign Exp = FmtE ? {In[`FLEN-2:`NF+1], In[`NF]|Denorm} : {Len1[`LEN1-2], {`NE-`NE1{~Len1[`LEN1-2]}}, Len1[`LEN1-3:`NF1+1], Len1[`NF1]|Denorm}; 
+ 
 
-        // is the input (in it's original format) denormalized
-
-                    // is the input (in it's original format) denormalized
-        assign Denorm = (FmtE ? ~|In[`FLEN-2:`NF] : ~|Len1[`LEN1-2:`NF1]) & ~FracZero; 
-
-        // extract the fraction, add trailing zeroes to the mantissa if nessisary
-        assign Frac = FmtE ? In[`NF-1:0] : {Len1[`NF1-1:0], (`NF-`NF1)'(0)};
-
-        // is the exponent non-zero
-        assign ExpNonZero = FmtE ? |In[`FLEN-2:`NF] : |Len1[`LEN1-2:`NF1]; 
 
         // is the exponent all 1's
         assign ExpMax = FmtE ? &In[`FLEN-2:`NF] : &Len1[`LEN1-2:`NF1];
@@ -124,109 +130,66 @@ module unpackinput (
         // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for smaller precision
         assign Len2 = &In[`FLEN-1:`LEN2] ? In[`LEN2-1:0] : {1'b0, {`NE2+1{1'b1}}, (`NF2-1)'(0)};
 
-        // There are 2 case statements
-        //      - one for other singals and one for sgn/exp/frac
-        //      - need two for the dependencies in the expoenent calculation
-        //*** pull out the ~FracZero and and it at the end
-        always_comb begin
+
+        // extract the sign bit
+        always_comb
             case (FmtE)
-                `FMT: begin // if input is largest precision (`FLEN - ie quad or double)
-
-                    // This is the original format so set OrigDenorm to 0
-                    Denorm = ~|In[`FLEN-2:`NF] & ~FracZero; 
-
-                    // is the exponent non-zero
-                    ExpNonZero = |In[`FLEN-2:`NF]; 
-
-                    // is the exponent all 1's
-                    ExpMax = &In[`FLEN-2:`NF];
-                end
-                `FMT1: begin    // if input is larger precsion (`LEN1 - double or single)
-
-                    // is the input (in it's original format) denormalized
-                    Denorm = ~|Len1[`LEN1-2:`NF1] & ~FracZero; 
-
-                    // is the exponent non-zero
-                    ExpNonZero = |Len1[`LEN1-2:`NF1]; 
-
-                    // is the exponent all 1's
-                    ExpMax = &Len1[`LEN1-2:`NF1];
-                end
-                `FMT2: begin        // if input is smallest precsion (`LEN2 - single or half)
-
-                    // is the input (in it's original format) denormalized
-                    Denorm = ~|Len2[`LEN2-2:`NF2] & ~FracZero; 
-
-                    // is the exponent non-zero
-                    ExpNonZero = |Len2[`LEN2-2:`NF2]; 
-
-                    // is the exponent all 1's
-                    ExpMax = &Len2[`LEN2-2:`NF2];
-                end
-                default: begin
-                    Denorm = 0; 
-                    ExpNonZero = 0; 
-                    ExpMax = 0;
-                end
+                `FMT:  Sgn = In[`FLEN-1];
+                `FMT1: Sgn = Len1[`LEN1-1];
+                `FMT2: Sgn = Len2[`LEN2-1];
+                default: Sgn = 0;
             endcase
-        end
-        always_comb begin
+
+        // extract the fraction
+        always_comb
             case (FmtE)
-                `FMT: begin // if input is largest precision (`FLEN - ie quad or double)
-                    // extract the sign bit
-                    Sgn = In[`FLEN-1];
-
-                    // extract the exponent
-                    Exp = {In[`FLEN-2:`NF+1], In[`NF]|Denorm};
-
-                    // extract the fraction
-                    Frac = In[`NF-1:0];
-                end
-                `FMT1: begin    // if input is larger precsion (`LEN1 - double or single)
-
-                    // extract the sign bit
-                    Sgn = Len1[`LEN1-1];
-
-                    // example double to single conversion:
-                    // 1023 = 0011 1111 1111
-                    // 127  = 0000 0111 1111 (subtract this)
-                    // 896  = 0011 1000 0000
-                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
-                    // dexp = 0bdd dbbb bbbb 
-                    // also need to take into account possible zero/denorm/inf/NaN values
-
-                    // convert the larger precision's exponent to use the largest precision's bias
-                    Exp = {Len1[`LEN1-2], {`NE-`NE1{~Len1[`LEN1-2]}}, Len1[`LEN1-3:`NF1+1], Len1[`NF1]|Denorm}; 
-
-                    // extract the fraction and add the nessesary trailing zeros
-                    Frac = {Len1[`NF1-1:0], (`NF-`NF1)'(0)};
-                end
-                `FMT2: begin        // if input is smallest precsion (`LEN2 - single or half)
-
-                    // exctract the sign bit
-                    Sgn = Len2[`LEN2-1];
-
-                    // example double to single conversion:
-                    // 1023 = 0011 1111 1111
-                    // 127  = 0000 0111 1111 (subtract this)
-                    // 896  = 0011 1000 0000
-                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
-                    // dexp = 0bdd dbbb bbbb 
-                    // also need to take into account possible zero/denorm/inf/NaN values
-                    
-                    // convert the smallest precision's exponent to use the largest precision's bias
-                    Exp = Denorm ? {1'b0, {`NE-`NE2{1'b1}}, (`NE2-1)'(1)} : {Len2[`LEN2-2], {`NE-`NE2{~Len2[`LEN2-2]}}, Len2[`LEN2-3:`NF2]}; 
-
-                    // extract the fraction and add the nessesary trailing zeros
-                    Frac = {Len2[`NF2-1:0], (`NF-`NF2)'(0)};
-                end
-                default: begin
-                    Sgn = 0;
-                    Exp = 0; 
-                    Frac = 0;
-                end
+                `FMT: Frac = In[`NF-1:0];
+                `FMT1: Frac = {Len1[`NF1-1:0], (`NF-`NF1)'(0)};
+                `FMT2: Frac = {Len2[`NF2-1:0], (`NF-`NF2)'(0)};
+                default: Frac = 0;
+            endcase
+
+        // is the fraction zero
+        assign FracZero = ~|Frac;
+
+
+        // is the exponent non-zero
+        always_comb
+            case (FmtE)
+                `FMT:  ExpNonZero = |In[`FLEN-2:`NF];     // if input is largest precision (`FLEN - ie quad or double)
+                `FMT1: ExpNonZero = |Len1[`LEN1-2:`NF1];  // if input is larger precsion (`LEN1 - double or single)
+                `FMT2: ExpNonZero = |Len2[`LEN2-2:`NF2]; // if input is smallest precsion (`LEN2 - single or half)
+                default: ExpNonZero = 0; 
+            endcase
+            
+        // is the input (in it's original format) denormalized
+        assign Denorm = ~ExpNonZero & ~FracZero;
+
+        // example double to single conversion:
+        // 1023 = 0011 1111 1111
+        // 127  = 0000 0111 1111 (subtract this)
+        // 896  = 0011 1000 0000
+        // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
+        // dexp = 0bdd dbbb bbbb 
+        // also need to take into account possible zero/denorm/inf/NaN values
+
+        // convert the larger precision's exponent to use the largest precision's bias
+        always_comb 
+            case (FmtE)
+                `FMT:  Exp = {In[`FLEN-2:`NF+1], In[`NF]|Denorm};
+                `FMT1: Exp = {Len1[`LEN1-2], {`NE-`NE1{~Len1[`LEN1-2]}}, Len1[`LEN1-3:`NF1+1], Len1[`NF1]|Denorm}; 
+                `FMT2: Exp = {Len2[`LEN2-2], {`NE-`NE2{~Len2[`LEN2-2]}}, Len2[`LEN2-3:`NF2+1], Len2[`NF2]|Denorm}; 
+                default: Exp = 0;
+            endcase
+
+        // is the exponent all 1's
+        always_comb
+            case (FmtE)
+                `FMT:  ExpMax = &In[`FLEN-2:`NF];
+                `FMT1: ExpMax = &Len1[`LEN1-2:`NF1];
+                `FMT2: ExpMax = &Len2[`LEN2-2:`NF2];
+                default: ExpMax = 0;
             endcase
-        end
 
     end else if (`FPSIZES == 4) begin      // if all precsisons are supported - quad, double, single, and half
     
@@ -252,137 +215,73 @@ module unpackinput (
         // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for half precision
         assign Len3 = &In[`Q_LEN-1:`H_LEN] ? In[`H_LEN-1:0] : {1'b0, {`H_NE+1{1'b1}}, (`H_NF-1)'(0)};
 
-
-        // There are 2 case statements
-        //      - one for other singals and one for sgn/exp/frac
-        //      - need two for the dependencies in the expoenent calculation
-        always_comb begin
+        // extract sign bit
+        always_comb
             case (FmtE)
-                2'b11: begin  // if input is quad percision
-
-                    // is the input (in it's original format) denormalized
-                    Denorm = ~|In[`Q_LEN-2:`Q_NF] & ~FracZero; 
-
-                    // is the exponent non-zero
-                    ExpNonZero = |In[`Q_LEN-2:`Q_NF]; 
-
-                    // is the exponent all 1's
-                    ExpMax = &In[`Q_LEN-2:`Q_NF];
-                end
-                2'b01: begin  // if input is double percision
-
-                    // is the exponent all 1's
-                    ExpMax = &Len1[`D_LEN-2:`D_NF];
-
-                    // is the input (in it's original format) denormalized
-                    Denorm = ~|Len1[`D_LEN-2:`D_NF] & ~FracZero; 
-
-                    // is the exponent non-zero
-                    ExpNonZero = |Len1[`D_LEN-2:`D_NF]; 
-                end
-                2'b00: begin      // if input is single percision
-
-                    // is the exponent all 1's
-                    ExpMax = &Len2[`S_LEN-2:`S_NF];
-
-                    // is the input (in it's original format) denormalized
-                    Denorm = ~|Len2[`S_LEN-2:`S_NF] & ~FracZero; 
-
-                    // is the exponent non-zero
-                    ExpNonZero = |Len2[`S_LEN-2:`S_NF]; 
-                end
-                2'b10: begin      // if input is half percision
-
-                    // is the exponent all 1's
-                    ExpMax = &Len3[`H_LEN-2:`H_NF];
-
-                    // is the input (in it's original format) denormalized
-                    Denorm = ~|Len3[`H_LEN-2:`H_NF] & ~FracZero; 
-
-                    // is the exponent non-zero
-                    ExpNonZero = |Len3[`H_LEN-2:`H_NF]; 
-                end
+                2'b11: Sgn = In[`Q_LEN-1];
+                2'b01: Sgn = Len1[`D_LEN-1];
+                2'b00: Sgn = Len2[`S_LEN-1];
+                2'b10: Sgn = Len3[`H_LEN-1];
             endcase
-        end
+            
 
-        always_comb begin
+        // extract the fraction
+        always_comb
             case (FmtE)
-                2'b11: begin  // if input is quad percision
-                    // extract sign bit
-                    Sgn = In[`Q_LEN-1];
-
-                    // extract the exponent
-                    Exp = {In[`Q_LEN-2:`Q_NF+1], In[`Q_NF]|Denorm};
-
-                    // extract the fraction
-                    Frac = In[`Q_NF-1:0];
-                end
-                2'b01: begin  // if input is double percision
-                    // extract sign bit
-                    Sgn = Len1[`D_LEN-1];
-
-                    // example double to single conversion:
-                    // 1023 = 0011 1111 1111
-                    // 127  = 0000 0111 1111 (subtract this)
-                    // 896  = 0011 1000 0000
-                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
-                    // dexp = 0bdd dbbb bbbb 
-                    // also need to take into account possible zero/denorm/inf/NaN values
-                    
-                    // convert the double precsion exponent into quad precsion
-
-                    Exp = {Len1[`D_LEN-2], {`Q_NE-`D_NE{~Len1[`D_LEN-2]}}, Len1[`D_LEN-3:`D_NF+1], Len1[`D_NF]|Denorm}; 
-
-                    // extract the fraction and add the nessesary trailing zeros
-                    Frac = {Len1[`D_NF-1:0], (`Q_NF-`D_NF)'(0)};
-                end
-                2'b00: begin      // if input is single percision
-                    // extract sign bit
-                    Sgn = Len2[`S_LEN-1];
-
-                    // example double to single conversion:
-                    // 1023 = 0011 1111 1111
-                    // 127  = 0000 0111 1111 (subtract this)
-                    // 896  = 0011 1000 0000
-                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
-                    // dexp = 0bdd dbbb bbbb 
-                    // also need to take into account possible zero/denorm/inf/NaN values
-                    
-                    // convert the single precsion exponent into quad precsion
-                    Exp = {Len2[`S_LEN-2], {`Q_NE-`S_NE{~Len2[`S_LEN-2]}}, Len2[`S_LEN-3:`S_NF+1], Len2[`S_NF]|Denorm}; 
-
-                    // extract the fraction and add the nessesary trailing zeros
-                    Frac = {Len2[`S_NF-1:0], (`Q_NF-`S_NF)'(0)};
-                end
-                2'b10: begin      // if input is half percision
-                    // extract sign bit
-                    Sgn = Len3[`H_LEN-1];
-
-                    // example double to single conversion:
-                    // 1023 = 0011 1111 1111
-                    // 127  = 0000 0111 1111 (subtract this)
-                    // 896  = 0011 1000 0000
-                    // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
-                    // dexp = 0bdd dbbb bbbb 
-                    // also need to take into account possible zero/denorm/inf/NaN values
-
-                    // convert the half precsion exponent into quad precsion
-                    Exp = {Len3[`H_LEN-2], {`Q_NE-`H_NE{~Len3[`H_LEN-2]}}, Len3[`H_LEN-3:`H_NF+1], Len3[`H_NF]|Denorm}; 
-
-                    // extract the fraction and add the nessesary trailing zeros
-                    Frac = {Len3[`H_NF-1:0], (`Q_NF-`H_NF)'(0)};
-                end
+                2'b11: Frac = In[`Q_NF-1:0];
+                2'b01: Frac = {Len1[`D_NF-1:0], (`Q_NF-`D_NF)'(0)};
+                2'b00: Frac = {Len2[`S_NF-1:0], (`Q_NF-`S_NF)'(0)};
+                2'b10: Frac = {Len3[`H_NF-1:0], (`Q_NF-`H_NF)'(0)};
+            endcase
+
+        // is the fraction zero
+        assign FracZero = ~|Frac;
+
+        // is the exponent non-zero
+        always_comb
+            case (FmtE)
+                2'b11: ExpNonZero = |In[`Q_LEN-2:`Q_NF];
+                2'b01: ExpNonZero = |Len1[`D_LEN-2:`D_NF];
+                2'b00: ExpNonZero = |Len2[`S_LEN-2:`S_NF]; 
+                2'b10: ExpNonZero = |Len3[`H_LEN-2:`H_NF]; 
+            endcase
+
+        // is the input (in it's original format) denormalized
+        assign Denorm = ~ExpNonZero & ~FracZero;
+
+
+        // example double to single conversion:
+        // 1023 = 0011 1111 1111
+        // 127  = 0000 0111 1111 (subtract this)
+        // 896  = 0011 1000 0000
+        // sexp = 0000 bbbb bbbb (add this) b = bit d = ~b 
+        // dexp = 0bdd dbbb bbbb 
+        // also need to take into account possible zero/denorm/inf/NaN values
+        
+        // convert the double precsion exponent into quad precsion
+        always_comb
+            case (FmtE)
+                2'b11: Exp = {In[`Q_LEN-2:`Q_NF+1], In[`Q_NF]|Denorm};
+                2'b01: Exp = {Len1[`D_LEN-2], {`Q_NE-`D_NE{~Len1[`D_LEN-2]}}, Len1[`D_LEN-3:`D_NF+1], Len1[`D_NF]|Denorm};
+                2'b00: Exp = {Len2[`S_LEN-2], {`Q_NE-`S_NE{~Len2[`S_LEN-2]}}, Len2[`S_LEN-3:`S_NF+1], Len2[`S_NF]|Denorm};
+                2'b10: Exp = {Len3[`H_LEN-2], {`Q_NE-`H_NE{~Len3[`H_LEN-2]}}, Len3[`H_LEN-3:`H_NF+1], Len3[`H_NF]|Denorm}; 
+            endcase
+
+
+        // is the exponent all 1's
+        always_comb 
+            case (FmtE)
+                2'b11: ExpMax = &In[`Q_LEN-2:`Q_NF];
+                2'b01: ExpMax = &Len1[`D_LEN-2:`D_NF];
+                2'b00: ExpMax = &Len2[`S_LEN-2:`S_NF];
+                2'b10: ExpMax = &Len3[`H_LEN-2:`H_NF];
             endcase
-        end
 
     end
 
     // is the exponent all 0's
     assign ExpZero = ~ExpNonZero;
 
-    // is the fraction zero
-    assign FracZero = ~|Frac;
-
     // add the assumed one (or zero if denormal or zero) to create the mantissa
     assign Man = {ExpNonZero, Frac};
     

From ae12cca9802e501f2a73868dd8b5f918c007c9b2 Mon Sep 17 00:00:00 2001
From: DTowersM <dtowersm@gmail.com>
Date: Tue, 31 May 2022 20:05:51 +0000
Subject: [PATCH 04/14] dummy start trigger and stop trigger support for make
 file

---
 benchmarks/embench/Makefile | 11 +++++++----
 1 file changed, 7 insertions(+), 4 deletions(-)

diff --git a/benchmarks/embench/Makefile b/benchmarks/embench/Makefile
index 28b012cd..0cb54e1a 100644
--- a/benchmarks/embench/Makefile
+++ b/benchmarks/embench/Makefile
@@ -1,4 +1,5 @@
 # Makefile added 1/20/22 David_Harris@hmc.edu
+# Expanded and developed by dtorres@hmc.edu
 # Compile Embench for Wally
 
 all: build sim
@@ -6,9 +7,9 @@ all: build sim
 allClean: clean all
 
 build:
-	../../addins/embench-iot/build_all.py --builddir=bd_speed --arch riscv32 --chip generic --board rv32wallyverilog --ldflags="-nostartfiles ../../../config/riscv32/boards/rv32wallyverilog/startup/crt0.S" --cflags="-nostartfiles" 
+	../../addins/embench-iot/build_all.py -v --builddir=bd_speed --arch riscv32 --chip generic --board rv32wallyverilog --ldflags="-nostartfiles ../../../config/riscv32/boards/rv32wallyverilog/startup/crt0.S" --cflags="-nostartfiles" 
 	find ../../addins/embench-iot/bd_speed/ -type f ! -name "*.*" | while read f; do cp "$$f" "$$f.elf"; done
-	../../addins/embench-iot/build_all.py --builddir=bd_size --arch riscv32 --chip generic --board rv32wallyverilog --ldflags="-nostdlib -nostartfiles" --cflags="-msave-restore" --dummy-libs="libgcc libm libc crt0"
+	../../addins/embench-iot/build_all.py -v --builddir=bd_size --arch riscv32 --chip generic --board rv32wallyverilog --ldflags="-nostdlib -nostartfiles ../../../config/riscv32/boards/rv32wallyverilog/startup/dummy.S" --cflags="-msave-restore" --dummy-libs="libgcc libm libc crt0"
 
 sim: modelSimBuild size speed
 
@@ -20,10 +21,10 @@ size:
 	../../addins/embench-iot/benchmark_size.py --builddir=bd_size
 
 speed:
-	../../addins/embench-iot/benchmark_speed.py --builddir=bd_speed --target-module run_wally --cpu-mhz=50
+	../../addins/embench-iot/benchmark_speed.py --builddir=bd_speed --target-module run_wally --cpu-mhz=1
 
 objdump:
-	find ../../addins/embench-iot/bd_speed/ -type f -name "*.elf" | while read f; do riscv64-unknown-elf-objdump -S "$$f" > "$$f.objdump"; done
+	find ../../addins/embench-iot/bd_speed/ -type f -name "*.elf" | while read f; do riscv64-unknown-elf-objdump -S -D "$$f" > "$$f.objdump"; done
 
 clean: 
 	rm -rf ../../addins/embench-iot/bd_speed/
@@ -37,3 +38,5 @@ clean:
 # ../../addins/embench-iot/build_all.py --arch riscv32 --chip generic --board rv32wallyverilog --cc riscv64-unknown-elf-gcc --cflags="-c -Os -ffunction-sections -nostdlib -march=rv32imac -mabi=ilp32" --ldflags="-Wl,-gc-sections -nostdlib -march=rv32imac -mabi=ilp32 -T../../../config/riscv32/boards/rv32wallyverilog/link.ld" --dummy-libs="libgcc libm libc"
 # --user-libs="-lm" 
 # riscv64-unknown-elf-gcc -O2 -g -nostartfiles -I/home/harris/riscv-wally/addins/embench-iot/support -I/home/harris/riscv-wally/addins/embench-iot/config/riscv32/boards/ri5cyverilator -I/home/harris/riscv-wally/addins/embench-iot/config/riscv32/chips/generic -I/home/harris/riscv-wally/addins/embench-iot/config/riscv32 -DCPU_MHZ=1 -DWARMUP_HEAT=1 -o main.o /home/harris/riscv-wally/addins/embench-iot/support/main.c
+
+# find ../../addins/embench-iot/bd_speed/ -type f -name "*.elf.objdump.lab" | while read f; do grep -n "begin_signature" $f | cut -f1 -d:

From 95df88ae70808a9e7943f652c25f1eeb9bd80b77 Mon Sep 17 00:00:00 2001
From: DTowersM <dtowersm@gmail.com>
Date: Tue, 31 May 2022 20:08:04 +0000
Subject: [PATCH 05/14] added embench tests to tests.vh

---
 pipelined/testbench/tests.vh | 32 +++++++++++++++++++++++++++++++-
 1 file changed, 31 insertions(+), 1 deletion(-)

diff --git a/pipelined/testbench/tests.vh b/pipelined/testbench/tests.vh
index dba197f5..d907d9a2 100644
--- a/pipelined/testbench/tests.vh
+++ b/pipelined/testbench/tests.vh
@@ -28,6 +28,7 @@
 `define WALLYTEST "2"
 `define MYIMPERASTEST   "3"
 `define COREMARK "4"
+`define EMBENCH "5"
 // *** remove MYIMPERASTEST cases when ported 
 
 string tvpaths[] = '{
@@ -35,15 +36,44 @@ string tvpaths[] = '{
     "../../addins/riscv-arch-test/work/",
     "../../tests/wally-riscv-arch-test/work/",
     "../../tests/imperas-riscv-tests/work/",
-    "../../benchmarks/riscv-coremark/work/"
+    "../../benchmarks/riscv-coremark/work/",
+    "../../addins/embench-iot/bd_speed/src/"
 };
 
+
+
    // *** make sure these are somewhere
   string coremark[] = '{
     `COREMARK,
     "coremark.bare.riscv", "100000"
   };
 
+  string embench[] = '{
+    `EMBENCH,
+    "aha-mont64/aha-mont64", "1080",
+    "crc32/crc32", "1080",
+    "cubic/cubic", "9080",
+    "edn/edn", "1080",
+    "huffbench/huffbench", "5080",
+    "matmult-int/matmult-int", "1080",
+    "md5sum/md5sum", "4080",
+    "minver/minver", "2080",
+    "nbody/nbody", "2080",
+    "nettle-aes/nettle-aes", "1080",
+    "nettle-sha256/nettle-sha256", "2080",
+    "nsichneu/nsichneu", "4080",
+    "picojpeg/picojpeg", "3080",
+    "primecount/primecount", "1080",
+    "qrduino/qrduino", "6080",
+    "sglib-combined/sglib-combined", "5080",
+    "slre/slre", "1080",
+    "st/st", "2080",
+    "statemate/statemate", "2080",
+    "tarfind/tarfind", "4080",
+    "ud/ud", "1080",
+    "wikisort/wikisort", "3080"
+  };
+
   string wally64a[] = '{
     `WALLYTEST,
     "rv64i_m/privilege/WALLY-amo", "2210",

From 0de54a01bf6a41c0d1019d702f9ee6e135330cbb Mon Sep 17 00:00:00 2001
From: DTowersM <dtowersm@gmail.com>
Date: Tue, 31 May 2022 20:09:48 +0000
Subject: [PATCH 06/14] removed delapidated signals SIE_REGW SIP_REGW TimerIntM
 SwIntM

---
 pipelined/regression/wave.do | 4 ----
 1 file changed, 4 deletions(-)

diff --git a/pipelined/regression/wave.do b/pipelined/regression/wave.do
index de6eb166..ab6cbc46 100644
--- a/pipelined/regression/wave.do
+++ b/pipelined/regression/wave.do
@@ -76,8 +76,6 @@ add wave -noupdate -group CSRs /testbench/dut/core/priv/priv/csr/PMPCFG_ARRAY_RE
 add wave -noupdate -group CSRs /testbench/dut/core/priv/priv/csr/SATP_REGW
 add wave -noupdate -group CSRs /testbench/dut/core/priv/priv/csr/SCOUNTEREN_REGW
 add wave -noupdate -group CSRs /testbench/dut/core/priv/priv/csr/SEPC_REGW
-add wave -noupdate -group CSRs /testbench/dut/core/priv/priv/csr/SIE_REGW
-add wave -noupdate -group CSRs /testbench/dut/core/priv/priv/csr/SIP_REGW
 add wave -noupdate -group CSRs /testbench/dut/core/priv/priv/csr/SSTATUS_REGW
 add wave -noupdate -group CSRs /testbench/dut/core/priv/priv/csr/STVEC_REGW
 add wave -noupdate -group Bpred -color Orange /testbench/dut/core/ifu/bpred/bpred/Predictor/DirPredictor/GHR
@@ -420,8 +418,6 @@ add wave -noupdate -group CLINT /testbench/dut/uncore/clint/clint/HRESPCLINT
 add wave -noupdate -group CLINT /testbench/dut/uncore/clint/clint/HREADYCLINT
 add wave -noupdate -group CLINT /testbench/dut/uncore/clint/clint/MTIME
 add wave -noupdate -group CLINT /testbench/dut/uncore/clint/clint/MTIMECMP
-add wave -noupdate -group CLINT /testbench/dut/uncore/clint/clint/TimerIntM
-add wave -noupdate -group CLINT /testbench/dut/uncore/clint/clint/SwIntM
 add wave -noupdate -group uart -expand -group {Bus Connection} /testbench/dut/uncore/uart/uart/HCLK
 add wave -noupdate -group uart -expand -group {Bus Connection} /testbench/dut/uncore/uart/uart/HRESETn
 add wave -noupdate -group uart -expand -group {Bus Connection} /testbench/dut/uncore/uart/uart/HSELUART

From 525f6a6069c8952c2c373f8124b1c2dedfb0c9ce Mon Sep 17 00:00:00 2001
From: DTowersM <dtowersm@gmail.com>
Date: Tue, 31 May 2022 20:13:32 +0000
Subject: [PATCH 07/14] added testbench.sv support for embench tests, test
 output still WIP

---
 pipelined/testbench/testbench.sv | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/pipelined/testbench/testbench.sv b/pipelined/testbench/testbench.sv
index fb338848..ba312292 100644
--- a/pipelined/testbench/testbench.sv
+++ b/pipelined/testbench/testbench.sv
@@ -119,6 +119,7 @@ logic [3:0] dummy;
         "wally32i":                       tests = wally32i; // *** redo
         "wally32e":                       tests = wally32e; 
         "wally32priv":                    tests = wally32priv; // *** redo
+        "embench":                        tests = embench;
       endcase
     end
     if (tests.size() == 0) begin
@@ -127,7 +128,7 @@ logic [3:0] dummy;
     end
   end
 
-  string signame, memfilename, pathname;
+  string signame, memfilename, pathname, objdumpfilename, adrstr;
 
   logic [31:0] GPIOPinsIn, GPIOPinsOut, GPIOPinsEn;
   logic UARTSin, UARTSout;

From aa7b0616e45f43b2cbaf3565aa798ee4a49815a0 Mon Sep 17 00:00:00 2001
From: David Harris <david_harris@hmc.edu>
Date: Tue, 31 May 2022 21:12:17 +0000
Subject: [PATCH 08/14] ../src/privileged/csrc.sv

---
 pipelined/src/privileged/privmode.sv | 11 +++++------
 pipelined/src/privileged/trap.sv     |  2 +-
 2 files changed, 6 insertions(+), 7 deletions(-)

diff --git a/pipelined/src/privileged/privmode.sv b/pipelined/src/privileged/privmode.sv
index 768d8a36..b0929642 100644
--- a/pipelined/src/privileged/privmode.sv
+++ b/pipelined/src/privileged/privmode.sv
@@ -44,12 +44,11 @@ module privmode (
     // PrivilegeMode FSM
     always_comb begin
       if (TrapM) begin // Change privilege based on DELEG registers (see 3.1.8)
-        if (`S_SUPPORTED & DelegateM)
-                          NextPrivilegeModeM = `S_MODE;
-        else              NextPrivilegeModeM = `M_MODE;
-      end else if (mretM) NextPrivilegeModeM = STATUS_MPP;
-      else if (sretM)     NextPrivilegeModeM = {1'b0, STATUS_SPP};
-      else                NextPrivilegeModeM = PrivilegeModeW;
+        if (`S_SUPPORTED & DelegateM) NextPrivilegeModeM = `S_MODE;
+        else                          NextPrivilegeModeM = `M_MODE;
+      end else if (mretM)             NextPrivilegeModeM = STATUS_MPP;
+      else if (sretM)                 NextPrivilegeModeM = {1'b0, STATUS_SPP};
+      else                            NextPrivilegeModeM = PrivilegeModeW;
     end
 
     flopenl #(2) privmodereg(clk, reset, ~StallW, NextPrivilegeModeM, `M_MODE, PrivilegeModeW);
diff --git a/pipelined/src/privileged/trap.sv b/pipelined/src/privileged/trap.sv
index 7bee52a0..35d680a6 100644
--- a/pipelined/src/privileged/trap.sv
+++ b/pipelined/src/privileged/trap.sv
@@ -64,7 +64,7 @@ module trap (
   assign IntPendingM = |PendingIntsM;
   assign ValidIntsM = {12{MIntGlobalEnM}} & PendingIntsM & ~MIDELEG_REGW | {12{SIntGlobalEnM}} & PendingIntsM & MIDELEG_REGW; 
   assign InterruptM = (|ValidIntsM) && InstrValidM && ~(CommittedM);  // *** RT. CommittedM is a temporary hack to prevent integer division from having an interrupt during divide.
-  assign DelegateM = (InterruptM ? MIDELEG_REGW[CauseM[3:0]] : MEDELEG_REGW[CauseM]) & 
+  assign DelegateM = `S_SUPPORTED & (InterruptM ? MIDELEG_REGW[CauseM[3:0]] : MEDELEG_REGW[CauseM]) & 
                      (PrivilegeModeW == `U_MODE | PrivilegeModeW == `S_MODE);
 
   ///////////////////////////////////////////

From f9533fea1a99b1634789dd8457740d1d55f0941f Mon Sep 17 00:00:00 2001
From: David Harris <david_harris@hmc.edu>
Date: Tue, 31 May 2022 21:32:31 +0000
Subject: [PATCH 09/14] Removed normalized output from unpack and simplified
 interface

---
 pipelined/src/fpu/fclassify.sv   |  4 ++--
 pipelined/src/fpu/fpu.sv         |  5 ++---
 pipelined/src/fpu/unpack.sv      | 13 +++---------
 pipelined/src/fpu/unpackinput.sv | 35 ++++++++------------------------
 4 files changed, 16 insertions(+), 41 deletions(-)

diff --git a/pipelined/src/fpu/fclassify.sv b/pipelined/src/fpu/fclassify.sv
index dd6165ca..05a91d21 100644
--- a/pipelined/src/fpu/fclassify.sv
+++ b/pipelined/src/fpu/fclassify.sv
@@ -5,7 +5,6 @@ module fclassify (
     input logic         XSgnE,  // sign bit
     input logic         XNaNE,  // is NaN
     input logic         XSNaNE, // is signaling NaN
-    input logic         XNormE, // is normal
     input logic         XDenormE, // is denormal
     input logic         XZeroE, // is zero
     input logic         XInfE,  // is infinity
@@ -14,9 +13,10 @@ module fclassify (
 
     logic PInf, PZero, PNorm, PDenorm;
     logic NInf, NZero, NNorm, NDenorm;
-
+    logic XNormE;
    
     // determine the sub categories
+    assign XNormE = ~(XNaNE | XInfE | XDenormE | XZeroE);
     assign PInf = ~XSgnE&XInfE;
     assign NInf = XSgnE&XInfE;
     assign PNorm = ~XSgnE&XNormE;
diff --git a/pipelined/src/fpu/fpu.sv b/pipelined/src/fpu/fpu.sv
index 053d3dd5..75781092 100755
--- a/pipelined/src/fpu/fpu.sv
+++ b/pipelined/src/fpu/fpu.sv
@@ -103,7 +103,6 @@ module fpu (
    logic 		  XInfM, YInfM, ZInfM;                // is the input infinity - memory stage
    logic 		  XInfQ, YInfQ;                       // is the input infinity - divide
    logic 		  XExpMaxE;                           // is the exponent all ones (max value)
-   logic 		  XNormE;                             // is normal
    logic 		  FmtQ;
    logic 		  FOpCtrlQ;     
 
@@ -178,7 +177,7 @@ module fpu (
    unpack unpack (.X(FSrcXE), .Y(FSrcYE), .Z(FSrcZE), .FmtE,
          .XSgnE, .YSgnE, .ZSgnE, .XExpE, .YExpE, .ZExpE, .XManE, .YManE, .ZManE, 
          .XNaNE, .YNaNE, .ZNaNE, .XSNaNE, .YSNaNE, .ZSNaNE, .XDenormE, .YDenormE, .ZDenormE, 
-         .XZeroE, .YZeroE, .ZZeroE, .XInfE, .YInfE, .ZInfE, .XExpMaxE, .XNormE);
+         .XZeroE, .YZeroE, .ZZeroE, .XInfE, .YInfE, .ZInfE, .XExpMaxE);
 
    // FMA
    //   - two stage FMA
@@ -215,7 +214,7 @@ module fpu (
    fcmp fcmp (.FmtE, .FOpCtrlE, .XSgnE, .YSgnE, .XExpE, .YExpE, .XManE, .YManE, 
             .XZeroE, .YZeroE, .XNaNE, .YNaNE, .XSNaNE, .YSNaNE, .FSrcXE, .FSrcYE, .CmpNVE, .CmpResE);
    fsgninj fsgninj(.SgnOpCodeE(FOpCtrlE[1:0]), .XSgnE, .YSgnE, .FSrcXE, .FmtE, .SgnResE);
-   fclassify fclassify (.XSgnE, .XDenormE, .XZeroE, .XNaNE, .XInfE, .XNormE, .XSNaNE, .ClassResE);
+   fclassify fclassify (.XSgnE, .XDenormE, .XZeroE, .XNaNE, .XInfE, .XSNaNE, .ClassResE);
    fcvt fcvt (.XSgnE, .XExpE, .XManE, .ForwardedSrcAE, .FOpCtrlE, .FWriteIntE, .XZeroE, .XDenormE,
               .XInfE, .XNaNE, .XSNaNE, .FrmE, .FmtE, .CvtResE, .CvtIntResE, .CvtFlgE);
 
diff --git a/pipelined/src/fpu/unpack.sv b/pipelined/src/fpu/unpack.sv
index 9e691e27..e9f005e7 100644
--- a/pipelined/src/fpu/unpack.sv
+++ b/pipelined/src/fpu/unpack.sv
@@ -6,7 +6,6 @@ module unpack (
     output logic                    XSgnE, YSgnE, ZSgnE,    // sign bits of XYZ
     output logic [`NE-1:0]          XExpE, YExpE, ZExpE,    // exponents of XYZ (converted to largest supported precision)
     output logic [`NF:0]            XManE, YManE, ZManE,    // mantissas of XYZ (converted to largest supported precision)
-    output logic                    XNormE,                 // is X a normalized number
     output logic                    XNaNE, YNaNE, ZNaNE,    // is XYZ a NaN
     output logic                    XSNaNE, YSNaNE, ZSNaNE, // is XYZ a signaling NaN
     output logic                    XDenormE, YDenormE, ZDenormE,   // is XYZ denormalized
@@ -18,23 +17,17 @@ module unpack (
     logic [`NF-1:0] XFracE, YFracE, ZFracE; //Fraction of XYZ
     logic           XExpNonzero, YExpNonzero, ZExpNonzero; // is the exponent of XYZ non-zero
     logic           XFracZero, YFracZero, ZFracZero; // is the fraction zero
-    logic           XExpZero, YExpZero, ZExpZero; // is the exponent zero
     logic           YExpMaxE, ZExpMaxE;  // is the exponent all 1s
     
     unpackinput unpackinputX (.In(X), .FmtE, .Sgn(XSgnE), .Exp(XExpE), .Man(XManE), 
                             .NaN(XNaNE), .SNaN(XSNaNE), .Denorm(XDenormE), 
-                            .Zero(XZeroE), .Inf(XInfE), .ExpMax(XExpMaxE), .ExpZero(XExpZero));
+                            .Zero(XZeroE), .Inf(XInfE), .ExpMax(XExpMaxE));
 
     unpackinput unpackinputY (.In(Y), .FmtE, .Sgn(YSgnE), .Exp(YExpE), .Man(YManE), 
                             .NaN(YNaNE), .SNaN(YSNaNE), .Denorm(YDenormE), 
-                            .Zero(YZeroE), .Inf(YInfE), .ExpMax(YExpMaxE), .ExpZero(YExpZero));
+                            .Zero(YZeroE), .Inf(YInfE), .ExpMax(YExpMaxE));
 
     unpackinput unpackinputZ (.In(Z), .FmtE, .Sgn(ZSgnE), .Exp(ZExpE), .Man(ZManE), 
                             .NaN(ZNaNE), .SNaN(ZSNaNE), .Denorm(ZDenormE), 
-                            .Zero(ZZeroE), .Inf(ZInfE), .ExpMax(ZExpMaxE), .ExpZero(ZExpZero));
-
-                            
-    // is X normalized
-    assign XNormE = ~(XExpMaxE|XExpZero);
-    
+                            .Zero(ZZeroE), .Inf(ZInfE), .ExpMax(ZExpMaxE));
 endmodule
\ No newline at end of file
diff --git a/pipelined/src/fpu/unpackinput.sv b/pipelined/src/fpu/unpackinput.sv
index 0b944b64..6b39d41c 100644
--- a/pipelined/src/fpu/unpackinput.sv
+++ b/pipelined/src/fpu/unpackinput.sv
@@ -11,39 +11,22 @@ module unpackinput (
     output logic                    Denorm,   // is XYZ denormalized
     output logic                    Zero,         // is XYZ zero
     output logic                    Inf,            // is XYZ infinity
-    output logic                    ExpMax,                        // does In have the maximum exponent (NaN or Inf)
-    output logic                    ExpZero                        // is the exponent zero
+    output logic                    ExpMax                       // does In have the maximum exponent (NaN or Inf)
 );
  
     logic [`NF-1:0] Frac; //Fraction of XYZ
     logic           ExpNonZero; // is the exponent of XYZ non-zero
     logic           FracZero; // is the fraction zero
+    logic           ExpZero;
     
     if (`FPSIZES == 1) begin        // if there is only one floating point format supported
-
-        // sign bit
-        assign Sgn = In[`FLEN-1];
-
-        // fraction (no assumed 1)
-        assign Frac = In[`NF-1:0];
-        
-        // is the fraction zero
-        assign FracZero = ~|Frac;
-
-        // is the exponent non-zero
-        assign ExpNonZero = |Exp; 
-        
-        // is the input (in it's original format) denormalized
-        assign Denorm = ~ExpNonZero & ~FracZero;
-
-        // exponent
-        assign Exp = {In[`FLEN-2:`NF+1], In[`NF]|Denorm};
-
-
-        // is the exponent all 1's
-        assign ExpMax = &Exp;
-    
-
+        assign Sgn = In[`FLEN-1];  // sign bit
+        assign Frac = In[`NF-1:0];  // fraction (no assumed 1)
+        assign FracZero = ~|Frac; // is the fraction zero?
+        assign ExpNonZero = |Exp;  // is the exponent non-zero
+        assign Denorm = ~ExpNonZero & ~FracZero; // is the input (in its original format) denormalized
+        assign Exp = {In[`FLEN-2:`NF+1], In[`NF]|Denorm};  // exponent.  Denormalized numbers have effective biased exponent of 1
+        assign ExpMax = &Exp;  // is the exponent all 1's
     end else if (`FPSIZES == 2) begin   // if there are 2 floating point formats supported
         //***need better names for these constants
         // largest format | smaller format

From 475a84491e94059482896c6e188313deb2baae97 Mon Sep 17 00:00:00 2001
From: David Harris <david_harris@hmc.edu>
Date: Tue, 31 May 2022 22:31:21 +0000
Subject: [PATCH 10/14] Unpackinput cleanup

---
 pipelined/src/fpu/unpackinput.sv | 27 ++++++++-------------------
 1 file changed, 8 insertions(+), 19 deletions(-)

diff --git a/pipelined/src/fpu/unpackinput.sv b/pipelined/src/fpu/unpackinput.sv
index 6b39d41c..9c58a444 100644
--- a/pipelined/src/fpu/unpackinput.sv
+++ b/pipelined/src/fpu/unpackinput.sv
@@ -262,23 +262,12 @@ module unpackinput (
 
     end
 
-    // is the exponent all 0's
-    assign ExpZero = ~ExpNonZero;
-
-    // add the assumed one (or zero if denormal or zero) to create the mantissa
-    assign Man = {ExpNonZero, Frac};
-    
-    // is the input a NaN
-    //     - force to be a NaN if it isn't properly Nan Boxed
-    assign NaN = ExpMax & ~FracZero;
-
-    // is the input a singnaling NaN
-    assign SNaN = NaN&~Frac[`NF-1];
-
-    // is the input infinity
-    assign Inf = ExpMax & FracZero;
-
-    // is the input zero
-    assign Zero = ExpZero & FracZero;
-    
+    // Output logic
+    assign ExpZero = ~ExpNonZero; // is the exponent all 0's?
+    assign Man = {ExpNonZero, Frac}; // add the assumed one (or zero if denormal or zero) to create the significand
+    //   ***  - force to be a NaN if it isn't properly Nan Boxed
+    assign NaN = ExpMax & ~FracZero; // is the input a NaN?
+    assign SNaN = NaN&~Frac[`NF-1]; // is the input a singnaling NaN?
+    assign Inf = ExpMax & FracZero; // is the input infinity?
+    assign Zero = ExpZero & FracZero; // is the input zero?
 endmodule
\ No newline at end of file

From 949f53695def9e808af913a6d028905424bc2277 Mon Sep 17 00:00:00 2001
From: cturek <cturek@hmc.edu>
Date: Wed, 1 Jun 2022 00:07:36 +0000
Subject: [PATCH 11/14] Fixed typos

---
 addins/riscv-arch-test |  2 +-
 pipelined/srt/srt.sv   | 12 ++++++------
 2 files changed, 7 insertions(+), 7 deletions(-)

diff --git a/addins/riscv-arch-test b/addins/riscv-arch-test
index be67c99b..307c77b2 160000
--- a/addins/riscv-arch-test
+++ b/addins/riscv-arch-test
@@ -1 +1 @@
-Subproject commit be67c99bd461742aa1c100bcc0732657faae2230
+Subproject commit 307c77b26e070ae85ffea665ad9b642b40e33c86
diff --git a/pipelined/srt/srt.sv b/pipelined/srt/srt.sv
index 835b1d1b..2275b93e 100644
--- a/pipelined/srt/srt.sv
+++ b/pipelined/srt/srt.sv
@@ -44,7 +44,7 @@ module srt #(parameter Nf=52) (
   input  logic [1:0] Fmt, // Floats: 00 = 16 bit, 01 = 32 bit, 10 = 64 bit, 11 = 128 bit
   input  logic       W64, // 32-bit ints on XLEN=64
   input  logic       Signed, // Interpret integers as signed 2's complement
-  input  logic       Int, // Choose integer inputss
+  input  logic       Int, // Choose integer inputs
   input  logic       Sqrt, // perform square root, not divide
   output logic       rsign,
   output logic [Nf-1:0] Quot, Rem, QuotOTFC, // *** later handle integers
@@ -52,7 +52,7 @@ module srt #(parameter Nf=52) (
   output logic [3:0] Flags
 );
 
-  logic          qp, qz, qm; // quotient is +1, 0, or -1
+  logic           qp, qz, qm; // quotient is +1, 0, or -1
   logic [`NE-1:0] calcExp;
   logic           calcSign;
   logic [Nf-1:0]  X, Dpreproc;
@@ -223,17 +223,17 @@ module otfc2 #(parameter N=52) (
   output logic [N-1:0] r
 );
 
-  // The on-the-fly converter transfers the quotient 
+  //  The on-the-fly converter transfers the quotient 
   //  bits to the quotient as they come. 
   //
-  // This code follows the psuedocode presented in the 
+  //  This code follows the psuedocode presented in the 
   //  floating point chapter of the book. Right now, 
   //  it is written for Radix-2 division.
   //
-  // QM is Q-1. It allows us to write negative bits 
+  //  QM is Q-1. It allows us to write negative bits 
   //  without using a costly CPA. 
   logic [N+2:0] Q, QM, QNext, QMNext;
-  // QR and QMR are the shifted versions of Q and QM.
+  //  QR and QMR are the shifted versions of Q and QM.
   //  They are treated as [N-1:r] size signals, and 
   //  discard the r most significant bits of Q and QM. 
   logic [N+1:0] QR, QMR;

From dd19e55b8f731736937800fe0e3d0f5fbbb11ecd Mon Sep 17 00:00:00 2001
From: Katherine Parry <kparry4@gmail.com>
Date: Wed, 1 Jun 2022 16:52:21 +0000
Subject: [PATCH 12/14] unpacker optimizations

---
 addins/riscv-arch-test              |   2 +-
 pipelined/src/fpu/fma.sv            |  21 ++--
 pipelined/src/fpu/fpu.sv            |   4 +-
 pipelined/src/fpu/unpack.sv         |  19 ++--
 pipelined/src/fpu/unpackinput.sv    | 152 +++++++++++-----------------
 pipelined/testbench/testbench-fp.sv |  41 ++++----
 6 files changed, 105 insertions(+), 134 deletions(-)

diff --git a/addins/riscv-arch-test b/addins/riscv-arch-test
index 307c77b2..be67c99b 160000
--- a/addins/riscv-arch-test
+++ b/addins/riscv-arch-test
@@ -1 +1 @@
-Subproject commit 307c77b26e070ae85ffea665ad9b642b40e33c86
+Subproject commit be67c99bd461742aa1c100bcc0732657faae2230
diff --git a/pipelined/src/fpu/fma.sv b/pipelined/src/fpu/fma.sv
index 5d16ccc5..f160d3ea 100644
--- a/pipelined/src/fpu/fma.sv
+++ b/pipelined/src/fpu/fma.sv
@@ -472,7 +472,7 @@ module fma2(
     // Select the result
     ///////////////////////////////////////////////////////////////////////////////
 
-    resultselect resultselect(.XSgnM, .YSgnM, .ZExpM, .XManM, .YManM, .ZManM, .ZDenormM,
+    resultselect resultselect(.XSgnM, .YSgnM, .ZExpM, .XManM, .YManM, .ZManM, .ZDenormM, .ZZeroM,
         .FrmM, .FmtM, .AddendStickyM, .KillProdM, .XInfM, .YInfM, .ZInfM, .XNaNM, .YNaNM, .ZNaNM, .RoundAdd,
         .ZSgnEffM, .PSgnM, .ResultSgn, .CalcPlus1, .Invalid, .Overflow, .Underflow, 
         .ResultDenorm, .ResultExp, .ResultFrac, .FMAResM);
@@ -1002,6 +1002,7 @@ module resultselect(
     input logic                     XInfM, YInfM, ZInfM,    // inputs are infinity
     input logic                     XNaNM, YNaNM, ZNaNM,    // inputs are NaN
     input logic                     ZDenormM, // is the original precision denormalized
+    input logic 		            ZZeroM,
     input logic                     ZSgnEffM,   // the modified Z sign - depends on instruction
     input logic                     PSgnM,      // the product's sign
     input logic                     ResultSgn,  // the result's sign
@@ -1027,7 +1028,7 @@ module resultselect(
         end
         assign OverflowResult =  ((FrmM[1:0]==2'b01) | (FrmM[1:0]==2'b10&~ResultSgn) | (FrmM[1:0]==2'b11&ResultSgn)) ? {ResultSgn, {`NE-1{1'b1}}, 1'b0, {`NF{1'b1}}} :
                                                                                                                     {ResultSgn, {`NE{1'b1}}, {`NF{1'b0}}};
-        assign KillProdResult = {ResultSgn, {ZExpM[`NE-1:1], ZExpM[0]&~ZDenormM, ZManM[`NF-1:0]} + (RoundAdd[`FLEN-2:0]&{`FLEN-1{AddendStickyM}})};
+        assign KillProdResult = {ResultSgn, {ZExpM[`NE-1:1], ZExpM[0]&~(ZDenormM|ZZeroM), ZManM[`NF-1:0]} + (RoundAdd[`FLEN-2:0]&{`FLEN-1{AddendStickyM}})};
         assign UnderflowResult = {ResultSgn, {`FLEN-1{1'b0}}} + {(`FLEN-1)'(0),(CalcPlus1&(AddendStickyM|FrmM[1]))};
         assign InfResult = {InfSgn, {`NE{1'b1}}, (`NF)'(0)};
         assign NormResult = {ResultSgn, ResultExp, ResultFrac};
@@ -1046,7 +1047,7 @@ module resultselect(
                                                                                                                             {ResultSgn, {`NE{1'b1}}, {`NF{1'b0}}} :
                                         ((FrmM[1:0]==2'b01) | (FrmM[1:0]==2'b10&~ResultSgn) | (FrmM[1:0]==2'b11&ResultSgn)) ? {{`FLEN-`LEN1{1'b1}}, ResultSgn, {`NE1-1{1'b1}}, 1'b0, {`NF1{1'b1}}} :
                                                                                                                             {{`FLEN-`LEN1{1'b1}}, ResultSgn, {`NE1{1'b1}}, (`NF1)'(0)};
-        assign KillProdResult = FmtM ? {ResultSgn, {ZExpM[`NE-1:1], ZExpM[0]&~ZDenormM, ZManM[`NF-1:0]} + (RoundAdd[`FLEN-2:0]&{`FLEN-1{AddendStickyM}})} : {{`FLEN-`LEN1{1'b1}}, ResultSgn, {ZExpM[`NE-1], ZExpM[`NE1-2:1], ZExpM[0]&~ZDenormM, ZManM[`NF-1:`NF-`NF1]} + (RoundAdd[`NF-`NF1+`LEN1-2:`NF-`NF1]&{`LEN1-1{AddendStickyM}})};
+        assign KillProdResult = FmtM ? {ResultSgn, {ZExpM[`NE-1:1], ZExpM[0]&~(ZDenormM|ZZeroM), ZManM[`NF-1:0]} + (RoundAdd[`FLEN-2:0]&{`FLEN-1{AddendStickyM}})} : {{`FLEN-`LEN1{1'b1}}, ResultSgn, {ZExpM[`NE-1], ZExpM[`NE1-2:1], ZExpM[0]&~(ZDenormM|ZZeroM), ZManM[`NF-1:`NF-`NF1]} + (RoundAdd[`NF-`NF1+`LEN1-2:`NF-`NF1]&{`LEN1-1{AddendStickyM}})};
         assign UnderflowResult = FmtM ? {ResultSgn, {`FLEN-1{1'b0}}} + {(`FLEN-1)'(0),(CalcPlus1&(AddendStickyM|FrmM[1]))} : {{`FLEN-`LEN1{1'b1}}, {ResultSgn, (`LEN1-1)'(0)} + {(`LEN1-1)'(0), (CalcPlus1&(AddendStickyM|FrmM[1]))}};
         assign InfResult = FmtM ? {InfSgn, {`NE{1'b1}}, (`NF)'(0)} : {{`FLEN-`LEN1{1'b1}}, InfSgn, {`NE1{1'b1}}, (`NF1)'(0)};
         assign NormResult = FmtM ? {ResultSgn, ResultExp, ResultFrac} : {{`FLEN-`LEN1{1'b1}}, ResultSgn, ResultExp[`NE1-1:0], ResultFrac[`NF-1:`NF-`NF1]};
@@ -1066,7 +1067,7 @@ module resultselect(
                     
                     OverflowResult = ((FrmM[1:0]==2'b01) | (FrmM[1:0]==2'b10&~ResultSgn) | (FrmM[1:0]==2'b11&ResultSgn)) ? {ResultSgn, {`NE-1{1'b1}}, 1'b0, {`NF{1'b1}}} :
                                                                                                                                         {ResultSgn, {`NE{1'b1}}, {`NF{1'b0}}};
-                    KillProdResult = {ResultSgn, {ZExpM[`NE-1:1], ZExpM[0]&~ZDenormM, ZManM[`NF-1:0]} + (RoundAdd[`FLEN-2:0]&{`FLEN-1{AddendStickyM}})};
+                    KillProdResult = {ResultSgn, {ZExpM[`NE-1:1], ZExpM[0]&~(ZDenormM|ZZeroM), ZManM[`NF-1:0]} + (RoundAdd[`FLEN-2:0]&{`FLEN-1{AddendStickyM}})};
                     UnderflowResult = {ResultSgn, {`FLEN-1{1'b0}}} + {(`FLEN-1)'(0),(CalcPlus1&(AddendStickyM|FrmM[1]))};
                     InfResult = {InfSgn, {`NE{1'b1}}, (`NF)'(0)};
                     NormResult = {ResultSgn, ResultExp, ResultFrac};
@@ -1082,7 +1083,7 @@ module resultselect(
                     end
                     OverflowResult = ((FrmM[1:0]==2'b01) | (FrmM[1:0]==2'b10&~ResultSgn) | (FrmM[1:0]==2'b11&ResultSgn)) ? {{`FLEN-`LEN1{1'b1}}, ResultSgn, {`NE1-1{1'b1}}, 1'b0, {`NF1{1'b1}}} :
                                                                                                                                   {{`FLEN-`LEN1{1'b1}}, ResultSgn, {`NE1{1'b1}}, (`NF1)'(0)};
-                    KillProdResult = {{`FLEN-`LEN1{1'b1}}, ResultSgn, {ZExpM[`NE-1], ZExpM[`NE1-2:1], ZExpM[0]&~ZDenormM, ZManM[`NF-1:`NF-`NF1]} + (RoundAdd[`NF-`NF1+`LEN1-2:`NF-`NF1]&{`LEN1-1{AddendStickyM}})};
+                    KillProdResult = {{`FLEN-`LEN1{1'b1}}, ResultSgn, {ZExpM[`NE-1], ZExpM[`NE1-2:1], ZExpM[0]&~(ZDenormM|ZZeroM), ZManM[`NF-1:`NF-`NF1]} + (RoundAdd[`NF-`NF1+`LEN1-2:`NF-`NF1]&{`LEN1-1{AddendStickyM}})};
                     UnderflowResult = {{`FLEN-`LEN1{1'b1}}, {ResultSgn, (`LEN1-1)'(0)} + {(`LEN1-1)'(0), (CalcPlus1&(AddendStickyM|FrmM[1]))}};
                     InfResult = {{`FLEN-`LEN1{1'b1}}, InfSgn, {`NE1{1'b1}}, (`NF1)'(0)};
                     NormResult = {{`FLEN-`LEN1{1'b1}}, ResultSgn, ResultExp[`NE1-1:0], ResultFrac[`NF-1:`NF-`NF1]};
@@ -1099,7 +1100,7 @@ module resultselect(
                     
                     OverflowResult = ((FrmM[1:0]==2'b01) | (FrmM[1:0]==2'b10&~ResultSgn) | (FrmM[1:0]==2'b11&ResultSgn)) ? {{`FLEN-`LEN2{1'b1}}, ResultSgn, {`NE2-1{1'b1}}, 1'b0, {`NF2{1'b1}}} :
                                                                                                                                   {{`FLEN-`LEN2{1'b1}}, ResultSgn, {`NE2{1'b1}}, (`NF2)'(0)};
-                    KillProdResult = {{`FLEN-`LEN2{1'b1}}, ResultSgn, {ZExpM[`NE-1], ZExpM[`NE2-2:1], ZExpM[0]&~ZDenormM, ZManM[`NF-1:`NF-`NF2]} + (RoundAdd[`NF-`NF2+`LEN2-2:`NF-`NF2]&{`LEN2-1{AddendStickyM}})};
+                    KillProdResult = {{`FLEN-`LEN2{1'b1}}, ResultSgn, {ZExpM[`NE-1], ZExpM[`NE2-2:1], ZExpM[0]&~(ZDenormM|ZZeroM), ZManM[`NF-1:`NF-`NF2]} + (RoundAdd[`NF-`NF2+`LEN2-2:`NF-`NF2]&{`LEN2-1{AddendStickyM}})};
                     UnderflowResult = {{`FLEN-`LEN2{1'b1}}, {ResultSgn, (`LEN2-1)'(0)} + {(`LEN2-1)'(0), (CalcPlus1&(AddendStickyM|FrmM[1]))}};
                     InfResult = {{`FLEN-`LEN2{1'b1}}, InfSgn, {`NE2{1'b1}}, (`NF2)'(0)};
                     NormResult = {{`FLEN-`LEN2{1'b1}}, ResultSgn, ResultExp[`NE2-1:0], ResultFrac[`NF-1:`NF-`NF2]};
@@ -1137,7 +1138,7 @@ module resultselect(
                     
                     OverflowResult = ((FrmM[1:0]==2'b01) | (FrmM[1:0]==2'b10&~ResultSgn) | (FrmM[1:0]==2'b11&ResultSgn)) ? {ResultSgn, {`NE-1{1'b1}}, 1'b0, {`NF{1'b1}}} :
                                                                                                                                         {ResultSgn, {`NE{1'b1}}, {`NF{1'b0}}};
-                    KillProdResult = {ResultSgn, {ZExpM[`Q_NE-1:1], ZExpM[0]&~ZDenormM, ZManM[`NF-1:0]} + (RoundAdd[`FLEN-2:0]&{`FLEN-1{AddendStickyM}})};
+                    KillProdResult = {ResultSgn, {ZExpM[`Q_NE-1:1], ZExpM[0]&~(ZDenormM|ZZeroM), ZManM[`NF-1:0]} + (RoundAdd[`FLEN-2:0]&{`FLEN-1{AddendStickyM}})};
                     UnderflowResult = {ResultSgn, {`FLEN-1{1'b0}}} + {(`FLEN-1)'(0),(CalcPlus1&(AddendStickyM|FrmM[1]))};
                     InfResult = {InfSgn, {`NE{1'b1}}, (`NF)'(0)};
                     NormResult = {ResultSgn, ResultExp, ResultFrac};
@@ -1153,7 +1154,7 @@ module resultselect(
                     end
                     OverflowResult = ((FrmM[1:0]==2'b01) | (FrmM[1:0]==2'b10&~ResultSgn) | (FrmM[1:0]==2'b11&ResultSgn)) ? {{`FLEN-`D_LEN{1'b1}}, ResultSgn, {`D_NE-1{1'b1}}, 1'b0, {`D_NF{1'b1}}} :
                                                                                                                                   {{`FLEN-`D_LEN{1'b1}}, ResultSgn, {`D_NE{1'b1}}, (`D_NF)'(0)};
-                    KillProdResult = {{`FLEN-`D_LEN{1'b1}}, ResultSgn, {ZExpM[`NE-1], ZExpM[`D_NE-2:1], ZExpM[0]&~ZDenormM, ZManM[`NF-1:`NF-`D_NF]} + (RoundAdd[`NF-`D_NF+`D_LEN-2:`NF-`D_NF]&{`D_LEN-1{AddendStickyM}})};
+                    KillProdResult = {{`FLEN-`D_LEN{1'b1}}, ResultSgn, {ZExpM[`NE-1], ZExpM[`D_NE-2:1], ZExpM[0]&~(ZDenormM|ZZeroM), ZManM[`NF-1:`NF-`D_NF]} + (RoundAdd[`NF-`D_NF+`D_LEN-2:`NF-`D_NF]&{`D_LEN-1{AddendStickyM}})};
                     UnderflowResult = {{`FLEN-`D_LEN{1'b1}}, {ResultSgn, (`D_LEN-1)'(0)} + {(`D_LEN-1)'(0), (CalcPlus1&(AddendStickyM|FrmM[1]))}};
                     InfResult = {{`FLEN-`D_LEN{1'b1}}, InfSgn, {`D_NE{1'b1}}, (`D_NF)'(0)};
                     NormResult = {{`FLEN-`D_LEN{1'b1}}, ResultSgn, ResultExp[`D_NE-1:0], ResultFrac[`NF-1:`NF-`D_NF]};
@@ -1170,7 +1171,7 @@ module resultselect(
                     
                     OverflowResult = ((FrmM[1:0]==2'b01) | (FrmM[1:0]==2'b10&~ResultSgn) | (FrmM[1:0]==2'b11&ResultSgn)) ? {{`FLEN-`S_LEN{1'b1}}, ResultSgn, {`S_NE-1{1'b1}}, 1'b0, {`S_NF{1'b1}}} :
                                                                                                                                   {{`FLEN-`S_LEN{1'b1}}, ResultSgn, {`S_NE{1'b1}}, (`S_NF)'(0)};
-                    KillProdResult = {{`FLEN-`S_LEN{1'b1}}, ResultSgn, {ZExpM[`NE-1], ZExpM[`S_NE-2:1], ZExpM[0]&~ZDenormM, ZManM[`NF-1:`NF-`S_NF]} + (RoundAdd[`NF-`S_NF+`S_LEN-2:`NF-`S_NF]&{`S_LEN-1{AddendStickyM}})};
+                    KillProdResult = {{`FLEN-`S_LEN{1'b1}}, ResultSgn, {ZExpM[`NE-1], ZExpM[`S_NE-2:1], ZExpM[0]&~(ZDenormM|ZZeroM), ZManM[`NF-1:`NF-`S_NF]} + (RoundAdd[`NF-`S_NF+`S_LEN-2:`NF-`S_NF]&{`S_LEN-1{AddendStickyM}})};
                     UnderflowResult = {{`FLEN-`S_LEN{1'b1}}, {ResultSgn, (`S_LEN-1)'(0)} + {(`S_LEN-1)'(0), (CalcPlus1&(AddendStickyM|FrmM[1]))}};
                     InfResult = {{`FLEN-`S_LEN{1'b1}}, InfSgn, {`S_NE{1'b1}}, (`S_NF)'(0)};
                     NormResult = {{`FLEN-`S_LEN{1'b1}}, ResultSgn, ResultExp[`S_NE-1:0], ResultFrac[`NF-1:`NF-`S_NF]};
@@ -1188,7 +1189,7 @@ module resultselect(
                     OverflowResult = ((FrmM[1:0]==2'b01) | (FrmM[1:0]==2'b10&~ResultSgn) | (FrmM[1:0]==2'b11&ResultSgn)) ? {{`FLEN-`H_LEN{1'b1}}, ResultSgn, {`H_NE-1{1'b1}}, 1'b0, {`H_NF{1'b1}}} :
                                                                                                               {{`FLEN-`H_LEN{1'b1}}, ResultSgn, {`H_NE{1'b1}}, (`H_NF)'(0)};      
 
-                    KillProdResult = {{`FLEN-`H_LEN{1'b1}}, ResultSgn, {ZExpM[`NE-1], ZExpM[`H_NE-2:1],ZExpM[0]&~ZDenormM, ZManM[`NF-1:`NF-`H_NF]} + (RoundAdd[`NF-`H_NF+`H_LEN-2:`NF-`H_NF]&{`H_LEN-1{AddendStickyM}})};
+                    KillProdResult = {{`FLEN-`H_LEN{1'b1}}, ResultSgn, {ZExpM[`NE-1], ZExpM[`H_NE-2:1],ZExpM[0]&~(ZDenormM|ZZeroM), ZManM[`NF-1:`NF-`H_NF]} + (RoundAdd[`NF-`H_NF+`H_LEN-2:`NF-`H_NF]&{`H_LEN-1{AddendStickyM}})};
                     UnderflowResult = {{`FLEN-`H_LEN{1'b1}}, {ResultSgn, (`H_LEN-1)'(0)} + {(`H_LEN-1)'(0), (CalcPlus1&(AddendStickyM|FrmM[1]))}};
                     InfResult = {{`FLEN-`H_LEN{1'b1}}, InfSgn, {`H_NE{1'b1}}, (`H_NF)'(0)};
                     NormResult = {{`FLEN-`H_LEN{1'b1}}, ResultSgn, ResultExp[`H_NE-1:0], ResultFrac[`NF-1:`NF-`H_NF]};
diff --git a/pipelined/src/fpu/fpu.sv b/pipelined/src/fpu/fpu.sv
index 75781092..113403c9 100755
--- a/pipelined/src/fpu/fpu.sv
+++ b/pipelined/src/fpu/fpu.sv
@@ -95,7 +95,7 @@ module fpu (
    logic 		  XNaNQ, YNaNQ;                       // is the input a NaN - divide
    logic 		  XSNaNE, YSNaNE, ZSNaNE;             // is the input a signaling NaN - execute stage
    logic 		  XSNaNM, YSNaNM, ZSNaNM;             // is the input a signaling NaN - memory stage
-   logic 		  XDenormE, YDenormE, ZDenormE;       // is the input denormalized
+   logic 		  XDenormE, ZDenormE;       // is the input denormalized
    logic 		  XZeroE, YZeroE, ZZeroE;             // is the input zero - execute stage
    logic 		  XZeroM, YZeroM, ZZeroM;             // is the input zero - memory stage
    logic 		  XZeroQ, YZeroQ;                     // is the input zero - divide
@@ -176,7 +176,7 @@ module fpu (
    //    - does some classifications (SNaN, NaN, Denorm, Norm, Zero, Infifnity)
    unpack unpack (.X(FSrcXE), .Y(FSrcYE), .Z(FSrcZE), .FmtE,
          .XSgnE, .YSgnE, .ZSgnE, .XExpE, .YExpE, .ZExpE, .XManE, .YManE, .ZManE, 
-         .XNaNE, .YNaNE, .ZNaNE, .XSNaNE, .YSNaNE, .ZSNaNE, .XDenormE, .YDenormE, .ZDenormE, 
+         .XNaNE, .YNaNE, .ZNaNE, .XSNaNE, .YSNaNE, .ZSNaNE, .XDenormE, .ZDenormE, 
          .XZeroE, .YZeroE, .ZZeroE, .XInfE, .YInfE, .ZInfE, .XExpMaxE);
 
    // FMA
diff --git a/pipelined/src/fpu/unpack.sv b/pipelined/src/fpu/unpack.sv
index e9f005e7..e28b2efe 100644
--- a/pipelined/src/fpu/unpack.sv
+++ b/pipelined/src/fpu/unpack.sv
@@ -8,26 +8,29 @@ module unpack (
     output logic [`NF:0]            XManE, YManE, ZManE,    // mantissas of XYZ (converted to largest supported precision)
     output logic                    XNaNE, YNaNE, ZNaNE,    // is XYZ a NaN
     output logic                    XSNaNE, YSNaNE, ZSNaNE, // is XYZ a signaling NaN
-    output logic                    XDenormE, YDenormE, ZDenormE,   // is XYZ denormalized
+    output logic                    XDenormE, ZDenormE,   // is XYZ denormalized
     output logic                    XZeroE, YZeroE, ZZeroE,         // is XYZ zero
     output logic                    XInfE, YInfE, ZInfE,            // is XYZ infinity
     output logic                    XExpMaxE                        // does X have the maximum exponent (NaN or Inf)
 );
  
     logic [`NF-1:0] XFracE, YFracE, ZFracE; //Fraction of XYZ
-    logic           XExpNonzero, YExpNonzero, ZExpNonzero; // is the exponent of XYZ non-zero
+    logic           XExpNonZero, YExpNonZero, ZExpNonZero; // is the exponent of XYZ non-zero
     logic           XFracZero, YFracZero, ZFracZero; // is the fraction zero
     logic           YExpMaxE, ZExpMaxE;  // is the exponent all 1s
     
     unpackinput unpackinputX (.In(X), .FmtE, .Sgn(XSgnE), .Exp(XExpE), .Man(XManE), 
-                            .NaN(XNaNE), .SNaN(XSNaNE), .Denorm(XDenormE), 
-                            .Zero(XZeroE), .Inf(XInfE), .ExpMax(XExpMaxE));
+                            .NaN(XNaNE), .SNaN(XSNaNE), .ExpNonZero(XExpNonZero),
+                            .Zero(XZeroE), .Inf(XInfE), .ExpMax(XExpMaxE), .FracZero(XFracZero));
 
     unpackinput unpackinputY (.In(Y), .FmtE, .Sgn(YSgnE), .Exp(YExpE), .Man(YManE), 
-                            .NaN(YNaNE), .SNaN(YSNaNE), .Denorm(YDenormE), 
-                            .Zero(YZeroE), .Inf(YInfE), .ExpMax(YExpMaxE));
+                            .NaN(YNaNE), .SNaN(YSNaNE), .ExpNonZero(YExpNonZero),
+                            .Zero(YZeroE), .Inf(YInfE), .ExpMax(YExpMaxE), .FracZero(YFracZero));
 
     unpackinput unpackinputZ (.In(Z), .FmtE, .Sgn(ZSgnE), .Exp(ZExpE), .Man(ZManE), 
-                            .NaN(ZNaNE), .SNaN(ZSNaNE), .Denorm(ZDenormE), 
-                            .Zero(ZZeroE), .Inf(ZInfE), .ExpMax(ZExpMaxE));
+                            .NaN(ZNaNE), .SNaN(ZSNaNE), .ExpNonZero(ZExpNonZero),
+                            .Zero(ZZeroE), .Inf(ZInfE), .ExpMax(ZExpMaxE), .FracZero(ZFracZero));
+    // is the input denormalized
+    assign XDenormE = ~XExpNonZero & ~XFracZero;
+    assign ZDenormE = ~ZExpNonZero & ~ZFracZero;
 endmodule
\ No newline at end of file
diff --git a/pipelined/src/fpu/unpackinput.sv b/pipelined/src/fpu/unpackinput.sv
index 9c58a444..434a5bf0 100644
--- a/pipelined/src/fpu/unpackinput.sv
+++ b/pipelined/src/fpu/unpackinput.sv
@@ -8,25 +8,24 @@ module unpackinput (
     output logic [`NF:0]            Man,    // mantissas of XYZ (converted to largest supported precision)
     output logic                    NaN,    // is XYZ a NaN
     output logic                    SNaN, // is XYZ a signaling NaN
-    output logic                    Denorm,   // is XYZ denormalized
     output logic                    Zero,         // is XYZ zero
     output logic                    Inf,            // is XYZ infinity
+    output logic                    ExpNonZero,            // is the exponent not zero
+    output logic                    FracZero,            // is the fraction zero
     output logic                    ExpMax                       // does In have the maximum exponent (NaN or Inf)
 );
  
     logic [`NF-1:0] Frac; //Fraction of XYZ
-    logic           ExpNonZero; // is the exponent of XYZ non-zero
-    logic           FracZero; // is the fraction zero
     logic           ExpZero;
+    logic           BadNaNBox;
     
     if (`FPSIZES == 1) begin        // if there is only one floating point format supported
+        assign BadNaNBox = 0;
         assign Sgn = In[`FLEN-1];  // sign bit
         assign Frac = In[`NF-1:0];  // fraction (no assumed 1)
-        assign FracZero = ~|Frac; // is the fraction zero?
-        assign ExpNonZero = |Exp;  // is the exponent non-zero
-        assign Denorm = ~ExpNonZero & ~FracZero; // is the input (in its original format) denormalized
-        assign Exp = {In[`FLEN-2:`NF+1], In[`NF]|Denorm};  // exponent.  Denormalized numbers have effective biased exponent of 1
-        assign ExpMax = &Exp;  // is the exponent all 1's
+        assign ExpNonZero = |In[`FLEN-2:`NF];  // is the exponent non-zero
+        assign Exp = {In[`FLEN-2:`NF+1], In[`NF]|~ExpNonZero};  // exponent.  Denormalized numbers have effective biased exponent of 1
+        assign ExpMax = &In[`FLEN-2:`NF];  // is the exponent all 1's
     end else if (`FPSIZES == 2) begin   // if there are 2 floating point formats supported
         //***need better names for these constants
         // largest format | smaller format
@@ -47,25 +46,16 @@ module unpackinput (
         //      quad   and half
         //      double and half
 
-        logic  [`LEN1-1:0]  Len1; // Remove NaN boxing or NaN, if not properly NaN boxed
-
-        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN
-        assign Len1 = &In[`FLEN-1:`LEN1] ? In[`LEN1-1:0] : {1'b0, {`NE1+1{1'b1}}, (`NF1-1)'(0)};
+        assign BadNaNBox = ~(FmtE|(&In[`FLEN-1:`LEN1])); // Check NaN boxing
 
         // choose sign bit depending on format - 1=larger precsion 0=smaller precision
-        assign Sgn = FmtE ? In[`FLEN-1] : Len1[`LEN1-1];
+        assign Sgn = FmtE ? In[`FLEN-1] : In[`LEN1-1];
 
         // extract the fraction, add trailing zeroes to the mantissa if nessisary
-        assign Frac = FmtE ? In[`NF-1:0] : {Len1[`NF1-1:0], (`NF-`NF1)'(0)};
+        assign Frac = FmtE ? In[`NF-1:0] : {In[`NF1-1:0], (`NF-`NF1)'(0)};
 
-        // is the fraction zero
-        assign FracZero = ~|Frac;
-        
         // is the exponent non-zero
-        assign ExpNonZero = FmtE ? |In[`FLEN-2:`NF] : |Len1[`LEN1-2:`NF1]; 
-
-        // is the input (in it's original format) denormalized
-        assign Denorm = ~ExpNonZero & ~FracZero;
+        assign ExpNonZero = FmtE ? |In[`FLEN-2:`NF] : |In[`LEN1-2:`NF1]; 
 
         // example double to single conversion:
         // 1023 = 0011 1111 1111
@@ -77,12 +67,10 @@ module unpackinput (
 
         // extract the exponent, converting the smaller exponent into the larger precision if nessisary
         //      - if the original precision had a denormal number convert the exponent value 1
-        assign Exp = FmtE ? {In[`FLEN-2:`NF+1], In[`NF]|Denorm} : {Len1[`LEN1-2], {`NE-`NE1{~Len1[`LEN1-2]}}, Len1[`LEN1-3:`NF1+1], Len1[`NF1]|Denorm}; 
+        assign Exp = FmtE ? {In[`FLEN-2:`NF+1], In[`NF]|~ExpNonZero} : {In[`LEN1-2], {`NE-`NE1{~In[`LEN1-2]}}, In[`LEN1-3:`NF1+1], In[`NF1]|~ExpNonZero}; 
  
-
-
         // is the exponent all 1's
-        assign ExpMax = FmtE ? &In[`FLEN-2:`NF] : &Len1[`LEN1-2:`NF1];
+        assign ExpMax = FmtE ? &In[`FLEN-2:`NF] : &In[`LEN1-2:`NF1];
     
 
     end else if (`FPSIZES == 3) begin       // three floating point precsions supported
@@ -104,22 +92,21 @@ module unpackinput (
         //      quad   and double and half
         //      quad   and single and half
 
-        logic  [`LEN1-1:0]  Len1; // Remove NaN boxing or NaN, if not properly NaN boxed for larger percision
-        logic  [`LEN2-1:0]  Len2; // Remove NaN boxing or NaN, if not properly NaN boxed for smallest precision
-        
-        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for larger precision
-        assign Len1 = &In[`FLEN-1:`LEN1] ? In[`LEN1-1:0] : {1'b0, {`NE1+1{1'b1}}, (`NF1-1)'(0)};
-
-        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for smaller precision
-        assign Len2 = &In[`FLEN-1:`LEN2] ? In[`LEN2-1:0] : {1'b0, {`NE2+1{1'b1}}, (`NF2-1)'(0)};
-
+        // Check NaN boxing
+        always_comb
+            case (FmtE)
+                `FMT:  BadNaNBox = 0;
+                `FMT1: BadNaNBox = ~&In[`FLEN-1:`LEN1];
+                `FMT2: BadNaNBox = ~&In[`FLEN-1:`LEN2];
+                default: BadNaNBox = 0;
+            endcase
 
         // extract the sign bit
         always_comb
             case (FmtE)
                 `FMT:  Sgn = In[`FLEN-1];
-                `FMT1: Sgn = Len1[`LEN1-1];
-                `FMT2: Sgn = Len2[`LEN2-1];
+                `FMT1: Sgn = In[`LEN1-1];
+                `FMT2: Sgn = In[`LEN2-1];
                 default: Sgn = 0;
             endcase
 
@@ -127,27 +114,20 @@ module unpackinput (
         always_comb
             case (FmtE)
                 `FMT: Frac = In[`NF-1:0];
-                `FMT1: Frac = {Len1[`NF1-1:0], (`NF-`NF1)'(0)};
-                `FMT2: Frac = {Len2[`NF2-1:0], (`NF-`NF2)'(0)};
+                `FMT1: Frac = {In[`NF1-1:0], (`NF-`NF1)'(0)};
+                `FMT2: Frac = {In[`NF2-1:0], (`NF-`NF2)'(0)};
                 default: Frac = 0;
             endcase
 
-        // is the fraction zero
-        assign FracZero = ~|Frac;
-
-
         // is the exponent non-zero
         always_comb
             case (FmtE)
                 `FMT:  ExpNonZero = |In[`FLEN-2:`NF];     // if input is largest precision (`FLEN - ie quad or double)
-                `FMT1: ExpNonZero = |Len1[`LEN1-2:`NF1];  // if input is larger precsion (`LEN1 - double or single)
-                `FMT2: ExpNonZero = |Len2[`LEN2-2:`NF2]; // if input is smallest precsion (`LEN2 - single or half)
+                `FMT1: ExpNonZero = |In[`LEN1-2:`NF1];  // if input is larger precsion (`LEN1 - double or single)
+                `FMT2: ExpNonZero = |In[`LEN2-2:`NF2]; // if input is smallest precsion (`LEN2 - single or half)
                 default: ExpNonZero = 0; 
             endcase
             
-        // is the input (in it's original format) denormalized
-        assign Denorm = ~ExpNonZero & ~FracZero;
-
         // example double to single conversion:
         // 1023 = 0011 1111 1111
         // 127  = 0000 0111 1111 (subtract this)
@@ -159,9 +139,9 @@ module unpackinput (
         // convert the larger precision's exponent to use the largest precision's bias
         always_comb 
             case (FmtE)
-                `FMT:  Exp = {In[`FLEN-2:`NF+1], In[`NF]|Denorm};
-                `FMT1: Exp = {Len1[`LEN1-2], {`NE-`NE1{~Len1[`LEN1-2]}}, Len1[`LEN1-3:`NF1+1], Len1[`NF1]|Denorm}; 
-                `FMT2: Exp = {Len2[`LEN2-2], {`NE-`NE2{~Len2[`LEN2-2]}}, Len2[`LEN2-3:`NF2+1], Len2[`NF2]|Denorm}; 
+                `FMT:  Exp = {In[`FLEN-2:`NF+1], In[`NF]|~ExpNonZero};
+                `FMT1: Exp = {In[`LEN1-2], {`NE-`NE1{~In[`LEN1-2]}}, In[`LEN1-3:`NF1+1], In[`NF1]|~ExpNonZero}; 
+                `FMT2: Exp = {In[`LEN2-2], {`NE-`NE2{~In[`LEN2-2]}}, In[`LEN2-3:`NF2+1], In[`NF2]|~ExpNonZero}; 
                 default: Exp = 0;
             endcase
 
@@ -169,8 +149,8 @@ module unpackinput (
         always_comb
             case (FmtE)
                 `FMT:  ExpMax = &In[`FLEN-2:`NF];
-                `FMT1: ExpMax = &Len1[`LEN1-2:`NF1];
-                `FMT2: ExpMax = &Len2[`LEN2-2:`NF2];
+                `FMT1: ExpMax = &In[`LEN1-2:`NF1];
+                `FMT2: ExpMax = &In[`LEN2-2:`NF2];
                 default: ExpMax = 0;
             endcase
 
@@ -184,27 +164,22 @@ module unpackinput (
         //   `Q_BIAS |  `D_BIAS |  `S_BIAS |  `H_BIAS    exponent's bias value
         //   `Q_FMT  |  `D_FMT  |  `S_FMT  |  `H_FMT     precision's format value - Q=11 D=01 S=00 H=10
 
-
-        logic  [`D_LEN-1:0]  Len1; // Remove NaN boxing or NaN, if not properly NaN boxed for double percision
-        logic  [`S_LEN-1:0]  Len2; // Remove NaN boxing or NaN, if not properly NaN boxed for single percision
-        logic  [`H_LEN-1:0]  Len3; // Remove NaN boxing or NaN, if not properly NaN boxed for half percision
-        
-        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for double precision
-        assign Len1 = &In[`Q_LEN-1:`D_LEN] ? In[`D_LEN-1:0] : {1'b0, {`D_NE+1{1'b1}}, (`D_NF-1)'(0)};
-
-        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for single precision
-        assign Len2 = &In[`Q_LEN-1:`S_LEN] ? In[`S_LEN-1:0] : {1'b0, {`S_NE+1{1'b1}}, (`S_NF-1)'(0)};
-
-        // Check NaN boxing, If the value is not properly NaN boxed, set the value to a quiet NaN - for half precision
-        assign Len3 = &In[`Q_LEN-1:`H_LEN] ? In[`H_LEN-1:0] : {1'b0, {`H_NE+1{1'b1}}, (`H_NF-1)'(0)};
+        // Check NaN boxing
+        always_comb
+            case (FmtE)
+                2'b11:  BadNaNBox = 0;
+                2'b01: BadNaNBox = ~&In[`Q_LEN-1:`D_LEN];
+                2'b00: BadNaNBox = ~&In[`Q_LEN-1:`S_LEN];
+                2'b10: BadNaNBox = ~&In[`Q_LEN-1:`H_LEN];
+            endcase
 
         // extract sign bit
         always_comb
             case (FmtE)
                 2'b11: Sgn = In[`Q_LEN-1];
-                2'b01: Sgn = Len1[`D_LEN-1];
-                2'b00: Sgn = Len2[`S_LEN-1];
-                2'b10: Sgn = Len3[`H_LEN-1];
+                2'b01: Sgn = In[`D_LEN-1];
+                2'b00: Sgn = In[`S_LEN-1];
+                2'b10: Sgn = In[`H_LEN-1];
             endcase
             
 
@@ -212,26 +187,20 @@ module unpackinput (
         always_comb
             case (FmtE)
                 2'b11: Frac = In[`Q_NF-1:0];
-                2'b01: Frac = {Len1[`D_NF-1:0], (`Q_NF-`D_NF)'(0)};
-                2'b00: Frac = {Len2[`S_NF-1:0], (`Q_NF-`S_NF)'(0)};
-                2'b10: Frac = {Len3[`H_NF-1:0], (`Q_NF-`H_NF)'(0)};
+                2'b01: Frac = {In[`D_NF-1:0], (`Q_NF-`D_NF)'(0)};
+                2'b00: Frac = {In[`S_NF-1:0], (`Q_NF-`S_NF)'(0)};
+                2'b10: Frac = {In[`H_NF-1:0], (`Q_NF-`H_NF)'(0)};
             endcase
 
-        // is the fraction zero
-        assign FracZero = ~|Frac;
-
         // is the exponent non-zero
         always_comb
             case (FmtE)
                 2'b11: ExpNonZero = |In[`Q_LEN-2:`Q_NF];
-                2'b01: ExpNonZero = |Len1[`D_LEN-2:`D_NF];
-                2'b00: ExpNonZero = |Len2[`S_LEN-2:`S_NF]; 
-                2'b10: ExpNonZero = |Len3[`H_LEN-2:`H_NF]; 
+                2'b01: ExpNonZero = |In[`D_LEN-2:`D_NF];
+                2'b00: ExpNonZero = |In[`S_LEN-2:`S_NF]; 
+                2'b10: ExpNonZero = |In[`H_LEN-2:`H_NF]; 
             endcase
 
-        // is the input (in it's original format) denormalized
-        assign Denorm = ~ExpNonZero & ~FracZero;
-
 
         // example double to single conversion:
         // 1023 = 0011 1111 1111
@@ -244,10 +213,10 @@ module unpackinput (
         // convert the double precsion exponent into quad precsion
         always_comb
             case (FmtE)
-                2'b11: Exp = {In[`Q_LEN-2:`Q_NF+1], In[`Q_NF]|Denorm};
-                2'b01: Exp = {Len1[`D_LEN-2], {`Q_NE-`D_NE{~Len1[`D_LEN-2]}}, Len1[`D_LEN-3:`D_NF+1], Len1[`D_NF]|Denorm};
-                2'b00: Exp = {Len2[`S_LEN-2], {`Q_NE-`S_NE{~Len2[`S_LEN-2]}}, Len2[`S_LEN-3:`S_NF+1], Len2[`S_NF]|Denorm};
-                2'b10: Exp = {Len3[`H_LEN-2], {`Q_NE-`H_NE{~Len3[`H_LEN-2]}}, Len3[`H_LEN-3:`H_NF+1], Len3[`H_NF]|Denorm}; 
+                2'b11: Exp = {In[`Q_LEN-2:`Q_NF+1], In[`Q_NF]|~ExpNonZero};
+                2'b01: Exp = {In[`D_LEN-2], {`Q_NE-`D_NE{~In[`D_LEN-2]}}, In[`D_LEN-3:`D_NF+1], In[`D_NF]|~ExpNonZero};
+                2'b00: Exp = {In[`S_LEN-2], {`Q_NE-`S_NE{~In[`S_LEN-2]}}, In[`S_LEN-3:`S_NF+1], In[`S_NF]|~ExpNonZero};
+                2'b10: Exp = {In[`H_LEN-2], {`Q_NE-`H_NE{~In[`H_LEN-2]}}, In[`H_LEN-3:`H_NF+1], In[`H_NF]|~ExpNonZero}; 
             endcase
 
 
@@ -255,19 +224,18 @@ module unpackinput (
         always_comb 
             case (FmtE)
                 2'b11: ExpMax = &In[`Q_LEN-2:`Q_NF];
-                2'b01: ExpMax = &Len1[`D_LEN-2:`D_NF];
-                2'b00: ExpMax = &Len2[`S_LEN-2:`S_NF];
-                2'b10: ExpMax = &Len3[`H_LEN-2:`H_NF];
+                2'b01: ExpMax = &In[`D_LEN-2:`D_NF];
+                2'b00: ExpMax = &In[`S_LEN-2:`S_NF];
+                2'b10: ExpMax = &In[`H_LEN-2:`H_NF];
             endcase
 
     end
 
     // Output logic
-    assign ExpZero = ~ExpNonZero; // is the exponent all 0's?
+    assign FracZero = ~|Frac; // is the fraction zero?
     assign Man = {ExpNonZero, Frac}; // add the assumed one (or zero if denormal or zero) to create the significand
-    //   ***  - force to be a NaN if it isn't properly Nan Boxed
-    assign NaN = ExpMax & ~FracZero; // is the input a NaN?
-    assign SNaN = NaN&~Frac[`NF-1]; // is the input a singnaling NaN?
+    assign NaN = (ExpMax & ~FracZero)|BadNaNBox; // is the input a NaN?
+    assign SNaN = NaN&~Frac[`NF-1]&~BadNaNBox; // is the input a singnaling NaN?
     assign Inf = ExpMax & FracZero; // is the input infinity?
-    assign Zero = ExpZero & FracZero; // is the input zero?
+    assign Zero = ~ExpNonZero & FracZero; // is the input zero?
 endmodule
\ No newline at end of file
diff --git a/pipelined/testbench/testbench-fp.sv b/pipelined/testbench/testbench-fp.sv
index 892e7637..b46061a0 100644
--- a/pipelined/testbench/testbench-fp.sv
+++ b/pipelined/testbench/testbench-fp.sv
@@ -79,7 +79,6 @@ module testbenchfp;
   logic [`NF:0]         FmaRuXMan, FmaRuYMan, FmaRuZMan;
   logic [`NF:0]         FmaRdXMan, FmaRdYMan, FmaRdZMan;
   logic [`NF:0]         FmaRnmXMan, FmaRnmYMan, FmaRnmZMan;
-  logic                 XNorm;                                // is X normal
   logic                 XNaN, YNaN, ZNaN;                     // is the input NaN
   logic                 FmaRneXNaN, FmaRneYNaN, FmaRneZNaN;
   logic                 FmaRzXNaN, FmaRzYNaN, FmaRzZNaN;
@@ -92,12 +91,12 @@ module testbenchfp;
   logic                 FmaRuXSNaN, FmaRuYSNaN, FmaRuZSNaN;
   logic                 FmaRdXSNaN, FmaRdYSNaN, FmaRdZSNaN;
   logic                 FmaRnmXSNaN, FmaRnmYSNaN, FmaRnmZSNaN;
-  logic                 XDenorm, YDenorm, ZDenorm;            // is the input denormalized
-  logic                 FmaRneXDenorm, FmaRneYDenorm, FmaRneZDenorm;
-  logic                 FmaRzXDenorm, FmaRzYDenorm, FmaRzZDenorm;
-  logic                 FmaRuXDenorm, FmaRuYDenorm, FmaRuZDenorm;
-  logic                 FmaRdXDenorm, FmaRdYDenorm, FmaRdZDenorm;
-  logic                 FmaRnmXDenorm, FmaRnmYDenorm, FmaRnmZDenorm;
+  logic                 XDenorm, ZDenorm;            // is the input denormalized
+  logic                 FmaRneXDenorm, FmaRneZDenorm;
+  logic                 FmaRzXDenorm, FmaRzZDenorm;
+  logic                 FmaRuXDenorm, FmaRuZDenorm;
+  logic                 FmaRdXDenorm, FmaRdZDenorm;
+  logic                 FmaRnmXDenorm, FmaRnmZDenorm;
   logic                 XInf, YInf, ZInf;                   // is the input infinity
   logic                 FmaRneXInf, FmaRneYInf, FmaRneZInf;
   logic                 FmaRzXInf, FmaRzYInf, FmaRzZInf;
@@ -683,7 +682,7 @@ module testbenchfp;
                                     .XManE(FmaRneXMan), .YManE(FmaRneYMan), .ZManE(FmaRneZMan), 
                                     .XNaNE(FmaRneXNaN), .YNaNE(FmaRneYNaN), .ZNaNE(FmaRneZNaN),
                                     .XSNaNE(FmaRneXSNaN), .YSNaNE(FmaRneYSNaN), .ZSNaNE(FmaRneZSNaN), 
-                                    .XDenormE(FmaRneXDenorm), .YDenormE(FmaRneYDenorm), .ZDenormE(FmaRneZDenorm), 
+                                    .XDenormE(FmaRneXDenorm), .ZDenormE(FmaRneZDenorm), 
                                     .XZeroE(FmaRneXZero), .YZeroE(FmaRneYZero), .ZZeroE(FmaRneZZero),
                                     .XInfE(FmaRneXInf), .YInfE(FmaRneYInf), .ZInfE(FmaRneZInf), .FmaModFmt, .FmaFmt(FmaFmtVal),
                                     .X(FmaRneX), .Y(FmaRneY), .Z(FmaRneZ));
@@ -693,7 +692,7 @@ module testbenchfp;
                                     .XManE(FmaRzXMan), .YManE(FmaRzYMan), .ZManE(FmaRzZMan), 
                                     .XNaNE(FmaRzXNaN), .YNaNE(FmaRzYNaN), .ZNaNE(FmaRzZNaN),
                                     .XSNaNE(FmaRzXSNaN), .YSNaNE(FmaRzYSNaN), .ZSNaNE(FmaRzZSNaN), 
-                                    .XDenormE(FmaRzXDenorm), .YDenormE(FmaRzYDenorm), .ZDenormE(FmaRzZDenorm), 
+                                    .XDenormE(FmaRzXDenorm), .ZDenormE(FmaRzZDenorm), 
                                     .XZeroE(FmaRzXZero), .YZeroE(FmaRzYZero), .ZZeroE(FmaRzZZero),
                                     .XInfE(FmaRzXInf), .YInfE(FmaRzYInf), .ZInfE(FmaRzZInf), .FmaFmt(FmaFmtVal),
                                     .X(FmaRzX), .Y(FmaRzY), .Z(FmaRzZ));
@@ -703,7 +702,7 @@ module testbenchfp;
                                     .XManE(FmaRuXMan), .YManE(FmaRuYMan), .ZManE(FmaRuZMan), 
                                     .XNaNE(FmaRuXNaN), .YNaNE(FmaRuYNaN), .ZNaNE(FmaRuZNaN),
                                     .XSNaNE(FmaRuXSNaN), .YSNaNE(FmaRuYSNaN), .ZSNaNE(FmaRuZSNaN), 
-                                    .XDenormE(FmaRuXDenorm), .YDenormE(FmaRuYDenorm), .ZDenormE(FmaRuZDenorm), 
+                                    .XDenormE(FmaRuXDenorm), .ZDenormE(FmaRuZDenorm), 
                                     .XZeroE(FmaRuXZero), .YZeroE(FmaRuYZero), .ZZeroE(FmaRuZZero),
                                     .XInfE(FmaRuXInf), .YInfE(FmaRuYInf), .ZInfE(FmaRuZInf), .FmaFmt(FmaFmtVal),
                                     .X(FmaRuX), .Y(FmaRuY), .Z(FmaRuZ));
@@ -713,7 +712,7 @@ module testbenchfp;
                                     .XManE(FmaRdXMan), .YManE(FmaRdYMan), .ZManE(FmaRdZMan), 
                                     .XNaNE(FmaRdXNaN), .YNaNE(FmaRdYNaN), .ZNaNE(FmaRdZNaN),
                                     .XSNaNE(FmaRdXSNaN), .YSNaNE(FmaRdYSNaN), .ZSNaNE(FmaRdZSNaN), 
-                                    .XDenormE(FmaRdXDenorm), .YDenormE(FmaRdYDenorm), .ZDenormE(FmaRdZDenorm), 
+                                    .XDenormE(FmaRdXDenorm), .ZDenormE(FmaRdZDenorm), 
                                     .XZeroE(FmaRdXZero), .YZeroE(FmaRdYZero), .ZZeroE(FmaRdZZero),
                                     .XInfE(FmaRdXInf), .YInfE(FmaRdYInf), .ZInfE(FmaRdZInf), .FmaFmt(FmaFmtVal),
                                     .X(FmaRdX), .Y(FmaRdY), .Z(FmaRdZ));
@@ -723,7 +722,7 @@ module testbenchfp;
                                     .XManE(FmaRnmXMan), .YManE(FmaRnmYMan), .ZManE(FmaRnmZMan),
                                     .XNaNE(FmaRnmXNaN), .YNaNE(FmaRnmYNaN), .ZNaNE(FmaRnmZNaN),
                                     .XSNaNE(FmaRnmXSNaN), .YSNaNE(FmaRnmYSNaN), .ZSNaNE(FmaRnmZSNaN), 
-                                    .XDenormE(FmaRnmXDenorm), .YDenormE(FmaRnmYDenorm), .ZDenormE(FmaRnmZDenorm), 
+                                    .XDenormE(FmaRnmXDenorm), .ZDenormE(FmaRnmZDenorm), 
                                     .XZeroE(FmaRnmXZero), .YZeroE(FmaRnmYZero), .ZZeroE(FmaRnmZZero),
                                     .XInfE(FmaRnmXInf), .YInfE(FmaRnmYInf), .ZInfE(FmaRnmZInf), .FmaFmt(FmaFmtVal),
                                     .X(FmaRnmX), .Y(FmaRnmY), .Z(FmaRnmZ));
@@ -733,9 +732,9 @@ module testbenchfp;
                                     .XManE(XMan), .YManE(YMan), .ZManE(ZMan),
                                     .XNaNE(XNaN), .YNaNE(YNaN), .ZNaNE(ZNaN),
                                     .XSNaNE(XSNaN), .YSNaNE(YSNaN), .ZSNaNE(ZSNaN), 
-                                    .XDenormE(XDenorm), .YDenormE(YDenorm), .ZDenormE(ZDenorm), 
+                                    .XDenormE(XDenorm), .ZDenormE(ZDenorm), 
                                     .XZeroE(XZero), .YZeroE(YZero), .ZZeroE(ZZero),
-                                    .XInfE(XInf), .YInfE(YInf), .ZInfE(ZInf),.XNormE(XNorm), .XExpMaxE(XExpMax),
+                                    .XInfE(XInf), .YInfE(YInf), .ZInfE(ZInf), .XExpMaxE(XExpMax),
                                     .X, .Y, .Z);
 
 
@@ -1294,13 +1293,13 @@ module readfmavectors (
   output logic [`NF:0]        XManE, YManE, ZManE,    // mantissas of XYZ (converted to largest supported precision)
   output logic                XNaNE, YNaNE, ZNaNE,    // is XYZ a NaN
   output logic                XSNaNE, YSNaNE, ZSNaNE, // is XYZ a signaling NaN
-  output logic                XDenormE, YDenormE, ZDenormE,   // is XYZ denormalized
+  output logic                XDenormE, ZDenormE,   // is XYZ denormalized
   output logic                XZeroE, YZeroE, ZZeroE,         // is XYZ zero
   output logic                XInfE, YInfE, ZInfE,            // is XYZ infinity
   output logic [`FLEN-1:0]    X, Y, Z                 // inputs
 );
 
-  logic XNormE, XExpMaxE; // signals the unpacker outputs but isn't used in FMA
+  logic XExpMaxE; // signals the unpacker outputs but isn't used in FMA
   // apply test vectors on rising edge of clk
   // Format of vectors Inputs(1/2/3)_AnsFlg
   always @(posedge clk) begin
@@ -1335,7 +1334,7 @@ module readfmavectors (
   end
   
   unpack unpack(.X, .Y, .Z, .FmtE(FmaModFmt), .XSgnE, .YSgnE, .ZSgnE, .XExpE, .YExpE, .ZExpE, .XDenormE,
-                .XManE, .YManE, .ZManE, .XNormE, .XNaNE, .YNaNE, .ZNaNE, .XSNaNE, .YSNaNE, .ZSNaNE,
+                .XManE, .YManE, .ZManE, .XNaNE, .YNaNE, .ZNaNE, .XSNaNE, .YSNaNE, .ZSNaNE,
                 .XZeroE, .YZeroE, .ZZeroE, .XInfE, .YInfE, .ZInfE,
                 .XExpMaxE, .ZDenormE);
 endmodule
@@ -1373,10 +1372,10 @@ module readvectors (
   output logic [`NF:0]            XManE, YManE, ZManE,    // mantissas of XYZ (converted to largest supported precision)
   output logic                    XNaNE, YNaNE, ZNaNE,    // is XYZ a NaN
   output logic                    XSNaNE, YSNaNE, ZSNaNE, // is XYZ a signaling NaN
-  output logic                    XDenormE, YDenormE, ZDenormE,   // is XYZ denormalized
+  output logic                    XDenormE, ZDenormE,   // is XYZ denormalized
   output logic                    XZeroE, YZeroE, ZZeroE,         // is XYZ zero
   output logic                    XInfE, YInfE, ZInfE,            // is XYZ infinity
-  output logic XNormE, XExpMaxE,
+  output logic XExpMaxE,
   output logic [`FLEN-1:0] X, Y, Z
 );
 
@@ -1660,7 +1659,7 @@ module readvectors (
   end
   
   unpack unpack(.X, .Y, .Z, .FmtE(ModFmt), .XSgnE, .YSgnE, .ZSgnE, .XExpE, .YExpE, .ZExpE,
-                .XManE, .YManE, .ZManE, .XNormE, .XNaNE, .YNaNE, .ZNaNE, .XSNaNE, .YSNaNE, .ZSNaNE,
-                .XDenormE, .YDenormE, .ZDenormE, .XZeroE, .YZeroE, .ZZeroE, .XInfE, .YInfE, .ZInfE,
+                .XManE, .YManE, .ZManE, .XNaNE, .YNaNE, .ZNaNE, .XSNaNE, .YSNaNE, .ZSNaNE,
+                .XDenormE, .ZDenormE, .XZeroE, .YZeroE, .ZZeroE, .XInfE, .YInfE, .ZInfE,
                 .XExpMaxE);
 endmodule
\ No newline at end of file

From ee7070c5b6cda39d0ffbe07b7da4ee6aebbb1aef Mon Sep 17 00:00:00 2001
From: DTowersM <dtowersm@gmail.com>
Date: Wed, 1 Jun 2022 17:19:19 +0000
Subject: [PATCH 13/14] some changes to further support vsim on embench

---
 benchmarks/embench/Makefile | 24 ++++++++++++++++++------
 1 file changed, 18 insertions(+), 6 deletions(-)

diff --git a/benchmarks/embench/Makefile b/benchmarks/embench/Makefile
index 0cb54e1a..4a4875df 100644
--- a/benchmarks/embench/Makefile
+++ b/benchmarks/embench/Makefile
@@ -6,14 +6,23 @@ all: build sim
 
 allClean: clean all
 
-build:
-	../../addins/embench-iot/build_all.py -v --builddir=bd_speed --arch riscv32 --chip generic --board rv32wallyverilog --ldflags="-nostartfiles ../../../config/riscv32/boards/rv32wallyverilog/startup/crt0.S" --cflags="-nostartfiles" 
+build: buildspeed buildsize
+
+buildspeed:
+	../../addins/embench-iot/build_all.py --builddir=bd_speed --arch riscv32 --chip generic --board rv32wallyverilog --ldflags="-nostartfiles ../../../config/riscv32/boards/rv32wallyverilog/startup/crt0.S" --cflags="-nostartfiles" 
 	find ../../addins/embench-iot/bd_speed/ -type f ! -name "*.*" | while read f; do cp "$$f" "$$f.elf"; done
-	../../addins/embench-iot/build_all.py -v --builddir=bd_size --arch riscv32 --chip generic --board rv32wallyverilog --ldflags="-nostdlib -nostartfiles ../../../config/riscv32/boards/rv32wallyverilog/startup/dummy.S" --cflags="-msave-restore" --dummy-libs="libgcc libm libc crt0"
 
-sim: modelSimBuild size speed
+buildsize:
+	../../addins/embench-iot/build_all.py --builddir=bd_size --arch riscv32 --chip generic --board rv32wallyverilog --ldflags="-nostdlib -nostartfiles ../../../config/riscv32/boards/rv32wallyverilog/startup/dummy.S" --cflags="-msave-restore" --dummy-libs="libgcc libm libc crt0"
 
-modelSimBuild: objdump
+sim: modelSimBuild speed
+
+# vsim:
+# 	cd ../../pipelined/regression/
+# 	vsim -c -do "do wally-pipelined-batch.do rv32gc embench"
+# 	cd ../../benchmarks/embench/
+
+modelSimBuild: buildspeed objdump
 	find ../../addins/embench-iot/bd_speed/ -type f -name "*.elf" | while read f; do riscv64-unknown-elf-elf2hex --bit-width 32 --input "$$f" --output "$$f.memfile"; done
 	find ../../addins/embench-iot/bd_speed/ -type f -name "*.elf.objdump" | while read f; do extractFunctionRadix.sh $$f; done
 
@@ -23,13 +32,16 @@ size:
 speed:
 	../../addins/embench-iot/benchmark_speed.py --builddir=bd_speed --target-module run_wally --cpu-mhz=1
 
-objdump:
+objdump: buildspeed
 	find ../../addins/embench-iot/bd_speed/ -type f -name "*.elf" | while read f; do riscv64-unknown-elf-objdump -S -D "$$f" > "$$f.objdump"; done
 
 clean: 
 	rm -rf ../../addins/embench-iot/bd_speed/
 	rm -rf ../../addins/embench-iot/bd_size/
 
+allclean: clean
+	rm -rf ../../addins/embench-iot/logs/
+
 # std:
 # 	../../addins/embench-iot/build_all.py --builddir=bd_std --arch riscv32 --chip generic --board rv32wallyverilog --cc riscv64-unknown-elf-gcc --cflags="-v -c -O2 -ffunction-sections -march=rv32imac -mabi=ilp32" --ldflags="-Wl,-gc-sections -v -march=rv32imac -mabi=ilp32 ../../../../../benchmarks/embench/tohost.S -T../../../config/riscv32/boards/rv32wallyverilog/link.ld" --user-libs="-lm" 
 # 	riscv64-unknown-elf-objdump -D ../../addins/embench-iot/bd_std/src/aha-mont64/aha-mont64 > ../../addins/embench-iot/bd_std/src/aha-mont64/aha-mont64.objdump

From d28b4cf6027a8c39b5c5ef05086fca7834af41b8 Mon Sep 17 00:00:00 2001
From: DTowersM <dtowersm@gmail.com>
Date: Wed, 1 Jun 2022 21:00:44 +0000
Subject: [PATCH 14/14] added support for embench post processing to
 testbench.sv

---
 pipelined/testbench/testbench.sv | 138 ++++++++++++++++++-------------
 1 file changed, 79 insertions(+), 59 deletions(-)

diff --git a/pipelined/testbench/testbench.sv b/pipelined/testbench/testbench.sv
index ba312292..0ebab1cf 100644
--- a/pipelined/testbench/testbench.sv
+++ b/pipelined/testbench/testbench.sv
@@ -128,7 +128,8 @@ logic [3:0] dummy;
     end
   end
 
-  string signame, memfilename, pathname, objdumpfilename, adrstr;
+  string signame, memfilename, pathname, objdumpfilename, adrstr, outputfile;
+  integer outputFilePointer;
 
   logic [31:0] GPIOPinsIn, GPIOPinsOut, GPIOPinsEn;
   logic UARTSin, UARTSout;
@@ -213,70 +214,88 @@ logic [3:0] dummy;
           $display("Benchmark: coremark is done.");
           $stop;
         end
+      // Termination condition (i.e. we finished running current test) 
       if (DCacheFlushDone) begin
- 
-        #600; // give time for instructions in pipeline to finish
-        // clear signature to prevent contamination from previous tests
-        for(i=0; i<SIGNATURESIZE; i=i+1) begin
-          sig32[i] = 'bx;
-        end
-
-        // read signature, reformat in 64 bits if necessary
-        signame = {pathname, tests[test], ".signature.output"};
-        $readmemh(signame, sig32);
-        i = 0;
-        while (i < SIGNATURESIZE) begin
-          if (`XLEN == 32) begin
-            signature[i] = sig32[i];
-            i = i+1;
-          end else begin
-            signature[i/2] = {sig32[i+1], sig32[i]};
-            i = i + 2;
-          end
-          if (i >= 4 & sig32[i-4] === 'bx) begin
-            if (i == 4) begin
-              i = SIGNATURESIZE+1; // flag empty file
-              $display("  Error: empty test file");
-            end else i = SIGNATURESIZE; // skip over the rest of the x's for efficiency
-          end
-        end
-
-        // Check errors
-        errors = (i == SIGNATURESIZE+1); // error if file is empty
-        i = 0;
+        // Gets the memory location of begin_signature
         testadr = (`RAM_BASE+tests[test+1].atohex())/(`XLEN/8);
         testadrNoBase = (tests[test+1].atohex())/(`XLEN/8);
-        /* verilator lint_off INFINITELOOP */
-        while (signature[i] !== 'bx) begin
-          logic [`XLEN-1:0] sig;
-          if (`DMEM == `MEM_TIM) sig = dut.core.lsu.dtim.dtim.ram.memory.RAM[testadrNoBase+i];
-          else                   sig = dut.uncore.ram.ram.memory.RAM[testadrNoBase+i];
-          //$display("signature[%h] = %h sig = %h", i, signature[i], sig);
-          if (signature[i] !== sig &
-          //if (signature[i] !== dut.core.lsu.dtim.ram.memory.RAM[testadr+i] &
-	      (signature[i] !== DCacheFlushFSM.ShadowRAM[testadr+i])) begin  // ***i+1?
-            if ((signature[i] !== '0 | signature[i+4] !== 'x)) begin
-              // if (signature[i+4] !== 'bx | (signature[i] !== 32'hFFFFFFFF & signature[i] !== 32'h00000000)) begin
-              // report errors unless they are garbage at the end of the sim
-              // kind of hacky test for garbage right now
-              $display("sig4 = %h ne %b", signature[i+4], signature[i+4] !== 'bx);
-              errors = errors+1;
-              $display("  Error on test %s result %d: adr = %h sim (D$) %h sim (DMEM) = %h, signature = %h", 
-                    tests[test], i, (testadr+i)*(`XLEN/8), DCacheFlushFSM.ShadowRAM[testadr+i], sig, signature[i]);
-                    //   tests[test], i, (testadr+i)*(`XLEN/8), DCacheFlushFSM.ShadowRAM[testadr+i], dut.core.lsu.dtim.ram.memory.RAM[testadr+i], signature[i]);
-              $stop;//***debug
+        #600; // give time for instructions in pipeline to finish
+        if (TEST == "embench") begin
+          // Writes contents of begin_signature to .sim.output file
+          // this contains instret and cycles for start and end of test run, used by embench python speed script to calculate embench speed score
+          // also begin_signature contains the results of the self checking mechanism, which will be read by the python script for error checking
+          $display("Embench Benchmark: %s is done.", tests[test]);
+          outputfile = {pathname, tests[test], ".sim.output"};
+          outputFilePointer = $fopen(outputfile);
+          i = 0;
+          while ($unsigned(i) < $unsigned(5'd5)) begin
+            $fdisplayh(outputFilePointer, DCacheFlushFSM.ShadowRAM[testadr+i]);
+            i = i + 1;
+          end
+          $fclose(outputFilePointer);
+          $display("Embench Benchmark: created output file: %s", outputfile);
+        end else begin 
+          // for tests with no self checking mechanism, read .signature.output file and compare to check for errors
+          // clear signature to prevent contamination from previous tests
+          for(i=0; i<SIGNATURESIZE; i=i+1) begin
+            sig32[i] = 'bx;
+          end
+          // read signature, reformat in 64 bits if necessary
+          signame = {pathname, tests[test], ".signature.output"};
+          $readmemh(signame, sig32);
+          i = 0;
+          while (i < SIGNATURESIZE) begin
+            if (`XLEN == 32) begin
+              signature[i] = sig32[i];
+              i = i+1;
+            end else begin
+              signature[i/2] = {sig32[i+1], sig32[i]};
+              i = i + 2;
+            end
+            if (i >= 4 & sig32[i-4] === 'bx) begin
+              if (i == 4) begin
+                i = SIGNATURESIZE+1; // flag empty file
+                $display("  Error: empty test file");
+              end else i = SIGNATURESIZE; // skip over the rest of the x's for efficiency
             end
           end
-          i = i + 1;
-        end
-        /* verilator lint_on INFINITELOOP */
-        if (errors == 0) begin
-          $display("%s succeeded.  Brilliant!!!", tests[test]);
-        end
-        else begin
-          $display("%s failed with %d errors. :(", tests[test], errors);
-          totalerrors = totalerrors+1;
+
+          // Check errors
+          errors = (i == SIGNATURESIZE+1); // error if file is empty
+          i = 0;
+          /* verilator lint_off INFINITELOOP */
+          while (signature[i] !== 'bx) begin
+            logic [`XLEN-1:0] sig;
+            if (`DMEM == `MEM_TIM) sig = dut.core.lsu.dtim.dtim.ram.memory.RAM[testadrNoBase+i];
+            else                   sig = dut.uncore.ram.ram.memory.RAM[testadrNoBase+i];
+            //$display("signature[%h] = %h sig = %h", i, signature[i], sig);
+            if (signature[i] !== sig &
+            //if (signature[i] !== dut.core.lsu.dtim.ram.memory.RAM[testadr+i] &
+            (signature[i] !== DCacheFlushFSM.ShadowRAM[testadr+i])) begin  // ***i+1?
+              if ((signature[i] !== '0 | signature[i+4] !== 'x)) begin
+                // if (signature[i+4] !== 'bx | (signature[i] !== 32'hFFFFFFFF & signature[i] !== 32'h00000000)) begin
+                // report errors unless they are garbage at the end of the sim
+                // kind of hacky test for garbage right now
+                $display("sig4 = %h ne %b", signature[i+4], signature[i+4] !== 'bx);
+                errors = errors+1;
+                $display("  Error on test %s result %d: adr = %h sim (D$) %h sim (DMEM) = %h, signature = %h", 
+                      tests[test], i, (testadr+i)*(`XLEN/8), DCacheFlushFSM.ShadowRAM[testadr+i], sig, signature[i]);
+                      //   tests[test], i, (testadr+i)*(`XLEN/8), DCacheFlushFSM.ShadowRAM[testadr+i], dut.core.lsu.dtim.ram.memory.RAM[testadr+i], signature[i]);
+                $stop;//***debug
+              end
+            end
+            i = i + 1;
+          end
+          /* verilator lint_on INFINITELOOP */
+          if (errors == 0) begin
+            $display("%s succeeded.  Brilliant!!!", tests[test]);
+          end
+          else begin
+            $display("%s failed with %d errors. :(", tests[test], errors);
+            totalerrors = totalerrors+1;
+          end
         end
+        // move onto the next test, check to see if we're done
         test = test + 2;
         if (test == tests.size()) begin
           if (totalerrors == 0) $display("SUCCESS! All tests ran without failures.");
@@ -284,6 +303,7 @@ logic [3:0] dummy;
           $stop;
         end
         else begin
+            // If there are still additional tests to run, read in information for the next test
             //pathname = tvpaths[tests[0]];
             memfilename = {pathname, tests[test], ".elf.memfile"};
             //$readmemh(memfilename, dut.uncore.ram.ram.memory.RAM);