From dac011c1d2fd5eb635dafa8235e250a96d3a6030 Mon Sep 17 00:00:00 2001
From: Alec Vercruysse <vercruysse.alec@gmail.com>
Date: Wed, 29 Mar 2023 13:04:00 -0700
Subject: [PATCH 1/7] icache coverage improvements by simplifying logic

---
 src/cache/cache.sv    | 19 +++++++++++++------
 src/cache/cacheLRU.sv |  8 +++++---
 2 files changed, 18 insertions(+), 9 deletions(-)

diff --git a/src/cache/cache.sv b/src/cache/cache.sv
index da7f8327..3dac0c56 100644
--- a/src/cache/cache.sv
+++ b/src/cache/cache.sv
@@ -168,14 +168,21 @@ module cache #(parameter LINELEN,  NUMLINES,  NUMWAYS, LOGBWPL, WORDLEN, MUXINTE
     assign DemuxedByteMask[(index+1)*(WORDLEN/8)-1:index*(WORDLEN/8)] = MemPAdrDecoded[index] ? ByteMask : '0;
   end
   assign FetchBufferByteSel = SetValid & ~SetDirty ? '1 : ~DemuxedByteMask;  // If load miss set all muxes to 1.
-  assign LineByteMask = SetValid ? '1 : SetDirty ? DemuxedByteMask : '0;
 
-  // Merge write data into fetched cache line for store miss
-  for(index = 0; index < LINELEN/8; index++) begin
-    mux2 #(8) WriteDataMux(.d0(CacheWriteData[(8*index)%WORDLEN+7:(8*index)%WORDLEN]),
-      .d1(FetchBuffer[8*index+7:8*index]), .s(FetchBufferByteSel[index]), .y(LineWriteData[8*index+7:8*index]));
+  if(!READ_ONLY_CACHE) begin:WriteSelLogic
+    // Merge write data into fetched cache line for store miss
+    for(index = 0; index < LINELEN/8; index++) begin
+       mux2 #(8) WriteDataMux(.d0(CacheWriteData[(8*index)%WORDLEN+7:(8*index)%WORDLEN]),
+         .d1(FetchBuffer[8*index+7:8*index]), .s(FetchBufferByteSel[index]), .y(LineWriteData[8*index+7:8*index]));
+    end
+    assign LineByteMask = SetValid ? '1 : SetDirty ? DemuxedByteMask : '0;
   end
-   
+  else
+    begin:WriteSelLogic
+       // No need for this mux if the cache does not handle writes.
+       assign LineWriteData = FetchBuffer;
+       assign LineByteMask = '1;
+    end
   /////////////////////////////////////////////////////////////////////////////////////////////
   // Flush logic
   /////////////////////////////////////////////////////////////////////////////////////////////
diff --git a/src/cache/cacheLRU.sv b/src/cache/cacheLRU.sv
index 05e26f4b..78080794 100644
--- a/src/cache/cacheLRU.sv
+++ b/src/cache/cacheLRU.sv
@@ -98,7 +98,9 @@ module cacheLRU
     assign LRUUpdate[t1] = LRUUpdate[s] & WayEncoded[r];
   end
 
-  mux2 #(1) LRUMuxes[NUMWAYS-2:0](CurrLRU, ~WayExpanded, LRUUpdate, NextLRU);
+  // The root node of the LRU tree will always be selected in LRUUpdate. No mux needed.
+  assign NextLRU[NUMWAYS-2] = ~WayExpanded[NUMWAYS-2];
+  mux2 #(1) LRUMuxes[NUMWAYS-3:0](CurrLRU[NUMWAYS-3:0], ~WayExpanded[NUMWAYS-3:0], LRUUpdate[NUMWAYS-3:0], NextLRU[NUMWAYS-3:0]);
 
   // Compute next victim way.
   for(s = NUMWAYS-2; s >= NUMWAYS/2; s--) begin
@@ -128,8 +130,8 @@ module cacheLRU
   always_ff @(posedge clk) begin
     if (reset) for (int set = 0; set < NUMLINES; set++) LRUMemory[set] <= '0;
     if(CacheEn) begin
-      if((InvalidateCache | FlushCache) & ~FlushStage) for (int set = 0; set < NUMLINES; set++) LRUMemory[set] <= '0;
-      else if (LRUWriteEn & ~FlushStage) begin 
+      // if((InvalidateCache | FlushCache) & ~FlushStage) for (int set = 0; set < NUMLINES; set++) LRUMemory[set] <= '0;
+      if (LRUWriteEn & ~FlushStage) begin 
         LRUMemory[PAdr] <= NextLRU;
       end
       if(LRUWriteEn & ~FlushStage & (PAdr == CacheSet))

From 3990417d704209eac501755de21bf6a0df354487 Mon Sep 17 00:00:00 2001
From: Alessandro Maiuolo <amaiuolo@g.hmc.edu>
Date: Wed, 29 Mar 2023 20:57:26 -0700
Subject: [PATCH 2/7] integrated tv generation for IFdivsqrt

---
 .../fp/combined_IF_vectors/IF_vectors/README  |   4 +
 .../combined_IF_vectors/create_IF_vectors.sh  |   8 +
 .../extract_arch_vectors.py                   | 251 ++++++++++++++++++
 .../extract_testfloat_vectors.py              |  79 ++++++
 tests/fp/create_all_vectors.sh                |   3 +
 5 files changed, 345 insertions(+)
 create mode 100644 tests/fp/combined_IF_vectors/IF_vectors/README
 create mode 100755 tests/fp/combined_IF_vectors/create_IF_vectors.sh
 create mode 100755 tests/fp/combined_IF_vectors/extract_arch_vectors.py
 create mode 100755 tests/fp/combined_IF_vectors/extract_testfloat_vectors.py

diff --git a/tests/fp/combined_IF_vectors/IF_vectors/README b/tests/fp/combined_IF_vectors/IF_vectors/README
new file mode 100644
index 00000000..bfbf368d
--- /dev/null
+++ b/tests/fp/combined_IF_vectors/IF_vectors/README
@@ -0,0 +1,4 @@
+This folder holds the archtest and testfloat vectors necessary fo evaluating performance
+of standalone intdiv vs combined IFdivsqrt
+
+to generate vectors, uncomment line 8 in create_all_vectors.sh
\ No newline at end of file
diff --git a/tests/fp/combined_IF_vectors/create_IF_vectors.sh b/tests/fp/combined_IF_vectors/create_IF_vectors.sh
new file mode 100755
index 00000000..d6b83f59
--- /dev/null
+++ b/tests/fp/combined_IF_vectors/create_IF_vectors.sh
@@ -0,0 +1,8 @@
+#!/bin/sh
+# create test vectors for stand alone int
+
+./extract_testfloat_vectors.py
+./extract_arch_vectors.py
+
+# to create tvs for evaluation of combined IFdivsqrt
+#./combined_IF_vectors/create_IF_vectors.sh
\ No newline at end of file
diff --git a/tests/fp/combined_IF_vectors/extract_arch_vectors.py b/tests/fp/combined_IF_vectors/extract_arch_vectors.py
new file mode 100755
index 00000000..c80c7a84
--- /dev/null
+++ b/tests/fp/combined_IF_vectors/extract_arch_vectors.py
@@ -0,0 +1,251 @@
+#! /usr/bin/python3
+
+# author: Alessandro Maiuolo
+# contact: amaiuolo@g.hmc.edu
+# date created: 3-29-2023
+
+# extract all arch test vectors
+import os
+wally = os.popen('echo $WALLY').read().strip()
+
+def ext_bits(my_string):
+    target_len = 32 # we want 128 bits, div by 4 bc hex notation
+    zeroes_to_add = target_len - len(my_string)
+    return zeroes_to_add*"0" + my_string
+
+def twos_comp(b, x):
+    if b == 32:
+        return hex(0x100000000 - int(x,16))[2:]
+    elif b == 64:
+        return hex(0x10000000000000000 - int(x,16))[2:]
+    else:
+        return "UNEXPECTED_BITSIZE"
+
+def unpack_rf(packed):
+    bin_u = bin(int(packed, 16))[2:].zfill(8) # translate to binary
+    flags = hex(int(bin_u[3:],2))[2:].zfill(2)
+    rounding_mode = hex(int(bin_u[:3],2))[2:]
+    return flags, rounding_mode
+
+# rounding mode dictionary
+round_dict = {
+    "rne":"0",
+    "rnm":"4",
+    "ru":"3",
+    "rz":"1",
+    "rd":"2",
+    "dyn":"7"
+}
+
+# fcsr dictionary
+fcsr_dict = {
+    "0":"rne",
+    "128":"rnm",
+    "96":"ru",
+    "32":"rz",
+    "64":"rd",
+    "224":"dyn"
+}
+
+print("creating arch test vectors")
+
+class Config:
+  def __init__(self, bits, letter, op, filt, op_code):
+    self.bits = bits
+    self.letter = letter
+    self.op = op
+    self.filt = filt
+    self.op_code = op_code
+
+def create_vectors(my_config):
+    suite_folder_num = my_config.bits
+    if my_config.bits == 64 and my_config.letter == "F": suite_folder_num = 32
+    source_dir1 = "{}/addins/riscv-arch-test/riscv-test-suite/rv{}i_m/{}/src/".format(wally, suite_folder_num, my_config.letter)
+    source_dir2 = "{}/tests/riscof/work/riscv-arch-test/rv{}i_m/{}/src/".format(wally, my_config.bits, my_config.letter)
+    dest_dir = "{}/tests/fp/combined_IF_vectors/IF_vectors/".format(wally)
+    all_vectors1 = os.listdir(source_dir1)
+
+    filt_vectors1 = [v for v in all_vectors1 if my_config.filt in v]
+    # print(filt_vectors1)
+    filt_vectors2 = [v + "/ref/Reference-sail_c_simulator.signature" for v in all_vectors1 if my_config.filt in v]
+
+    # iterate through all vectors
+    for i in range(len(filt_vectors1)):
+        vector1 = filt_vectors1[i]
+        vector2 = filt_vectors2[i]
+        operation = my_config.op_code
+        rounding_mode = "X"
+        flags = "XX"
+        # use name to create our new tv
+        dest_file = open("{}cvw_{}_{}.tv".format(dest_dir, my_config.bits, vector1[:-2]), 'a')
+        # open vectors
+        src_file1 = open(source_dir1 + vector1,'r')
+        src_file2 = open(source_dir2 + vector2,'r')
+        # for each test in the vector
+        reading = True
+        src_file2.readline() #skip first bc junk
+        # print(my_config.bits, my_config.letter)
+        if my_config.letter == "F" and my_config.bits == 64:
+            reading = True
+            # print("trigger 64F")
+            #skip first 2 lines bc junk
+            src_file2.readline()
+            while reading:
+                # get answer and flags from Ref...signature
+                # answers are before deadbeef (first line of 4)
+                # flags are after deadbeef (third line of 4)
+                answer = src_file2.readline().strip()
+                deadbeef = src_file2.readline().strip()
+                # print(answer)
+                if not (answer == "e7d4b281" and deadbeef == "6f5ca309"): # if there is still stuff to read
+                    # get flags
+                    packed = src_file2.readline().strip()[6:]
+                    flags, rounding_mode = unpack_rf(packed)
+                    # skip 00000000 buffer
+                    src_file2.readline()
+
+                    # parse through .S file
+                    detected = False
+                    done = False
+                    op1val = "0"
+                    op2val = "0"
+                    while not (detected or done):
+                        # print("det1")
+                        line = src_file1.readline()
+                        # print(line)
+                        if "op1val" in line:
+                            # print("det2")
+                            # parse line
+                            op1val = line.split("op1val")[1].split("x")[1].split(";")[0]
+                            if my_config.op != "fsqrt": # sqrt doesn't have two input vals
+                                op2val = line.split("op2val")[1].split("x")[1].strip()
+                                if op2val[-1] == ";": op2val = op2val[:-1] # remove ; if it's there
+                            else:
+                                op2val = 32*"X"
+                            # go to next test in vector
+                            detected = True
+                        elif "RVTEST_CODE_END" in line:
+                            done = True
+                    # put it all together
+                    if not done:
+                        translation = "{}_{}_{}_{}_{}_{}".format(operation, ext_bits(op1val), ext_bits(op2val), ext_bits(answer.strip()), flags, rounding_mode)
+                        dest_file.write(translation + "\n")
+                else:
+                    # print("read false")
+                    reading = False
+        elif my_config.letter == "M" and my_config.bits == 64:
+            reading = True
+            #skip first 2 lines bc junk
+            src_file2.readline()
+            while reading:
+                # print("trigger 64M")
+                # get answer from Ref...signature
+                # answers span two lines and are reversed
+                answer2 = src_file2.readline().strip()
+                answer1 = src_file2.readline().strip()
+                answer = answer1 + answer2
+                # print(answer1,answer2)
+                if not (answer2 == "e7d4b281" and answer1 == "6f5ca309"): # if there is still stuff to read
+                    # parse through .S file
+                    detected = False
+                    done = False
+                    op1val = "0"
+                    op2val = "0"
+                    while not (detected or done):
+                        # print("det1")
+                        line = src_file1.readline()
+                        # print(line)
+                        if "op1val" in line:
+                            # print("det2")
+                            # parse line
+                            op1val = line.split("op1val")[1].split("x")[1].split(";")[0]
+                            if "-" in line.split("op1val")[1].split("x")[0]: # neg sign handling
+                                op1val = twos_comp(my_config.bits, op1val)
+                            if my_config.op != "fsqrt": # sqrt doesn't have two input vals, unnec here but keeping for later
+                                op2val = line.split("op2val")[1].split("x")[1].strip()
+                                if op2val[-1] == ";": op2val = op2val[:-1] # remove ; if it's there
+                                if "-" in line.split("op2val")[1].split("x")[0]: # neg sign handling
+                                    op2val = twos_comp(my_config.bits, op2val)
+                            # go to next test in vector
+                            detected = True
+                        elif "RVTEST_CODE_END" in line:
+                            done = True
+                    # ints don't have flags
+                    flags = "XX"
+                    # put it all together
+                    if not done:
+                        translation = "{}_{}_{}_{}_{}_{}".format(operation, ext_bits(op1val), ext_bits(op2val), ext_bits(answer.strip()), flags.strip(), rounding_mode)
+                        dest_file.write(translation + "\n")
+                else:
+                    # print("read false")
+                    reading = False
+        else:
+            while reading:
+                # get answer and flags from Ref...signature
+                answer = src_file2.readline()
+                # print(answer)
+                packed = src_file2.readline()[6:]
+                # print(packed)
+                if len(packed.strip())>0: # if there is still stuff to read
+                    # print("packed")
+                    # parse through .S file
+                    detected = False
+                    done = False
+                    op1val = "0"
+                    op2val = "0"
+                    while not (detected or done):
+                        # print("det1")
+                        line = src_file1.readline()
+                        # print(line)
+                        if "op1val" in line:
+                            # print("det2")
+                            # parse line
+                            op1val = line.split("op1val")[1].split("x")[1].split(";")[0]
+                            if "-" in line.split("op1val")[1].split("x")[0]: # neg sign handling
+                                op1val = twos_comp(my_config.bits, op1val)
+                            if my_config.op != "fsqrt": # sqrt doesn't have two input vals
+                                op2val = line.split("op2val")[1].split("x")[1].strip()
+                                if op2val[-1] == ";": op2val = op2val[:-1] # remove ; if it's there
+                                if "-" in line.split("op2val")[1].split("x")[0]: # neg sign handling
+                                    op2val = twos_comp(my_config.bits, op2val)
+                            # go to next test in vector
+                            detected = True
+                        elif "RVTEST_CODE_END" in line:
+                            done = True
+                    # rounding mode for float
+                    if not done and (my_config.op == "fsqrt" or my_config.op == "fdiv"):
+                        flags, rounding_mode = unpack_rf(packed)
+                    
+                    # put it all together
+                    if not done:
+                        translation = "{}_{}_{}_{}_{}_{}".format(operation, ext_bits(op1val), ext_bits(op2val), ext_bits(answer.strip()), flags, rounding_mode)
+                        dest_file.write(translation + "\n")
+                else:
+                    # print("read false")
+                    reading = False
+        print("out")
+        dest_file.close()
+        src_file1.close()
+        src_file2.close()
+
+config_list = [
+Config(32, "M", "div", "div_", 0),
+Config(32, "F", "fdiv", "fdiv", 1),
+Config(32, "F", "fsqrt", "fsqrt", 2),
+Config(32, "M", "rem", "rem-", 3),
+Config(32, "M", "divu", "divu-", 4),
+Config(32, "M", "remu", "remu-", 5),
+Config(64, "M", "div", "div-", 0),
+Config(64, "F", "fdiv", "fdiv", 1),
+Config(64, "F", "fsqrt", "fsqrt", 2),
+Config(64, "M", "rem", "rem-", 3),
+Config(64, "M", "divu", "divu-", 4),
+Config(64, "M", "remu", "remu-", 5),
+Config(64, "M", "divw", "divw-", 6),
+Config(64, "M", "divuw", "divuw-", 7),
+Config(64, "M", "remw", "remw-", 8),
+Config(64, "M", "remuw", "remuw-", 9)
+]
+
+for c in config_list:
+    create_vectors(c)
\ No newline at end of file
diff --git a/tests/fp/combined_IF_vectors/extract_testfloat_vectors.py b/tests/fp/combined_IF_vectors/extract_testfloat_vectors.py
new file mode 100755
index 00000000..07047be2
--- /dev/null
+++ b/tests/fp/combined_IF_vectors/extract_testfloat_vectors.py
@@ -0,0 +1,79 @@
+#! /usr/bin/python3
+# extract sqrt and float div testfloat vectors
+
+# author: Alessandro Maiuolo
+# contact: amaiuolo@g.hmc.edu
+# date created: 3-29-2023
+
+import os
+wally = os.popen('echo $WALLY').read().strip()
+# print(wally)
+
+def ext_bits(my_string):
+    target_len = 32 # we want 128 bits, div by 4 bc hex notation
+    zeroes_to_add = target_len - len(my_string)
+    return zeroes_to_add*"0" + my_string
+
+# rounding mode dictionary
+round_dict = {
+    "rne":"0",
+    "rnm":"4",
+    "ru":"3",
+    "rz":"1",
+    "rd":"2",
+    "dyn":"7"
+}
+
+
+print("creating testfloat div test vectors")
+
+source_dir = "{}/tests/fp/vectors/".format(wally)
+dest_dir = "{}/tests/fp/combined_IF_vectors/IF_vectors/".format(wally)
+all_vectors = os.listdir(source_dir)
+
+div_vectors = [v for v in all_vectors if "div" in v]
+
+# iterate through all float div vectors
+for vector in div_vectors:
+    # use name to determine configs
+    config_list = vector.split(".")[0].split("_")
+    operation = "1" #float div
+    rounding_mode = round_dict[str(config_list[2])]
+    # use name to create our new tv
+    dest_file = open(dest_dir + "cvw_" + vector, 'a')
+    # open vector
+    src_file = open(source_dir + vector,'r')
+    # for each test in the vector
+    for i in src_file.readlines():
+        translation = "" # this stores the test that we are currently working on
+        [input_1, input_2, answer, flags] = i.split("_") # separate inputs, answer, and flags
+        # put it all together, strip nec for removing \n on the end of the flags
+        translation = "{}_{}_{}_{}_{}_{}".format(operation, ext_bits(input_1), ext_bits(input_2), ext_bits(answer), flags.strip(), rounding_mode)
+        dest_file.write(translation + "\n")
+    dest_file.close()
+    src_file.close()
+
+
+print("creating testfloat sqrt test vectors")
+
+sqrt_vectors = [v for v in all_vectors if "sqrt" in v]
+
+# iterate through all float div vectors
+for vector in sqrt_vectors:
+    # use name to determine configs
+    config_list = vector.split(".")[0].split("_")
+    operation = "2" #sqrt
+    rounding_mode = round_dict[str(config_list[2])]
+    # use name to create our new tv
+    dest_file = open(dest_dir + "cvw_" + vector, 'a')
+    # open vector
+    src_file = open(source_dir + vector,'r')
+    # for each test in the vector
+    for i in src_file.readlines():
+        translation = "" # this stores the test that we are currently working on
+        [input_1, answer, flags] = i.split("_") # separate inputs, answer, and flags
+        # put it all together, strip nec for removing \n on the end of the flags
+        translation = "{}_{}_{}_{}_{}_{}".format(operation, ext_bits(input_1), "X"*32, ext_bits(answer), flags.strip(), rounding_mode)
+        dest_file.write(translation + "\n")
+    dest_file.close()
+    src_file.close()
\ No newline at end of file
diff --git a/tests/fp/create_all_vectors.sh b/tests/fp/create_all_vectors.sh
index f1ba3625..38cfd555 100755
--- a/tests/fp/create_all_vectors.sh
+++ b/tests/fp/create_all_vectors.sh
@@ -3,3 +3,6 @@
 mkdir -p vectors
 ./create_vectors.sh
 ./remove_spaces.sh
+
+# to create tvs for evaluation of combined IFdivsqrt
+#./combined_IF_vectors/create_IF_vectors.sh
\ No newline at end of file

From 132074523faa7ea5e5eafe5a22060f320911c3f9 Mon Sep 17 00:00:00 2001
From: Alec Vercruysse <vercruysse.alec@gmail.com>
Date: Thu, 30 Mar 2023 10:32:40 -0700
Subject: [PATCH 3/7] Make entire cache write path conditional on
 READ_ONLY_CACHE

---
 src/cache/cache.sv | 21 +++++++++++----------
 1 file changed, 11 insertions(+), 10 deletions(-)

diff --git a/src/cache/cache.sv b/src/cache/cache.sv
index 3dac0c56..56044384 100644
--- a/src/cache/cache.sv
+++ b/src/cache/cache.sv
@@ -96,8 +96,7 @@ module cache #(parameter LINELEN,  NUMLINES,  NUMWAYS, LOGBWPL, WORDLEN, MUXINTE
   logic [LINELEN-1:0]            ReadDataLine, ReadDataLineCache;
   logic                          SelFetchBuffer;
   logic                          CacheEn;
-  logic [CACHEWORDSPERLINE-1:0]  MemPAdrDecoded;
-  logic [LINELEN/8-1:0]          LineByteMask, DemuxedByteMask, FetchBufferByteSel;
+  logic [LINELEN/8-1:0]          LineByteMask;
   logic [$clog2(LINELEN/8) - $clog2(MUXINTERVAL/8) - 1:0] WordOffsetAddr;
 
   genvar                         index;
@@ -161,15 +160,17 @@ module cache #(parameter LINELEN,  NUMLINES,  NUMWAYS, LOGBWPL, WORDLEN, MUXINTE
   /////////////////////////////////////////////////////////////////////////////////////////////
   // Write Path
   /////////////////////////////////////////////////////////////////////////////////////////////
-
-  // Adjust byte mask from word to cache line
-  onehotdecoder #(LOGCWPL) adrdec(.bin(PAdr[LOGCWPL+LOGLLENBYTES-1:LOGLLENBYTES]), .decoded(MemPAdrDecoded));
-  for(index = 0; index < 2**LOGCWPL; index++) begin
-    assign DemuxedByteMask[(index+1)*(WORDLEN/8)-1:index*(WORDLEN/8)] = MemPAdrDecoded[index] ? ByteMask : '0;
-  end
-  assign FetchBufferByteSel = SetValid & ~SetDirty ? '1 : ~DemuxedByteMask;  // If load miss set all muxes to 1.
-
   if(!READ_ONLY_CACHE) begin:WriteSelLogic
+    logic [CACHEWORDSPERLINE-1:0]  MemPAdrDecoded;
+    logic [LINELEN/8-1:0]          DemuxedByteMask, FetchBufferByteSel;
+
+    // Adjust byte mask from word to cache line
+    onehotdecoder #(LOGCWPL) adrdec(.bin(PAdr[LOGCWPL+LOGLLENBYTES-1:LOGLLENBYTES]), .decoded(MemPAdrDecoded));
+    for(index = 0; index < 2**LOGCWPL; index++) begin
+       assign DemuxedByteMask[(index+1)*(WORDLEN/8)-1:index*(WORDLEN/8)] = MemPAdrDecoded[index] ? ByteMask : '0;
+    end
+    assign FetchBufferByteSel = SetValid & ~SetDirty ? '1 : ~DemuxedByteMask;  // If load miss set all muxes to 1.
+
     // Merge write data into fetched cache line for store miss
     for(index = 0; index < LINELEN/8; index++) begin
        mux2 #(8) WriteDataMux(.d0(CacheWriteData[(8*index)%WORDLEN+7:(8*index)%WORDLEN]),

From 3815b7117b03502ef5a43a15208d5e1732cd4c7f Mon Sep 17 00:00:00 2001
From: Alexa Wright <acwright@hmc.edu>
Date: Sat, 1 Apr 2023 16:02:23 -0700
Subject: [PATCH 4/7] Added tests for writing and reading to HPMCOUNTERM csrs

---
 tests/coverage/priv.S | 46 ++++++++++++++++++++++++++++++++++++++++++-
 1 file changed, 45 insertions(+), 1 deletion(-)

diff --git a/tests/coverage/priv.S b/tests/coverage/priv.S
index 8cd18925..7382d331 100644
--- a/tests/coverage/priv.S
+++ b/tests/coverage/priv.S
@@ -42,5 +42,49 @@ main:
     csrw scause, t0
     csrw sepc, t0
     csrw stimecmp, t0
-    
+
+    # Switch to machine mode
+    li a0, 3   
+    ecall 
+    # Testing the HPMCOUNTERM performance counter: writing
+    # Base address is 2816 (MHPMCOUNTERBASE)
+    # There are 32 HPMCOUNTER registers
+    csrw 2816, t0
+    csrw 2817, t0
+    csrw 2818, t0
+    csrw 2819, t0
+    csrw 2820, t0
+    csrw 2821, t0
+    csrw 2822, t0
+    csrw 2823, t0
+    csrw 2824, t0
+    csrw 2825, t0
+    csrw 2826, t0
+    csrw 2827, t0
+    csrw 2828, t0
+    csrw 2829, t0
+    csrw 2830, t0
+    csrw 2831, t0  
+    csrw 2832, t0
+    csrw 2833, t0
+    csrw 2834, t0
+    csrw 2835, t0
+    csrw 2836, t0
+    csrw 2837, t0
+    csrw 2838, t0
+    csrw 2839, t0
+    csrw 2840, t0
+    csrw 2841, t0
+    csrw 2842, t0
+    csrw 2843, t0
+    csrw 2844, t0
+    csrw 2845, t0
+    csrw 2846, t0
+    csrw 2847, t0      
+
+    # Testing the HPMCOUNTERM performance counter: reading
+    csrr t0, 2817
     j done
+
+
+

From e3f3f1421673a7c0016ad81f936df7f61620ac58 Mon Sep 17 00:00:00 2001
From: James Stine <james.stine@okstate.edu>
Date: Sun, 2 Apr 2023 18:16:23 -0500
Subject: [PATCH 5/7] Update one bug in testfloat - still have to fix fpdiv but
 others should now all work

---
 testbench/testbench-fp.sv | 309 +++++++++++++++++++-------------------
 1 file changed, 155 insertions(+), 154 deletions(-)

diff --git a/testbench/testbench-fp.sv b/testbench/testbench-fp.sv
index d1f6f9b6..f250e803 100644
--- a/testbench/testbench-fp.sv
+++ b/testbench/testbench-fp.sv
@@ -1,7 +1,8 @@
-///////////////////////////////////////////
+<///////////////////////////////////////////
 //
 // Written: me@KatherineParry.com
 // Modified: 7/5/2022
+// Modified: 4/2/2023
 //
 // Purpose: Testbench for Testfloat
 // 
@@ -32,75 +33,74 @@
 module testbenchfp;
   parameter TEST="none";
 
-  string      Tests[];        // list of tests to be run
-  logic [2:0] OpCtrl[];       // list of op controls
-  logic [2:0] Unit[];         // list of units being tested
-  logic WriteInt[];           // Is being written to integer resgiter
-  logic [2:0] Frm[4:0] = {3'b100, 3'b010, 3'b011, 3'b001, 3'b000}; // rounding modes: rne-000, rz-001, ru-011, rd-010, rnm-100
-  logic [1:0] Fmt[];          // list of formats for the other units
-  
+  string                       Tests[];        // list of tests to be run
+  logic [2:0]                  OpCtrl[];       // list of op controls
+  logic [2:0]                  Unit[];         // list of units being tested
+  logic                        WriteInt[];           // Is being written to integer resgiter
+  logic [2:0]                  Frm[4:0] = {3'b100, 3'b010, 3'b011, 3'b001, 3'b000}; // rounding modes: rne-000, rz-001, ru-011, rd-010, rnm-100
+  logic [1:0]                  Fmt[];          // list of formats for the other units  
 
-  logic               clk=0;
-  logic [31:0]        TestNum=0;    // index for the test
-  logic [31:0]        OpCtrlNum=0;  // index for OpCtrl
-  logic [31:0]        errors=0;     // how many errors
-  logic [31:0]        VectorNum=0;  // index for test vector
-  logic [31:0]        FrmNum=0;     // index for rounding mode
-  logic [`FLEN*4+7:0] TestVectors[8388609:0];     // list of test vectors
+  logic                        clk=0;
+  logic [31:0]                 TestNum=0;    // index for the test
+  logic [31:0]                 OpCtrlNum=0;  // index for OpCtrl
+  logic [31:0]                 errors=0;     // how many errors
+  logic [31:0]                 VectorNum=0;  // index for test vector
+  logic [31:0]                 FrmNum=0;     // index for rounding mode
+  logic [`FLEN*4+7:0]          TestVectors[8388609:0];     // list of test vectors
 
-  logic [1:0]           FmtVal;          // value of the current Fmt
-  logic [2:0]           UnitVal, OpCtrlVal, FrmVal; // value of the currnet Unit/OpCtrl/FrmVal
-  logic                 WriteIntVal;                // value of the current WriteInt
-  logic [`FLEN-1:0]     X, Y, Z;                    // inputs read from TestFloat
-  logic [`XLEN-1:0]     SrcA;                       // integer input
-  logic [`FLEN-1:0]	    Ans;                        // correct answer from TestFloat
-  logic [`FLEN-1:0]	    Res;                        // result from other units
-  logic [4:0]	 	        AnsFlg;                     // correct flags read from testfloat
-  logic [4:0]	 	        ResFlg, Flg;                // Result flags
-  logic	[`FMTBITS-1:0]  ModFmt;                     // format - 10 = half, 00 = single, 01 = double, 11 = quad
-  logic [`FLEN-1:0]     FpRes, FpCmpRes;            // Results from each unit
-  logic [`XLEN-1:0]     IntRes, CmpRes;             // Results from each unit
-  logic [4:0]           FmaFlg, CvtFlg, DivFlg, CmpFlg;  // Outputed flags
-  logic                 AnsNaN, ResNaN, NaNGood;
-  logic                 Xs, Ys, Zs;                 // sign of the inputs
-  logic [`NE-1:0]       Xe, Ye, Ze;                 // exponent of the inputs
-  logic [`NF:0]         Xm, Ym, Zm;                 // mantissas of the inputs
-  logic                 XNaN, YNaN, ZNaN;           // is the input NaN
-  logic                 XSNaN, YSNaN, ZSNaN;        // is the input a signaling NaN
-  logic                 XSubnorm, ZSubnorm;           // is the input denormalized
-  logic                 XInf, YInf, ZInf;           // is the input infinity
-  logic                 XZero, YZero, ZZero;        // is the input zero
-  logic                 XExpMax, YExpMax, ZExpMax;  // is the input's exponent all ones  
-  logic  [`CVTLEN-1:0]  CvtLzcInE;                  // input to the Leading Zero Counter (priority encoder)
-  logic                 IntZero;
-  logic                 CvtResSgnE;
-  logic [`NE:0]         CvtCalcExpE;    // the calculated expoent
-	logic [`LOGCVTLEN-1:0] CvtShiftAmtE;  // how much to shift by
-	logic [`DIVb:0]       Quot;
-  logic                 CvtResSubnormUfE;
-  logic                 DivStart, FDivBusyE, OldFDivBusyE;
-  logic                 reset = 1'b0;
-  logic [$clog2(`NF+2)-1:0] XZeroCnt, YZeroCnt;
-  logic [`DURLEN-1:0]   Dur;
+  logic [1:0]                  FmtVal;          // value of the current Fmt
+  logic [2:0]                  UnitVal, OpCtrlVal, FrmVal; // value of the currnet Unit/OpCtrl/FrmVal
+  logic                        WriteIntVal;                // value of the current WriteInt
+  logic [`FLEN-1:0]            X, Y, Z;                    // inputs read from TestFloat
+  logic [`XLEN-1:0]            SrcA;                       // integer input
+  logic [`FLEN-1:0]	       Ans;                        // correct answer from TestFloat
+  logic [`FLEN-1:0]	       Res;                        // result from other units
+  logic [4:0]	 	       AnsFlg;                     // correct flags read from testfloat
+  logic [4:0]	 	       ResFlg, Flg;                // Result flags
+  logic	[`FMTBITS-1:0]         ModFmt;                     // format - 10 = half, 00 = single, 01 = double, 11 = quad
+  logic [`FLEN-1:0]            FpRes, FpCmpRes;            // Results from each unit
+  logic [`XLEN-1:0]            IntRes, CmpRes;             // Results from each unit
+  logic [4:0]                  FmaFlg, CvtFlg, DivFlg, CmpFlg;  // Outputed flags
+  logic                        AnsNaN, ResNaN, NaNGood;
+  logic                        Xs, Ys, Zs;                 // sign of the inputs
+  logic [`NE-1:0]              Xe, Ye, Ze;                 // exponent of the inputs
+  logic [`NF:0]                Xm, Ym, Zm;                 // mantissas of the inputs
+  logic                        XNaN, YNaN, ZNaN;           // is the input NaN
+  logic                        XSNaN, YSNaN, ZSNaN;        // is the input a signaling NaN
+  logic                        XSubnorm, ZSubnorm;           // is the input denormalized
+  logic                        XInf, YInf, ZInf;           // is the input infinity
+  logic                        XZero, YZero, ZZero;        // is the input zero
+  logic                        XExpMax, YExpMax, ZExpMax;  // is the input's exponent all ones  
+  logic  [`CVTLEN-1:0]         CvtLzcInE;                  // input to the Leading Zero Counter (priority encoder)
+  logic                        IntZero;
+  logic                        CvtResSgnE;
+  logic [`NE:0]                CvtCalcExpE;    // the calculated expoent
+  logic [`LOGCVTLEN-1:0]       CvtShiftAmtE;  // how much to shift by
+  logic [`DIVb:0]              Quot;
+  logic                        CvtResSubnormUfE;
+  logic                        DivStart, FDivBusyE, OldFDivBusyE;
+  logic                        reset = 1'b0;
+  logic [$clog2(`NF+2)-1:0]    XZeroCnt, YZeroCnt;
+  logic [`DURLEN-1:0]          Dur;
 
   // in-between FMA signals
-  logic                 Mult;
-  logic                 Ss;
-  logic [`NE+1:0]	      Pe;
-  logic [`NE+1:0]	      Se;
-  logic 				        ASticky;
-  logic 					      KillProd; 
-  logic [$clog2(3*`NF+5)-1:0]	SCnt;
-  logic [3*`NF+3:0]	    Sm;       
-  logic 			          InvA;
-  logic 			          NegSum;
-  logic 			          As;
-  logic 			          Ps;
-  logic                 DivSticky;
-  logic                 DivDone;
-  logic                 DivNegSticky;
-  logic [`NE+1:0]       DivCalcExp;
-  logic                 divsqrtop;
+  logic                        Mult;
+  logic                        Ss;
+  logic [`NE+1:0]	       Pe;
+  logic [`NE+1:0]	       Se;
+  logic 		       ASticky;
+  logic 		       KillProd; 
+  logic [$clog2(3*`NF+5)-1:0]  SCnt;
+  logic [3*`NF+3:0]	       Sm;       
+  logic 		       InvA;
+  logic 		       NegSum;
+  logic 		       As;
+  logic 		       Ps;
+  logic                        DivSticky;
+  logic                        DivDone;
+  logic                        DivNegSticky;
+  logic [`NE+1:0]              DivCalcExp;
+  logic                        divsqrtop;
 
 
   ///////////////////////////////////////////////////////////////////////////////////////////////
@@ -126,28 +126,28 @@ module testbenchfp;
     $display("TEST is %s", TEST);
     if (`Q_SUPPORTED) begin // if Quad percision is supported
       if (TEST === "cvtint"| TEST === "all") begin  // if testing integer conversion
-                                              // add the 128-bit cvtint tests to the to-be-tested list
-                                              Tests = {Tests, f128rv32cvtint};
-                                              // add the op-codes for these tests to the op-code list
-                                              OpCtrl = {OpCtrl, `FROM_UI_OPCTRL, `FROM_I_OPCTRL, `TO_UI_OPCTRL, `TO_I_OPCTRL};
-                                              WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
-                                              // add what unit is used and the fmt to their lists (one for each test)
-                                              for(int i = 0; i<20; i++) begin
-                                                Unit = {Unit, `CVTINTUNIT};
-                                                Fmt = {Fmt, 2'b11};
-                                              end
-                                              if (`XLEN == 64) begin // if 64-bit integers are supported add their conversions
-                                                Tests = {Tests, f128rv64cvtint};
-                                              // add the op-codes for these tests to the op-code list
-                                                OpCtrl = {OpCtrl, `FROM_UL_OPCTRL, `FROM_L_OPCTRL, `TO_UL_OPCTRL, `TO_L_OPCTRL};
-                                                WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
-                                              // add what unit is used and the fmt to their lists (one for each test)
-                                              for(int i = 0; i<20; i++) begin
-                                                Unit = {Unit, `CVTINTUNIT};
-                                                Fmt = {Fmt, 2'b11};
-                                              end
-                                              end
-                                            end
+         // add the 128-bit cvtint tests to the to-be-tested list
+         Tests = {Tests, f128rv32cvtint};
+         // add the op-codes for these tests to the op-code list
+         OpCtrl = {OpCtrl, `FROM_UI_OPCTRL, `FROM_I_OPCTRL, `TO_UI_OPCTRL, `TO_I_OPCTRL};
+         WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
+         // add what unit is used and the fmt to their lists (one for each test)
+         for(int i = 0; i<20; i++) begin
+            Unit = {Unit, `CVTINTUNIT};
+            Fmt = {Fmt, 2'b11};
+         end
+         if (`XLEN == 64) begin // if 64-bit integers are supported add their conversions
+            Tests = {Tests, f128rv64cvtint};
+            // add the op-codes for these tests to the op-code list
+            OpCtrl = {OpCtrl, `FROM_UL_OPCTRL, `FROM_L_OPCTRL, `TO_UL_OPCTRL, `TO_L_OPCTRL};
+            WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
+            // add what unit is used and the fmt to their lists (one for each test)
+            for(int i = 0; i<20; i++) begin
+               Unit = {Unit, `CVTINTUNIT};
+               Fmt = {Fmt, 2'b11};
+            end
+         end
+      end
       if (TEST === "cvtfp" | TEST === "all") begin  // if the floating-point conversions are being tested
         if(`D_SUPPORTED) begin // if double precision is supported
           // add the 128 <-> 64 bit conversions to the to-be-tested list
@@ -270,27 +270,27 @@ module testbenchfp;
     end
     if (`D_SUPPORTED) begin // if double precision is supported
       if (TEST === "cvtint"| TEST === "all") begin // if integer conversion is being tested
-                                              Tests = {Tests, f64rv32cvtint};
-                                              // add the op-codes for these tests to the op-code list
-                                              OpCtrl = {OpCtrl, `FROM_UI_OPCTRL, `FROM_I_OPCTRL, `TO_UI_OPCTRL, `TO_I_OPCTRL};
-                                              WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
-                                              // add what unit is used and the fmt to their lists (one for each test)
-                                              for(int i = 0; i<20; i++) begin
-                                                Unit = {Unit, `CVTINTUNIT};
-                                                Fmt = {Fmt, 2'b01};
-                                              end
-                                              if (`XLEN == 64) begin // if 64-bit integers are being supported
-                                                Tests = {Tests, f64rv64cvtint};
-                                                // add the op-codes for these tests to the op-code list
-                                                OpCtrl = {OpCtrl, `FROM_UL_OPCTRL, `FROM_L_OPCTRL, `TO_UL_OPCTRL, `TO_L_OPCTRL};
-                                                WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
-                                                // add what unit is used and the fmt to their lists (one for each test)
-                                                for(int i = 0; i<20; i++) begin
-                                                  Unit = {Unit, `CVTINTUNIT};
-                                                  Fmt = {Fmt, 2'b01};
-                                                end
-                                              end
-                                            end
+         Tests = {Tests, f64rv32cvtint};
+         // add the op-codes for these tests to the op-code list
+         OpCtrl = {OpCtrl, `FROM_UI_OPCTRL, `FROM_I_OPCTRL, `TO_UI_OPCTRL, `TO_I_OPCTRL};
+         WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
+         // add what unit is used and the fmt to their lists (one for each test)
+         for(int i = 0; i<20; i++) begin
+            Unit = {Unit, `CVTINTUNIT};
+            Fmt = {Fmt, 2'b01};
+         end
+         if (`XLEN == 64) begin // if 64-bit integers are being supported
+            Tests = {Tests, f64rv64cvtint};
+            // add the op-codes for these tests to the op-code list
+            OpCtrl = {OpCtrl, `FROM_UL_OPCTRL, `FROM_L_OPCTRL, `TO_UL_OPCTRL, `TO_L_OPCTRL};
+            WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
+            // add what unit is used and the fmt to their lists (one for each test)
+            for(int i = 0; i<20; i++) begin
+               Unit = {Unit, `CVTINTUNIT};
+               Fmt = {Fmt, 2'b01};
+            end
+         end
+      end
       if (TEST === "cvtfp" | TEST === "all") begin // if floating point conversions are being tested
         if(`F_SUPPORTED) begin // if single precision is supported
           // add the 64 <-> 32 bit conversions to the to-be-tested list
@@ -397,27 +397,27 @@ module testbenchfp;
     end
     if (`F_SUPPORTED) begin // if single precision being supported
       if (TEST === "cvtint"| TEST === "all") begin // if integer conversion is being tested
-                                              Tests = {Tests, f32rv32cvtint};
-                                              // add the op-codes for these tests to the op-code list
-                                              OpCtrl = {OpCtrl, `FROM_UI_OPCTRL, `FROM_I_OPCTRL, `TO_UI_OPCTRL, `TO_I_OPCTRL};
-                                              WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
-                                              // add what unit is used and the fmt to their lists (one for each test)
-                                              for(int i = 0; i<20; i++) begin
-                                                Unit = {Unit, `CVTINTUNIT};
-                                                Fmt = {Fmt, 2'b00};
-                                              end
-                                              if (`XLEN == 64) begin // if 64-bit integers are supported
-                                                Tests = {Tests, f32rv64cvtint};
-                                                // add the op-codes for these tests to the op-code list
-                                                OpCtrl = {OpCtrl, `FROM_UL_OPCTRL, `FROM_L_OPCTRL, `TO_UL_OPCTRL, `TO_L_OPCTRL};
-                                                WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
-                                                // add what unit is used and the fmt to their lists (one for each test)
-                                              for(int i = 0; i<20; i++) begin
-                                                Unit = {Unit, `CVTINTUNIT};
-                                                Fmt = {Fmt, 2'b00};
-                                              end
-                                              end
-                                            end
+         Tests = {Tests, f32rv32cvtint};
+         // add the op-codes for these tests to the op-code list
+         OpCtrl = {OpCtrl, `FROM_UI_OPCTRL, `FROM_I_OPCTRL, `TO_UI_OPCTRL, `TO_I_OPCTRL};
+         WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
+         // add what unit is used and the fmt to their lists (one for each test)
+         for(int i = 0; i<20; i++) begin
+            Unit = {Unit, `CVTINTUNIT};
+            Fmt = {Fmt, 2'b00};
+         end
+         if (`XLEN == 64) begin // if 64-bit integers are supported
+            Tests = {Tests, f32rv64cvtint};
+            // add the op-codes for these tests to the op-code list
+            OpCtrl = {OpCtrl, `FROM_UL_OPCTRL, `FROM_L_OPCTRL, `TO_UL_OPCTRL, `TO_L_OPCTRL};
+            WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
+            // add what unit is used and the fmt to their lists (one for each test)
+            for(int i = 0; i<20; i++) begin
+               Unit = {Unit, `CVTINTUNIT};
+               Fmt = {Fmt, 2'b00};
+            end
+         end
+      end
       if (TEST === "cvtfp" | TEST === "all") begin  // if floating point conversion is being tested
         if(`ZFH_SUPPORTED) begin 
           // add the 32 <-> 16 bit conversions to the to-be-tested list
@@ -508,27 +508,27 @@ module testbenchfp;
     end
     if (`ZFH_SUPPORTED) begin // if half precision supported
       if (TEST === "cvtint"| TEST === "all") begin // if in conversions are being tested
-                                              Tests = {Tests, f16rv32cvtint};
-                                              // add the op-codes for these tests to the op-code list
-                                              OpCtrl = {OpCtrl, `FROM_UI_OPCTRL, `FROM_I_OPCTRL, `TO_UI_OPCTRL, `TO_I_OPCTRL};
-                                              WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
-                                              // add what unit is used and the fmt to their lists (one for each test)
-                                              for(int i = 0; i<20; i++) begin
-                                                Unit = {Unit, `CVTINTUNIT};
-                                                Fmt = {Fmt, 2'b10};
-                                              end
-                                              if (`XLEN == 64) begin // if 64-bit integers are supported
-                                                Tests = {Tests, f16rv64cvtint};
-                                                // add the op-codes for these tests to the op-code list
-                                                OpCtrl = {OpCtrl, `FROM_UL_OPCTRL, `FROM_L_OPCTRL, `TO_UL_OPCTRL, `TO_L_OPCTRL};
-                                                WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
-                                                // add what unit is used and the fmt to their lists (one for each test)
-                                                for(int i = 0; i<20; i++) begin
-                                                  Unit = {Unit, `CVTINTUNIT};
-                                                  Fmt = {Fmt, 2'b10};
-                                                end
-                                              end
-                                            end
+         Tests = {Tests, f16rv32cvtint};
+         // add the op-codes for these tests to the op-code list
+         OpCtrl = {OpCtrl, `FROM_UI_OPCTRL, `FROM_I_OPCTRL, `TO_UI_OPCTRL, `TO_I_OPCTRL};
+         WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
+         // add what unit is used and the fmt to their lists (one for each test)
+         for(int i = 0; i<20; i++) begin
+            Unit = {Unit, `CVTINTUNIT};
+            Fmt = {Fmt, 2'b10};
+         end
+         if (`XLEN == 64) begin // if 64-bit integers are supported
+            Tests = {Tests, f16rv64cvtint};
+            // add the op-codes for these tests to the op-code list
+            OpCtrl = {OpCtrl, `FROM_UL_OPCTRL, `FROM_L_OPCTRL, `TO_UL_OPCTRL, `TO_L_OPCTRL};
+            WriteInt = {WriteInt, 1'b0, 1'b0, 1'b1, 1'b1};
+            // add what unit is used and the fmt to their lists (one for each test)
+            for(int i = 0; i<20; i++) begin
+               Unit = {Unit, `CVTINTUNIT};
+               Fmt = {Fmt, 2'b10};
+            end
+         end
+      end
       if (TEST === "cmp"   | TEST === "all") begin // if comparisions are being tested
         // add the correct tests/op-ctrls/unit/fmt to their lists
         Tests = {Tests, f16cmp};
@@ -656,7 +656,8 @@ module testbenchfp;
   end
 
   // extract the inputs (X, Y, Z, SrcA) and the output (Ans, AnsFlg) from the current test vector
-  readvectors readvectors          (.clk, .Fmt(FmtVal), .ModFmt, .TestVector(TestVectors[VectorNum]), .VectorNum, .Ans(Ans), .AnsFlg(AnsFlg), .SrcA, 
+  readvectors readvectors          (.clk, .Fmt(FmtVal), .ModFmt, .TestVector(TestVectors[VectorNum]), 
+                                    .VectorNum, .Ans(Ans), .AnsFlg(AnsFlg), .SrcA, 
                                     .Xs, .Ys, .Zs, .Unit(UnitVal),
                                     .Xe, .Ye, .Ze, .TestNum, .OpCtrl(OpCtrlVal),
                                     .Xm, .Ym, .Zm, .DivStart,
@@ -680,7 +681,7 @@ module testbenchfp;
   ///////////////////////////////////////////////////////////////////////////////////////////////
 
   // instantiate devices under test
-  if (TEST === "fma"| TEST === "mul" | TEST === "add" | TEST === "all") begin : fma
+  if (TEST === "fma"| TEST === "mul" | TEST === "add" | TEST === "sub" | TEST === "all") begin : fma
     fma fma(.Xs(Xs), .Ys(Ys), .Zs(Zs), 
             .Xe(Xe), .Ye(Ye), .Ze(Ze), 
             .Xm(Xm), .Ym(Ym), .Zm(Zm),
@@ -1331,4 +1332,4 @@ module readvectors (
                 .Xm, .Ym, .Zm, .XNaN, .YNaN, .ZNaN, .XSNaN, .YSNaN, .ZSNaN,
                 .XSubnorm, .XZero, .YZero, .ZZero, .XInf, .YInf, .ZInf,
                 .XEn, .YEn, .ZEn, .XExpMax);
-endmodule
\ No newline at end of file
+endmodule

From 440e41bb3e32cebeec411cdaa92fab2671bc66f0 Mon Sep 17 00:00:00 2001
From: Sydney Riley <sriley@g.hmc.edu>
Date: Sun, 2 Apr 2023 23:51:34 -0700
Subject: [PATCH 6/7] expanded ifu coverage including 4 added directed tests
 and 1 exclusion, expanded fpu coverage including 6 directed tests and 2
 multiline exclusions.

---
 src/fpu/fctrl.sv      |  9 ++++++++-
 src/ifu/decompress.sv |  6 ++++++
 tests/coverage/fpu.S  | 18 +++++++++++++++++-
 tests/coverage/ifu.S  | 19 ++++++++++++++++++-
 4 files changed, 49 insertions(+), 3 deletions(-)

diff --git a/src/fpu/fctrl.sv b/src/fpu/fctrl.sv
index ad900701..23279bd1 100755
--- a/src/fpu/fctrl.sv
+++ b/src/fpu/fctrl.sv
@@ -146,10 +146,13 @@ module fctrl (
                                                ControlsD = `FCTRLW'b1_0_01_00_000_0_0_0; // fcvt.s.(d/q/h)
                     7'b0100001: if (Rs2D[4:2] == 3'b000  & SupportedFmt2 & Rs2D[1:0] != 2'b01)
                                                ControlsD = `FCTRLW'b1_0_01_00_001_0_0_0; // fcvt.d.(s/h/q)
+                    // coverage off                           
+                    // We are turning off coverage because rv64gc configuration doesn't support quad or half
                     7'b0100010: if (Rs2D[4:2] == 3'b000 & SupportedFmt2 & Rs2D[1:0] != 2'b10)
                                                ControlsD = `FCTRLW'b1_0_01_00_010_0_0_0; // fcvt.h.(s/d/q)
                     7'b0100011: if (Rs2D[4:2] == 3'b000  & SupportedFmt2 & Rs2D[1:0] != 2'b11)
                                                ControlsD = `FCTRLW'b1_0_01_00_011_0_0_0; // fcvt.q.(s/h/d)
+                    // coverage on
                    7'b1101000: case(Rs2D)
                                   5'b00000:    ControlsD = `FCTRLW'b1_0_01_00_101_0_0_0; // fcvt.s.w   w->s
                                   5'b00001:    ControlsD = `FCTRLW'b1_0_01_00_100_0_0_0; // fcvt.s.wu wu->s
@@ -174,6 +177,9 @@ module fctrl (
                                   5'b00010:    ControlsD = `FCTRLW'b0_1_01_00_011_0_0_1; // fcvt.l.d   d->l
                                   5'b00011:    ControlsD = `FCTRLW'b0_1_01_00_010_0_0_1; // fcvt.lu.d  d->lu
                                 endcase
+                    //coverage off
+                    // turning coverage off here because rv64gc configuration does not support floating point halfs and quads
+                    // verified that these branches will not ever be taken in rv64gc configuration.
                     7'b1101010: case(Rs2D)
                                   5'b00000:    ControlsD = `FCTRLW'b1_0_01_00_101_0_0_0; // fcvt.h.w   w->h
                                   5'b00001:    ControlsD = `FCTRLW'b1_0_01_00_100_0_0_0; // fcvt.h.wu wu->h
@@ -197,7 +203,8 @@ module fctrl (
                                   5'b00001:    ControlsD = `FCTRLW'b0_1_01_00_000_0_0_1; // fcvt.wu.q  q->wu
                                   5'b00010:    ControlsD = `FCTRLW'b0_1_01_00_011_0_0_1; // fcvt.l.q   q->l
                                   5'b00011:    ControlsD = `FCTRLW'b0_1_01_00_010_0_0_1; // fcvt.lu.q  q->lu
-                                endcase                            
+                                endcase
+                    // coverage on                            
                   endcase
       endcase
       /* verilator lint_off CASEINCOMPLETE */
diff --git a/src/ifu/decompress.sv b/src/ifu/decompress.sv
index 0ab0e706..b28a9e7b 100644
--- a/src/ifu/decompress.sv
+++ b/src/ifu/decompress.sv
@@ -135,10 +135,16 @@ module decompress (
                       IllegalCompInstrD = 1;
                       InstrD = {16'b0, instr16}; // preserve instruction for mtval on trap
                     end
+                  // coverage off
+                  // are excluding this branch from coverage because in rv64gc XLEN is always 64 and thus greater than 32 bits
+                  // This branch will only be taken if instr16[12:10] == 3'b111 and 'XLEN !> 32, because all other 
+                  // possible values for instr16[12:10] are covered by branches above. XLEN !> 32 
+                  // will never occur in rv64gc so this branch can not be covered
                   else begin // illegal instruction
                     IllegalCompInstrD = 1;
                     InstrD = {16'b0, instr16}; // preserve instruction for mtval on trap
                   end
+                  // coverage on
         5'b01101: InstrD = {immCJ, 5'b00000, 7'b1101111}; // c.j
         5'b01110: InstrD = {immCB[11:5], 5'b00000, rs1p, 3'b000, immCB[4:0], 7'b1100011}; // c.beqz
         5'b01111: InstrD = {immCB[11:5], 5'b00000, rs1p, 3'b001, immCB[4:0], 7'b1100011}; // c.bnez
diff --git a/tests/coverage/fpu.S b/tests/coverage/fpu.S
index 1a2d5ce7..527547bb 100644
--- a/tests/coverage/fpu.S
+++ b/tests/coverage/fpu.S
@@ -55,7 +55,23 @@ main:
     fcvt.l.q a0, ft3
     fcvt.lu.q a0, ft3
 
- 
+
+    // Tests verfying that half and quad floating point convertion instructions are not supported by rv64gc
+    # fcvt.h.d ft3, ft0 // Somehow this instruction is taking the route on line 124
+                      // idea: enable the Q extension for this to work properly? A: Q and halfs not supported in rv64gc
+    # fcvt.h.w ft3, a0
+    # fcvt.w.h a0, ft0
+    # fcvt.q.w ft3, a0
+    # fcvt.w.q a0, ft0
+    # fcvt.q.d ft3, ft0
+
+    .word 0x38007553    // Testing the all False case for 119 - funct7 under, op = 101 0011
+    .word 0x40000053    // Line 145 All False Test case - illegal instruction?
+    .word 0xd0400053    // Line 156 All False Test case - illegal instruction?
+    .word 0xc0400053    // Line 162 All False Test case - illegal instruction?
+    .word 0xd2400053    // Line 168 All False Test case - illegal instruction?
+    .word 0xc2400053    // Line 174 All False Test case - illegal instruction?
+
     # Test illegal instructions are detected
     .word 0x00000007 // illegal floating-point load (bad Funct3)
     .word 0x00000027 // illegal floating-point store (bad Funct3)
diff --git a/tests/coverage/ifu.S b/tests/coverage/ifu.S
index 3ceeeac1..68db3d08 100644
--- a/tests/coverage/ifu.S
+++ b/tests/coverage/ifu.S
@@ -32,9 +32,26 @@ main:
     csrs mstatus, t0
 
     # calling compressed floating point load double instruction
-    //.halfword 0x2000 // CL type compressed floating-point ld-->funct3,imm,rs1',imm,rd',op
+    //.hword 0x2000 // CL type compressed floating-point ld-->funct3,imm,rs1',imm,rd',op
                         // binary version 0000 0000 0000 0000 0010 0000 0000 0000
     mv s0, sp
     c.fld fs0, 0(s0)
+    c.fsd fs0, 0(s0)
+
+    // c.fldsp fs0, 0
+    .hword 0x2002
+
+    // c.fsdsp fs0, 0
+    .hword 0xA002
+
+    # set XLEN to 64
+    li t0, 0x200000000
+    csrs mstatus, t0
+
+    //# Illegal compressed instruction with op = 01, instr[15:10] = 100111, and 0's everywhere else
+    //.hword 0x9C01
+
+    # Illegal compressed instruction 
+    .hword 0x9C41
 
     j done

From 7e5e9d928e2b94ae39b5b86e766b123fad624e0b Mon Sep 17 00:00:00 2001
From: Sydeny <sriley@g.hmc.edu>
Date: Mon, 3 Apr 2023 01:55:23 -0700
Subject: [PATCH 7/7] Manual merge for fctrl.sv, fpu.S, and ifu.S files

---
 src/fpu/fctrl.sv     | 204 ++++++++++++++++++++++---------------------
 tests/coverage/fpu.S |   3 -
 tests/coverage/ifu.S |   7 +-
 3 files changed, 107 insertions(+), 107 deletions(-)

diff --git a/src/fpu/fctrl.sv b/src/fpu/fctrl.sv
index 0c345a49..b3400107 100755
--- a/src/fpu/fctrl.sv
+++ b/src/fpu/fctrl.sv
@@ -100,105 +100,111 @@ module fctrl (
       ControlsD = `FCTRLW'b0_0_00_xx_000_0_1_0; // default: non-implemented instruction
       /* verilator lint_off CASEINCOMPLETE */ // default value above has priority so no other default needed
       case(OpD)
-      7'b0000111: case(Funct3D)
-                    3'b010:                      ControlsD = `FCTRLW'b1_0_10_xx_0xx_0_0_0; // flw
-                    3'b011:  if (`D_SUPPORTED)   ControlsD = `FCTRLW'b1_0_10_xx_0xx_0_0_0; // fld
-                    3'b100:  if (`Q_SUPPORTED)   ControlsD = `FCTRLW'b1_0_10_xx_0xx_0_0_0; // flq
-                    3'b001:  if (`ZFH_SUPPORTED) ControlsD = `FCTRLW'b1_0_10_xx_0xx_0_0_0; // flh
-                  endcase
-      7'b0100111: case(Funct3D)
-                    3'b010:                      ControlsD = `FCTRLW'b0_0_10_xx_0xx_0_0_0; // fsw
-                    3'b011:  if (`D_SUPPORTED)   ControlsD = `FCTRLW'b0_0_10_xx_0xx_0_0_0; // fsd
-                    3'b100:  if (`Q_SUPPORTED)   ControlsD = `FCTRLW'b0_0_10_xx_0xx_0_0_0; // fsq
-                    3'b001:  if (`ZFH_SUPPORTED) ControlsD = `FCTRLW'b0_0_10_xx_0xx_0_0_0; // fsh
-                  endcase
-      7'b1000011:   ControlsD = `FCTRLW'b1_0_01_10_000_0_0_0; // fmadd
-      7'b1000111:   ControlsD = `FCTRLW'b1_0_01_10_001_0_0_0; // fmsub
-      7'b1001011:   ControlsD = `FCTRLW'b1_0_01_10_010_0_0_0; // fnmsub
-      7'b1001111:   ControlsD = `FCTRLW'b1_0_01_10_011_0_0_0; // fnmadd
-      7'b1010011: casez(Funct7D)
-                    7'b00000??: ControlsD = `FCTRLW'b1_0_01_10_110_0_0_0; // fadd
-                    7'b00001??: ControlsD = `FCTRLW'b1_0_01_10_111_0_0_0; // fsub
-                    7'b00010??: ControlsD = `FCTRLW'b1_0_01_10_100_0_0_0; // fmul
-                    7'b00011??: ControlsD = `FCTRLW'b1_0_01_01_xx0_1_0_0; // fdiv
-                    7'b01011??: if (Rs2D == 5'b0000) ControlsD = `FCTRLW'b1_0_01_01_xx1_1_0_0; // fsqrt
-                    7'b00100??: case(Funct3D)
-                                  3'b000:  ControlsD = `FCTRLW'b1_0_00_xx_000_0_0_0; // fsgnj
-                                  3'b001:  ControlsD = `FCTRLW'b1_0_00_xx_001_0_0_0; // fsgnjn
-                                  3'b010:  ControlsD = `FCTRLW'b1_0_00_xx_010_0_0_0; // fsgnjx
-                               endcase
-                    7'b00101??: case(Funct3D)
-                                  3'b000:  ControlsD = `FCTRLW'b1_0_00_xx_110_0_0_0; // fmin
-                                  3'b001:  ControlsD = `FCTRLW'b1_0_00_xx_101_0_0_0; // fmax
-                                endcase
-                    7'b10100??: case(Funct3D)
-                                  3'b010:  ControlsD = `FCTRLW'b0_1_00_xx_010_0_0_0; // feq
-                                  3'b001:  ControlsD = `FCTRLW'b0_1_00_xx_001_0_0_0; // flt
-                                  3'b000:  ControlsD = `FCTRLW'b0_1_00_xx_011_0_0_0; // fle
-                                endcase
-                    7'b11100??: if (Funct3D == 3'b001 & Rs2D == 5'b00000)          
-                                               ControlsD = `FCTRLW'b0_1_10_xx_000_0_0_0; // fclass
-                                else if (Funct3D == 3'b000 & Rs2D == 5'b00000) 
-                                               ControlsD = `FCTRLW'b0_1_11_xx_000_0_0_0; // fmv.x.w / fmv.x.d to int register
-                    7'b111100?: if (Funct3D == 3'b000 & Rs2D == 5'b00000) 
-                                               ControlsD = `FCTRLW'b1_0_00_xx_011_0_0_0; // fmv.w.x / fmv.d.x   to fp reg
-                    7'b0100000: if (Rs2D[4:2] == 3'b000 & SupportedFmt2 & Rs2D[1:0] != 2'b00)
-                                               ControlsD = `FCTRLW'b1_0_01_00_000_0_0_0; // fcvt.s.(d/q/h)
-                    7'b0100001: if (Rs2D[4:2] == 3'b000  & SupportedFmt2 & Rs2D[1:0] != 2'b01)
-                                               ControlsD = `FCTRLW'b1_0_01_00_001_0_0_0; // fcvt.d.(s/h/q)
-                    7'b0100010: if (Rs2D[4:2] == 3'b000 & SupportedFmt2 & Rs2D[1:0] != 2'b10)
-                                               ControlsD = `FCTRLW'b1_0_01_00_010_0_0_0; // fcvt.h.(s/d/q)
-                    7'b0100011: if (Rs2D[4:2] == 3'b000  & SupportedFmt2 & Rs2D[1:0] != 2'b11)
-                                               ControlsD = `FCTRLW'b1_0_01_00_011_0_0_0; // fcvt.q.(s/h/d)
-                   7'b1101000: case(Rs2D)
-                                  5'b00000:    ControlsD = `FCTRLW'b1_0_01_00_101_0_0_0; // fcvt.s.w   w->s
-                                  5'b00001:    ControlsD = `FCTRLW'b1_0_01_00_100_0_0_0; // fcvt.s.wu wu->s
-                                  5'b00010:    ControlsD = `FCTRLW'b1_0_01_00_111_0_0_0; // fcvt.s.l   l->s
-                                  5'b00011:    ControlsD = `FCTRLW'b1_0_01_00_110_0_0_0; // fcvt.s.lu lu->s
-                                endcase
-                    7'b1100000: case(Rs2D)
-                                  5'b00000:    ControlsD = `FCTRLW'b0_1_01_00_001_0_0_1; // fcvt.w.s   s->w
-                                  5'b00001:    ControlsD = `FCTRLW'b0_1_01_00_000_0_0_1; // fcvt.wu.s  s->wu
-                                  5'b00010:    ControlsD = `FCTRLW'b0_1_01_00_011_0_0_1; // fcvt.l.s   s->l
-                                  5'b00011:    ControlsD = `FCTRLW'b0_1_01_00_010_0_0_1; // fcvt.lu.s  s->lu
-                                endcase
-                    7'b1101001: case(Rs2D)
-                                  5'b00000:    ControlsD = `FCTRLW'b1_0_01_00_101_0_0_0; // fcvt.d.w   w->d
-                                  5'b00001:    ControlsD = `FCTRLW'b1_0_01_00_100_0_0_0; // fcvt.d.wu wu->d
-                                  5'b00010:    ControlsD = `FCTRLW'b1_0_01_00_111_0_0_0; // fcvt.d.l   l->d
-                                  5'b00011:    ControlsD = `FCTRLW'b1_0_01_00_110_0_0_0; // fcvt.d.lu lu->d
-                                endcase
-                    7'b1100001: case(Rs2D)
-                                  5'b00000:    ControlsD = `FCTRLW'b0_1_01_00_001_0_0_1; // fcvt.w.d   d->w
-                                  5'b00001:    ControlsD = `FCTRLW'b0_1_01_00_000_0_0_1; // fcvt.wu.d  d->wu
-                                  5'b00010:    ControlsD = `FCTRLW'b0_1_01_00_011_0_0_1; // fcvt.l.d   d->l
-                                  5'b00011:    ControlsD = `FCTRLW'b0_1_01_00_010_0_0_1; // fcvt.lu.d  d->lu
-                                endcase
-                    7'b1101010: case(Rs2D)
-                                  5'b00000:    ControlsD = `FCTRLW'b1_0_01_00_101_0_0_0; // fcvt.h.w   w->h
-                                  5'b00001:    ControlsD = `FCTRLW'b1_0_01_00_100_0_0_0; // fcvt.h.wu wu->h
-                                  5'b00010:    ControlsD = `FCTRLW'b1_0_01_00_111_0_0_0; // fcvt.h.l   l->h
-                                  5'b00011:    ControlsD = `FCTRLW'b1_0_01_00_110_0_0_0; // fcvt.h.lu lu->h
-                                endcase
-                    7'b1100010: case(Rs2D)
-                                  5'b00000:    ControlsD = `FCTRLW'b0_1_01_00_001_0_0_1; // fcvt.w.h   h->w
-                                  5'b00001:    ControlsD = `FCTRLW'b0_1_01_00_000_0_0_1; // fcvt.wu.h  h->wu
-                                  5'b00010:    ControlsD = `FCTRLW'b0_1_01_00_011_0_0_1; // fcvt.l.h   h->l
-                                  5'b00011:    ControlsD = `FCTRLW'b0_1_01_00_010_0_0_1; // fcvt.lu.h  h->lu
-                                endcase
-                    7'b1101011: case(Rs2D)
-                                  5'b00000:    ControlsD = `FCTRLW'b1_0_01_00_101_0_0_0; // fcvt.q.w   w->q
-                                  5'b00001:    ControlsD = `FCTRLW'b1_0_01_00_100_0_0_0; // fcvt.q.wu wu->q
-                                  5'b00010:    ControlsD = `FCTRLW'b1_0_01_00_111_0_0_0; // fcvt.q.l   l->q
-                                  5'b00011:    ControlsD = `FCTRLW'b1_0_01_00_110_0_0_0; // fcvt.q.lu lu->q
-                                endcase
-                    7'b1100011: case(Rs2D)
-                                  5'b00000:    ControlsD = `FCTRLW'b0_1_01_00_001_0_0_1; // fcvt.w.q   q->w
-                                  5'b00001:    ControlsD = `FCTRLW'b0_1_01_00_000_0_0_1; // fcvt.wu.q  q->wu
-                                  5'b00010:    ControlsD = `FCTRLW'b0_1_01_00_011_0_0_1; // fcvt.l.q   q->l
-                                  5'b00011:    ControlsD = `FCTRLW'b0_1_01_00_010_0_0_1; // fcvt.lu.q  q->lu
-                                endcase                            
-                  endcase
+        7'b0000111: case(Funct3D)
+                      3'b010:                      ControlsD = `FCTRLW'b1_0_10_xx_0xx_0_0_0; // flw
+                      3'b011:  if (`D_SUPPORTED)   ControlsD = `FCTRLW'b1_0_10_xx_0xx_0_0_0; // fld
+                      3'b100:  if (`Q_SUPPORTED)   ControlsD = `FCTRLW'b1_0_10_xx_0xx_0_0_0; // flq
+                      3'b001:  if (`ZFH_SUPPORTED) ControlsD = `FCTRLW'b1_0_10_xx_0xx_0_0_0; // flh
+                    endcase
+        7'b0100111: case(Funct3D)
+                      3'b010:                      ControlsD = `FCTRLW'b0_0_10_xx_0xx_0_0_0; // fsw
+                      3'b011:  if (`D_SUPPORTED)   ControlsD = `FCTRLW'b0_0_10_xx_0xx_0_0_0; // fsd
+                      3'b100:  if (`Q_SUPPORTED)   ControlsD = `FCTRLW'b0_0_10_xx_0xx_0_0_0; // fsq
+                      3'b001:  if (`ZFH_SUPPORTED) ControlsD = `FCTRLW'b0_0_10_xx_0xx_0_0_0; // fsh
+                    endcase
+        7'b1000011:   ControlsD = `FCTRLW'b1_0_01_10_000_0_0_0; // fmadd
+        7'b1000111:   ControlsD = `FCTRLW'b1_0_01_10_001_0_0_0; // fmsub
+        7'b1001011:   ControlsD = `FCTRLW'b1_0_01_10_010_0_0_0; // fnmsub
+        7'b1001111:   ControlsD = `FCTRLW'b1_0_01_10_011_0_0_0; // fnmadd
+        7'b1010011: casez(Funct7D)
+                      7'b00000??: ControlsD = `FCTRLW'b1_0_01_10_110_0_0_0; // fadd
+                      7'b00001??: ControlsD = `FCTRLW'b1_0_01_10_111_0_0_0; // fsub
+                      7'b00010??: ControlsD = `FCTRLW'b1_0_01_10_100_0_0_0; // fmul
+                      7'b00011??: ControlsD = `FCTRLW'b1_0_01_01_xx0_1_0_0; // fdiv
+                      7'b01011??: if (Rs2D == 5'b0000) ControlsD = `FCTRLW'b1_0_01_01_xx1_1_0_0; // fsqrt
+                      7'b00100??: case(Funct3D)
+                                    3'b000:  ControlsD = `FCTRLW'b1_0_00_xx_000_0_0_0; // fsgnj
+                                    3'b001:  ControlsD = `FCTRLW'b1_0_00_xx_001_0_0_0; // fsgnjn
+                                    3'b010:  ControlsD = `FCTRLW'b1_0_00_xx_010_0_0_0; // fsgnjx
+                                  endcase
+                      7'b00101??: case(Funct3D)
+                                    3'b000:  ControlsD = `FCTRLW'b1_0_00_xx_110_0_0_0; // fmin
+                                    3'b001:  ControlsD = `FCTRLW'b1_0_00_xx_101_0_0_0; // fmax
+                                  endcase
+                      7'b10100??: case(Funct3D)
+                                    3'b010:  ControlsD = `FCTRLW'b0_1_00_xx_010_0_0_0; // feq
+                                    3'b001:  ControlsD = `FCTRLW'b0_1_00_xx_001_0_0_0; // flt
+                                    3'b000:  ControlsD = `FCTRLW'b0_1_00_xx_011_0_0_0; // fle
+                                  endcase
+                      7'b11100??: if (Funct3D == 3'b001 & Rs2D == 5'b00000)          
+                                                ControlsD = `FCTRLW'b0_1_10_xx_000_0_0_0; // fclass
+                                  else if (Funct3D == 3'b000 & Rs2D == 5'b00000) 
+                                                ControlsD = `FCTRLW'b0_1_11_xx_000_0_0_0; // fmv.x.w / fmv.x.d to int register
+                      7'b111100?: if (Funct3D == 3'b000 & Rs2D == 5'b00000) 
+                                                ControlsD = `FCTRLW'b1_0_00_xx_011_0_0_0; // fmv.w.x / fmv.d.x   to fp reg
+                      7'b0100000: if (Rs2D[4:2] == 3'b000 & SupportedFmt2 & Rs2D[1:0] != 2'b00)
+                                                ControlsD = `FCTRLW'b1_0_01_00_000_0_0_0; // fcvt.s.(d/q/h)
+                      7'b0100001: if (Rs2D[4:2] == 3'b000  & SupportedFmt2 & Rs2D[1:0] != 2'b01)
+                                                ControlsD = `FCTRLW'b1_0_01_00_001_0_0_0; // fcvt.d.(s/h/q)
+                      // coverage off
+                      // Not covered in testing because rv64gc does not support half or quad precision
+                      7'b0100010: if (Rs2D[4:2] == 3'b000 & SupportedFmt2 & Rs2D[1:0] != 2'b10)
+                                                ControlsD = `FCTRLW'b1_0_01_00_010_0_0_0; // fcvt.h.(s/d/q)
+                      7'b0100011: if (Rs2D[4:2] == 3'b000  & SupportedFmt2 & Rs2D[1:0] != 2'b11)
+                                                ControlsD = `FCTRLW'b1_0_01_00_011_0_0_0; // fcvt.q.(s/h/d)
+                      // coverage on
+                      7'b1101000: case(Rs2D)
+                                    5'b00000:    ControlsD = `FCTRLW'b1_0_01_00_101_0_0_0; // fcvt.s.w   w->s
+                                    5'b00001:    ControlsD = `FCTRLW'b1_0_01_00_100_0_0_0; // fcvt.s.wu wu->s
+                                    5'b00010:    ControlsD = `FCTRLW'b1_0_01_00_111_0_0_0; // fcvt.s.l   l->s
+                                    5'b00011:    ControlsD = `FCTRLW'b1_0_01_00_110_0_0_0; // fcvt.s.lu lu->s
+                                  endcase
+                      7'b1100000: case(Rs2D)
+                                    5'b00000:    ControlsD = `FCTRLW'b0_1_01_00_001_0_0_1; // fcvt.w.s   s->w
+                                    5'b00001:    ControlsD = `FCTRLW'b0_1_01_00_000_0_0_1; // fcvt.wu.s  s->wu
+                                    5'b00010:    ControlsD = `FCTRLW'b0_1_01_00_011_0_0_1; // fcvt.l.s   s->l
+                                    5'b00011:    ControlsD = `FCTRLW'b0_1_01_00_010_0_0_1; // fcvt.lu.s  s->lu
+                                  endcase
+                      7'b1101001: case(Rs2D)
+                                    5'b00000:    ControlsD = `FCTRLW'b1_0_01_00_101_0_0_0; // fcvt.d.w   w->d
+                                    5'b00001:    ControlsD = `FCTRLW'b1_0_01_00_100_0_0_0; // fcvt.d.wu wu->d
+                                    5'b00010:    ControlsD = `FCTRLW'b1_0_01_00_111_0_0_0; // fcvt.d.l   l->d
+                                    5'b00011:    ControlsD = `FCTRLW'b1_0_01_00_110_0_0_0; // fcvt.d.lu lu->d
+                                  endcase
+                      7'b1100001: case(Rs2D)
+                                    5'b00000:    ControlsD = `FCTRLW'b0_1_01_00_001_0_0_1; // fcvt.w.d   d->w
+                                    5'b00001:    ControlsD = `FCTRLW'b0_1_01_00_000_0_0_1; // fcvt.wu.d  d->wu
+                                    5'b00010:    ControlsD = `FCTRLW'b0_1_01_00_011_0_0_1; // fcvt.l.d   d->l
+                                    5'b00011:    ControlsD = `FCTRLW'b0_1_01_00_010_0_0_1; // fcvt.lu.d  d->lu
+                                  endcase
+                      // coverage off
+                      // Not covered in testing because rv64gc does not support half or quad precision
+                      7'b1101010: case(Rs2D)
+                                    5'b00000:    ControlsD = `FCTRLW'b1_0_01_00_101_0_0_0; // fcvt.h.w   w->h
+                                    5'b00001:    ControlsD = `FCTRLW'b1_0_01_00_100_0_0_0; // fcvt.h.wu wu->h
+                                    5'b00010:    ControlsD = `FCTRLW'b1_0_01_00_111_0_0_0; // fcvt.h.l   l->h
+                                    5'b00011:    ControlsD = `FCTRLW'b1_0_01_00_110_0_0_0; // fcvt.h.lu lu->h
+                                  endcase
+                      7'b1100010: case(Rs2D)
+                                    5'b00000:    ControlsD = `FCTRLW'b0_1_01_00_001_0_0_1; // fcvt.w.h   h->w
+                                    5'b00001:    ControlsD = `FCTRLW'b0_1_01_00_000_0_0_1; // fcvt.wu.h  h->wu
+                                    5'b00010:    ControlsD = `FCTRLW'b0_1_01_00_011_0_0_1; // fcvt.l.h   h->l
+                                    5'b00011:    ControlsD = `FCTRLW'b0_1_01_00_010_0_0_1; // fcvt.lu.h  h->lu
+                                  endcase
+                      7'b1101011: case(Rs2D)
+                                    5'b00000:    ControlsD = `FCTRLW'b1_0_01_00_101_0_0_0; // fcvt.q.w   w->q
+                                    5'b00001:    ControlsD = `FCTRLW'b1_0_01_00_100_0_0_0; // fcvt.q.wu wu->q
+                                    5'b00010:    ControlsD = `FCTRLW'b1_0_01_00_111_0_0_0; // fcvt.q.l   l->q
+                                    5'b00011:    ControlsD = `FCTRLW'b1_0_01_00_110_0_0_0; // fcvt.q.lu lu->q
+                                  endcase
+                      7'b1100011: case(Rs2D)
+                                    5'b00000:    ControlsD = `FCTRLW'b0_1_01_00_001_0_0_1; // fcvt.w.q   q->w
+                                    5'b00001:    ControlsD = `FCTRLW'b0_1_01_00_000_0_0_1; // fcvt.wu.q  q->wu
+                                    5'b00010:    ControlsD = `FCTRLW'b0_1_01_00_011_0_0_1; // fcvt.l.q   q->l
+                                    5'b00011:    ControlsD = `FCTRLW'b0_1_01_00_010_0_0_1; // fcvt.lu.q  q->lu
+                                  endcase
+                      // coverage on
+                    endcase
       endcase
     end
     /* verilator lint_on CASEINCOMPLETE */
diff --git a/tests/coverage/fpu.S b/tests/coverage/fpu.S
index 17fed79b..a349ac60 100644
--- a/tests/coverage/fpu.S
+++ b/tests/coverage/fpu.S
@@ -57,7 +57,6 @@ main:
     fcvt.l.q a0, ft3
     fcvt.lu.q a0, ft3
 
-<<<<<<< HEAD
 
     // Tests verfying that half and quad floating point convertion instructions are not supported by rv64gc
     # fcvt.h.d ft3, ft0 // Somehow this instruction is taking the route on line 124
@@ -75,8 +74,6 @@ main:
     .word 0xd2400053    // Line 168 All False Test case - illegal instruction?
     .word 0xc2400053    // Line 174 All False Test case - illegal instruction?
 
-=======
->>>>>>> d4b7da34dee55ec8394ab391ecd6514c887a9790
     # Test illegal instructions are detected
     .word 0x00000007 // illegal floating-point load (bad Funct3)
     .word 0x00000027 // illegal floating-point store (bad Funct3)
diff --git a/tests/coverage/ifu.S b/tests/coverage/ifu.S
index 68db3d08..9cde14ce 100644
--- a/tests/coverage/ifu.S
+++ b/tests/coverage/ifu.S
@@ -36,6 +36,7 @@ main:
                         // binary version 0000 0000 0000 0000 0010 0000 0000 0000
     mv s0, sp
     c.fld fs0, 0(s0)
+
     c.fsd fs0, 0(s0)
 
     // c.fldsp fs0, 0
@@ -44,14 +45,10 @@ main:
     // c.fsdsp fs0, 0
     .hword 0xA002
 
-    # set XLEN to 64
-    li t0, 0x200000000
-    csrs mstatus, t0
-
     //# Illegal compressed instruction with op = 01, instr[15:10] = 100111, and 0's everywhere else
     //.hword 0x9C01
 
-    # Illegal compressed instruction 
+    # Line Illegal compressed instruction 
     .hword 0x9C41
 
     j done