/////////////////////////////////////////// // intdivrestoring.sv // // Written: David_Harris@hmc.edu 12 September 2021 // Modified: // // Purpose: Restoring integer division using a shift register and subtractor // // Documentation: RISC-V System on Chip Design // // A component of the CORE-V-WALLY configurable RISC-V project. // https://github.com/openhwgroup/cvw // // Copyright (C) 2021-23 Harvey Mudd College & Oklahoma State University // // SPDX-License-Identifier: Apache-2.0 WITH SHL-2.1 // // Licensed under the Solderpad Hardware License v 2.1 (the “License”); you may not use this file // except in compliance with the License, or, at your option, the Apache License version 2.0. You // may obtain a copy of the License at // // https://solderpad.org/licenses/SHL-2.1/ // // Unless required by applicable law or agreed to in writing, any work distributed under the // License is distributed on an “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, // either express or implied. See the License for the specific language governing permissions // and limitations under the License. //////////////////////////////////////////////////////////////////////////////////////////////// module div import cvw::*; #(parameter cvw_t P) ( input logic clk, input logic reset, input logic StallM, input logic FlushE, input logic IntDivE, // integer division/remainder instruction of any type input logic DivSignedE, // signed division input logic W64E, // W-type instructions (divw, divuw, remw, remuw) input logic [P.XLEN-1:0] ForwardedSrcAE, ForwardedSrcBE, // Forwarding mux outputs for Source A and B output logic DivBusyE, // Divide is busy - stall pipeline output logic [P.XLEN-1:0] QuotM, RemM // Quotient and remainder outputs ); localparam STEPBITS = $clog2(P.XLEN/P.IDIV_BITSPERCYCLE); // Number of steps typedef enum logic [1:0] {IDLE, BUSY, DONE} statetype; // division FSM state statetype state; logic [P.XLEN-1:0] W[P.IDIV_BITSPERCYCLE:0]; // Residual for each of k steps logic [P.XLEN-1:0] XQ[P.IDIV_BITSPERCYCLE:0]; // dividend/quotient for each of k steps logic [P.XLEN-1:0] WNext, XQNext; // initialized W and XQ going into registers logic [P.XLEN-1:0] DinE, XinE; // divisor & dividend, possibly truncated to 32 bits logic [P.XLEN-1:0] DnE; // DnE = ~DinE logic [P.XLEN-1:0] DAbsBE; // absolute value of D logic [P.XLEN-1:0] DAbsB; // registered absolute value of D, constant during division logic [P.XLEN-1:0] XnE; // DXnE = ~XinE logic [P.XLEN-1:0] XInitE; // |X|, or original X for divide by 0 logic [P.XLEN-1:0] WnM, XQnM; // negated residual W and quotient XQ for postprocessing sign correction logic [STEPBITS:0] step; // division step logic Div0E, Div0M; // divide by 0 logic DivStartE; // start integer division logic SignXE, SignDE; // sign of dividend and divisor logic NegQE, NegWM, NegQM; // negate quotient or residual during postprocessing ////////////////////////////// // Execute Stage: prepare for division calculation with control logic, W logic and absolute values, initialize W and XQ ////////////////////////////// // Divider control signals assign DivStartE = IntDivE & (state == IDLE) & ~StallM; assign DivBusyE = (state == BUSY) | DivStartE; // Handle sign extension for W-type instructions if (P.XLEN == 64) begin:rv64 // RV64 has W-type instructions mux2 #(P.XLEN) xinmux(ForwardedSrcAE, {ForwardedSrcAE[31:0], 32'b0}, W64E, XinE); mux2 #(P.XLEN) dinmux(ForwardedSrcBE, {{32{ForwardedSrcBE[31]&DivSignedE}}, ForwardedSrcBE[31:0]}, W64E, DinE); end else begin // RV32 has no W-type instructions assign XinE = ForwardedSrcAE; assign DinE = ForwardedSrcBE; end // Extract sign bits and check fo division by zero assign SignDE = DivSignedE & DinE[P.XLEN-1]; assign SignXE = DivSignedE & XinE[P.XLEN-1]; assign NegQE = SignDE ^ SignXE; assign Div0E = (DinE == 0); // Take absolute value for signed operations, and negate D to handle subtraction in divider stages neg #(P.XLEN) negd(DinE, DnE); mux2 #(P.XLEN) dabsmux(DnE, DinE, SignDE, DAbsBE); // take absolute value for signed operations, and negate for subtraction setp neg #(P.XLEN) negx(XinE, XnE); mux3 #(P.XLEN) xabsmux(XinE, XnE, ForwardedSrcAE, {Div0E, SignXE}, XInitE); // take absolute value for signed operations, or keep original value for divide by 0 ////////////////////////////// // Division Iterations (effectively stalled execute stage, no suffix) ////////////////////////////// // initialization multiplexers on first cycle of operation mux2 #(P.XLEN) wmux(W[P.IDIV_BITSPERCYCLE], {P.XLEN{1'b0}}, DivStartE, WNext); mux2 #(P.XLEN) xmux(XQ[P.IDIV_BITSPERCYCLE], XInitE, DivStartE, XQNext); // registers before division steps flopen #(P.XLEN) wreg(clk, DivBusyE, WNext, W[0]); flopen #(P.XLEN) xreg(clk, DivBusyE, XQNext, XQ[0]); flopen #(P.XLEN) dabsreg(clk, DivStartE, DAbsBE, DAbsB); // one copy of divstep for each bit produced per cycle genvar i; for (i=0; i