mirror of
https://github.com/openhwgroup/cvw
synced 2025-02-03 10:15:19 +00:00
Merge branch 'main' of https://github.com/openhwgroup/cvw into dev
This commit is contained in:
commit
3986e84179
2
.gitignore
vendored
2
.gitignore
vendored
@ -76,7 +76,7 @@ synthDC/runs/
|
|||||||
synthDC/newRuns
|
synthDC/newRuns
|
||||||
synthDC/ppa/PPAruns
|
synthDC/ppa/PPAruns
|
||||||
synthDC/ppa/plots
|
synthDC/ppa/plots
|
||||||
synthDC/plots/
|
synthDC/wallyplots/
|
||||||
synthDC/runArchive
|
synthDC/runArchive
|
||||||
synthDC/hdl
|
synthDC/hdl
|
||||||
/pipelined/regression/power.saif
|
/pipelined/regression/power.saif
|
||||||
|
@ -1,86 +0,0 @@
|
|||||||
///////////////////////////////////////////
|
|
||||||
// ram2p1r1wb
|
|
||||||
//
|
|
||||||
// Written: Ross Thomposn
|
|
||||||
// Email: ross1728@gmail.com
|
|
||||||
// Created: February 14, 2021
|
|
||||||
// Modified:
|
|
||||||
//
|
|
||||||
// Purpose: Behavioral model of two port SRAM. While this is synthesizable it will produce a flip flop based memory which
|
|
||||||
// behaves with the timing of an SRAM typical of GF 14nm, 32nm, and 45nm.
|
|
||||||
//
|
|
||||||
//
|
|
||||||
// to preload this memory we can use the following command
|
|
||||||
// in modelsim's do file.
|
|
||||||
// mem load -infile <relative path to the text file > -format <bin|hex> <hierarchy to the memory.>
|
|
||||||
// example
|
|
||||||
// mem load -infile twoBitPredictor.txt -format bin testbench/dut/core/ifu/bpred/DirPredictor/memory/memory
|
|
||||||
//
|
|
||||||
// A component of the CORE-V-WALLY configurable RISC-V project.
|
|
||||||
//
|
|
||||||
// Copyright (C) 2021-23 Harvey Mudd College & Oklahoma State University
|
|
||||||
//
|
|
||||||
// SPDX-License-Identifier: Apache-2.0 WITH SHL-2.1
|
|
||||||
//
|
|
||||||
// Licensed under the Solderpad Hardware License v 2.1 (the “License”); you may not use this file
|
|
||||||
// except in compliance with the License, or, at your option, the Apache License version 2.0. You
|
|
||||||
// may obtain a copy of the License at
|
|
||||||
//
|
|
||||||
// https://solderpad.org/licenses/SHL-2.1/
|
|
||||||
//
|
|
||||||
// Unless required by applicable law or agreed to in writing, any work distributed under the
|
|
||||||
// License is distributed on an “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
|
|
||||||
// either express or implied. See the License for the specific language governing permissions
|
|
||||||
// and limitations under the License.
|
|
||||||
////////////////////////////////////////////////////////////////////////////////////////////////
|
|
||||||
|
|
||||||
`include "wally-config.vh"
|
|
||||||
|
|
||||||
// Behavioral two-port memory with one read port (port 1) and one write port (port 2).
// DEPTH is the number of address bits (the array holds 2**DEPTH entries);
// WIDTH is the number of bits per entry.
module ram2p1r1wb #(parameter DEPTH = 10, WIDTH = 2) (
|
|
||||||
input logic clk,
|
|
||||||
// reset is only wired to the input registers below; the mem array itself is never cleared here.
input logic reset,
|
|
||||||
|
|
||||||
// port 1 is read only
|
|
||||||
input logic [DEPTH-1:0] ra1,
|
|
||||||
output logic [WIDTH-1:0] rd1,
|
|
||||||
input logic ren1,
|
|
||||||
|
|
||||||
// port 2 is write only
|
|
||||||
input logic [DEPTH-1:0] wa2,
|
|
||||||
input logic [WIDTH-1:0] wd2,
|
|
||||||
input logic wen2,
|
|
||||||
// bwe2 is a per-bit write mask (one enable bit per data bit). Unlike wa2/wd2/wen2 it is
// used unregistered, so it is combined with the registered wen2q in the same cycle as the write.
input logic [WIDTH-1:0] bwe2
|
|
||||||
);
|
|
||||||
|
|
||||||
|
|
||||||
// Registered copies of the port inputs.
logic [DEPTH-1:0] ra1q, wa2q;
|
|
||||||
logic wen2q;
|
|
||||||
logic [WIDTH-1:0] wd2q;
|
|
||||||
|
|
||||||
// Storage array: 2**DEPTH entries of WIDTH bits.
logic [WIDTH-1:0] mem[2**DEPTH-1:0];
|
|
||||||
// Effective per-bit write mask after gating with the registered write enable.
logic [WIDTH-1:0] bwe;
|
|
||||||
|
|
||||||
|
|
||||||
// SRAM address buses are always registered first
|
|
||||||
// *** likely issues (DH and RT 12/20/22):
|
|
||||||
// wrong enable for write port registers
|
|
||||||
// prefer to code read like ram1p1rw
|
|
||||||
// prefer not to have two-cycle write latency
|
|
||||||
// will require branch predictor changes
|
|
||||||
|
|
||||||
// ra1Reg, wa2Reg and wd2Reg are all instantiated with ren1 as their third argument, so the
// write address/data registers share the read port's signal; wen2Reg is a flopr and takes no
// such argument.
// NOTE(review): flopenr/flopr are defined elsewhere -- presumably (clk, reset, en, d, q) and
// (clk, reset, d, q); confirm.
flopenr #(DEPTH) ra1Reg(clk, reset, ren1, ra1, ra1q);
|
|
||||||
flopenr #(DEPTH) wa2Reg(clk, reset, ren1, wa2, wa2q);
|
|
||||||
flopr #(1) wen2Reg(clk, reset, wen2, wen2q);
|
|
||||||
flopenr #(WIDTH) wd2Reg(clk, reset, ren1, wd2, wd2q);
|
|
||||||
|
|
||||||
// read port: continuous (unclocked) read of mem at the registered address ra1q
|
|
||||||
assign rd1 = mem[ra1q];
|
|
||||||
|
|
||||||
// write port: replicate wen2q across all WIDTH bits and AND with the per-bit mask
|
|
||||||
assign bwe = {WIDTH{wen2q}} & bwe2;
|
|
||||||
// No enable on this process: every clock edge rewrites mem[wa2q], taking wd2q where bwe is 1
// and the currently stored bit where bwe is 0. With wen2q low the mask is all zeros, so the
// entry is written back unchanged.
always_ff @(posedge clk)
|
|
||||||
mem[wa2q] <= wd2q & bwe | mem[wa2q] & ~bwe;
|
|
||||||
|
|
||||||
endmodule
|
|
||||||
|
|
||||||
|
|
@ -1,8 +1,8 @@
|
|||||||
///////////////////////////////////////////
|
///////////////////////////////////////////
|
||||||
// 1 port sram.
|
// 2 port sram.
|
||||||
//
|
//
|
||||||
// Written: ross1728@gmail.com May 3, 2021
|
// Written: ross1728@gmail.com May 3, 2021
|
||||||
// Basic sram with 1 read write port.
|
// Two port SRAM 1 read port and 1 write port.
|
||||||
// When clk rises Addr and LineWriteData are sampled.
|
// When clk rises Addr and LineWriteData are sampled.
|
||||||
// Following the clk edge read data is output from the sampled Addr.
|
// Following the clk edge read data is output from the sampled Addr.
|
||||||
// Write
|
// Write
|
||||||
@ -31,7 +31,7 @@
|
|||||||
|
|
||||||
`include "wally-config.vh"
|
`include "wally-config.vh"
|
||||||
|
|
||||||
module ram2p1r1wbefix #(parameter DEPTH=128, WIDTH=256) (
|
module ram2p1r1wbe #(parameter DEPTH=128, WIDTH=256) (
|
||||||
input logic clk,
|
input logic clk,
|
||||||
input logic ce1, ce2,
|
input logic ce1, ce2,
|
||||||
input logic [$clog2(DEPTH)-1:0] ra1,
|
input logic [$clog2(DEPTH)-1:0] ra1,
|
||||||
@ -59,13 +59,13 @@ module ram2p1r1wbefix #(parameter DEPTH=128, WIDTH=256) (
|
|||||||
|
|
||||||
// Write divided into part for bytes and part for extra msbs
|
// Write divided into part for bytes and part for extra msbs
|
||||||
if(WIDTH >= 8)
|
if(WIDTH >= 8)
|
||||||
always_ff @(posedge clk)
|
always @(posedge clk)
|
||||||
if (ce2 & we2)
|
if (ce2 & we2)
|
||||||
for(i = 0; i < WIDTH/8; i++)
|
for(i = 0; i < WIDTH/8; i++)
|
||||||
if(bwe2[i]) mem[wa2][i*8 +: 8] <= #1 wd2[i*8 +: 8];
|
if(bwe2[i]) mem[wa2][i*8 +: 8] <= #1 wd2[i*8 +: 8];
|
||||||
|
|
||||||
if (WIDTH%8 != 0) // handle msbs if width not a multiple of 8
|
if (WIDTH%8 != 0) // handle msbs if width not a multiple of 8
|
||||||
always_ff @(posedge clk)
|
always @(posedge clk)
|
||||||
if (ce2 & we2 & bwe2[WIDTH/8])
|
if (ce2 & we2 & bwe2[WIDTH/8])
|
||||||
mem[wa2][WIDTH-1:WIDTH-WIDTH%8] <= #1 wd2[WIDTH-1:WIDTH-WIDTH%8];
|
mem[wa2][WIDTH-1:WIDTH-WIDTH%8] <= #1 wd2[WIDTH-1:WIDTH-WIDTH%8];
|
||||||
|
|
@ -135,20 +135,19 @@ module bpred (
|
|||||||
// Part 2 Branch target address prediction
|
// Part 2 Branch target address prediction
|
||||||
// *** For now the BTB will house the direct and indirect targets
|
// *** For now the BTB will house the direct and indirect targets
|
||||||
|
|
||||||
// *** getting too many false positives from the BTB; we need a partial tag to reduce this.
|
btb TargetPredictor(.clk(clk),
|
||||||
BTBPredictor TargetPredictor(.clk(clk),
|
|
||||||
.reset(reset),
|
.reset(reset),
|
||||||
.*, // Stalls and flushes
|
.*, // Stalls and flushes
|
||||||
.LookUpPC(PCNextF),
|
.PCNextF,
|
||||||
.TargetPC(BTBPredPCF),
|
.BTBPredPCF,
|
||||||
.InstrClass(PredInstrClassF),
|
.InstrClass(PredInstrClassF),
|
||||||
.Valid(BTBValidF),
|
.Valid(BTBValidF),
|
||||||
// update
|
// update
|
||||||
.UpdateEN((|InstrClassE | (PredictionInstrClassWrongE)) & ~StallE),
|
.UpdateEN((|InstrClassE | (PredictionInstrClassWrongE)) & ~StallE),
|
||||||
.UpdatePC(PCE),
|
.PCE,
|
||||||
.UpdateTarget(IEUAdrE),
|
.IEUAdrE,
|
||||||
.UpdateInvalid(PredictionInstrClassWrongE),
|
.UpdateInvalid(PredictionInstrClassWrongE),
|
||||||
.UpdateInstrClass(InstrClassE));
|
.InstrClassE);
|
||||||
|
|
||||||
// Part 3 RAS
|
// Part 3 RAS
|
||||||
// *** need to add the logic to restore RAS on flushes. We will use incr for this.
|
// *** need to add the logic to restore RAS on flushes. We will use incr for this.
|
@ -1,13 +1,14 @@
|
|||||||
///////////////////////////////////////////
|
///////////////////////////////////////////
|
||||||
// ram2p1r1wb
|
// btb.sv
|
||||||
//
|
//
|
||||||
// Written: Ross Thomposn
|
// Written: Ross Thomposn ross1728@gmail.com
|
||||||
// Email: ross1728@gmail.com
|
|
||||||
// Created: February 15, 2021
|
// Created: February 15, 2021
|
||||||
// Modified:
|
// Modified: 24 January 2023
|
||||||
//
|
//
|
||||||
// Purpose: BTB model. Outputs type of instruction (currently 1 hot encoded. Probably want
|
// Purpose: Branch Target Buffer (BTB). The BTB predicts the target address of all control flow instructions.
|
||||||
// to encode to reduce storage), valid, target PC.
|
// It also guesses the type of instruction; jalr(r), return, jump (jr), or branch.
|
||||||
|
//
|
||||||
|
// Documentation: RISC-V System on Chip Design Chapter 10 (Figure ***)
|
||||||
//
|
//
|
||||||
// A component of the CORE-V-WALLY configurable RISC-V project.
|
// A component of the CORE-V-WALLY configurable RISC-V project.
|
||||||
//
|
//
|
||||||
@ -29,43 +30,45 @@
|
|||||||
|
|
||||||
`include "wally-config.vh"
|
`include "wally-config.vh"
|
||||||
|
|
||||||
module BTBPredictor
|
module btb
|
||||||
#(parameter int Depth = 10
|
#(parameter int Depth = 10
|
||||||
)
|
)
|
||||||
(input logic clk,
|
(input logic clk,
|
||||||
input logic reset,
|
input logic reset,
|
||||||
input logic StallF, StallE,
|
input logic StallF, StallE,
|
||||||
input logic [`XLEN-1:0] LookUpPC,
|
input logic [`XLEN-1:0] PCNextF,
|
||||||
output logic [`XLEN-1:0] TargetPC,
|
output logic [`XLEN-1:0] BTBPredPCF,
|
||||||
output logic [3:0] InstrClass,
|
output logic [3:0] InstrClass,
|
||||||
output logic Valid,
|
output logic Valid,
|
||||||
// update
|
// update
|
||||||
input logic UpdateEN,
|
input logic UpdateEN,
|
||||||
input logic [`XLEN-1:0] UpdatePC,
|
input logic [`XLEN-1:0] PCE,
|
||||||
input logic [`XLEN-1:0] UpdateTarget,
|
input logic [`XLEN-1:0] IEUAdrE,
|
||||||
input logic [3:0] UpdateInstrClass,
|
input logic [3:0] InstrClassE,
|
||||||
input logic UpdateInvalid
|
input logic UpdateInvalid
|
||||||
);
|
);
|
||||||
|
|
||||||
localparam TotalDepth = 2 ** Depth;
|
localparam TotalDepth = 2 ** Depth;
|
||||||
logic [TotalDepth-1:0] ValidBits;
|
logic [TotalDepth-1:0] ValidBits;
|
||||||
logic [Depth-1:0] LookUpPCIndex, UpdatePCIndex, LookUpPCIndexQ, UpdatePCIndexQ;
|
logic [Depth-1:0] PCNextFIndex, PCEIndex, PCNextFIndexQ, PCEIndexQ;
|
||||||
logic UpdateENQ;
|
logic UpdateENQ;
|
||||||
|
logic [`XLEN-1:0] ResetPC;
|
||||||
|
|
||||||
|
|
||||||
// hashing function for indexing the PC
|
// hashing function for indexing the PC
|
||||||
// We have Depth bits to index, but XLEN bits as the input.
|
// We have Depth bits to index, but XLEN bits as the input.
|
||||||
// bit 0 is always 0, bit 1 is 0 if using 4 byte instructions, but is not always 0 if
|
// bit 0 is always 0, bit 1 is 0 if using 4 byte instructions, but is not always 0 if
|
||||||
// using compressed instructions. XOR bit 1 with the MSB of index.
|
// using compressed instructions. XOR bit 1 with the MSB of index.
|
||||||
assign UpdatePCIndex = {UpdatePC[Depth+1] ^ UpdatePC[1], UpdatePC[Depth:2]};
|
assign PCEIndex = {PCE[Depth+1] ^ PCE[1], PCE[Depth:2]};
|
||||||
assign LookUpPCIndex = {LookUpPC[Depth+1] ^ LookUpPC[1], LookUpPC[Depth:2]};
|
assign ResetPC = `RESET_VECTOR;
|
||||||
|
assign PCNextFIndex = reset ? ResetPC[Depth+1:2] : {PCNextF[Depth+1] ^ PCNextF[1], PCNextF[Depth:2]};
|
||||||
|
//assign PCNextFIndex = {PCNextF[Depth+1] ^ PCNextF[1], PCNextF[Depth:2]};
|
||||||
|
|
||||||
flopenr #(Depth) UpdatePCIndexReg(.clk(clk),
|
flopenr #(Depth) PCEIndexReg(.clk(clk),
|
||||||
.reset(reset),
|
.reset(reset),
|
||||||
.en(~StallE),
|
.en(~StallE),
|
||||||
.d(UpdatePCIndex),
|
.d(PCEIndex),
|
||||||
.q(UpdatePCIndexQ));
|
.q(PCEIndexQ));
|
||||||
|
|
||||||
// The valid bit must be resetable.
|
// The valid bit must be resetable.
|
||||||
always_ff @ (posedge clk) begin
|
always_ff @ (posedge clk) begin
|
||||||
@ -73,10 +76,10 @@ module BTBPredictor
|
|||||||
ValidBits <= #1 {TotalDepth{1'b0}};
|
ValidBits <= #1 {TotalDepth{1'b0}};
|
||||||
end else
|
end else
|
||||||
if (UpdateENQ) begin
|
if (UpdateENQ) begin
|
||||||
ValidBits[UpdatePCIndexQ] <= #1 ~ UpdateInvalid;
|
ValidBits[PCEIndexQ] <= #1 ~ UpdateInvalid;
|
||||||
end
|
end
|
||||||
end
|
end
|
||||||
assign Valid = ValidBits[LookUpPCIndexQ];
|
assign Valid = ValidBits[PCNextFIndexQ];
|
||||||
|
|
||||||
|
|
||||||
flopenr #(1) UpdateENReg(.clk(clk),
|
flopenr #(1) UpdateENReg(.clk(clk),
|
||||||
@ -89,8 +92,8 @@ module BTBPredictor
|
|||||||
flopenr #(Depth) LookupPCIndexReg(.clk(clk),
|
flopenr #(Depth) LookupPCIndexReg(.clk(clk),
|
||||||
.reset(reset),
|
.reset(reset),
|
||||||
.en(~StallF),
|
.en(~StallF),
|
||||||
.d(LookUpPCIndex),
|
.d(PCNextFIndex),
|
||||||
.q(LookUpPCIndexQ));
|
.q(PCNextFIndexQ));
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
@ -99,16 +102,9 @@ module BTBPredictor
|
|||||||
// *** need to add forwarding.
|
// *** need to add forwarding.
|
||||||
|
|
||||||
// *** optimize for byte write enables
|
// *** optimize for byte write enables
|
||||||
// *** switch to ram2p1r1wbefix
|
|
||||||
ram2p1r1wb #(Depth, `XLEN+4) memory(.clk(clk),
|
|
||||||
.reset(reset),
|
|
||||||
.ra1(LookUpPCIndex),
|
|
||||||
.rd1({{InstrClass, TargetPC}}),
|
|
||||||
.ren1(~StallF),
|
|
||||||
.wa2(UpdatePCIndex),
|
|
||||||
.wd2({UpdateInstrClass, UpdateTarget}),
|
|
||||||
.wen2(UpdateEN),
|
|
||||||
.bwe2({4'hF, {`XLEN{1'b1}}})); // *** definitely not right.
|
|
||||||
|
|
||||||
|
ram2p1r1wbe #(2**Depth, `XLEN+4) memory(
|
||||||
|
.clk, .ce1(~StallF | reset), .ra1(PCNextFIndex), .rd1({InstrClass, BTBPredPCF}),
|
||||||
|
.ce2(~StallE), .wa2(PCEIndex), .wd2({InstrClassE, IEUAdrE}), .we2(UpdateEN), .bwe2('1));
|
||||||
|
|
||||||
endmodule
|
endmodule
|
@ -77,7 +77,7 @@ module foldedgshare
|
|||||||
assign FinalIndexNextF = IndexNextF[depth-1:0] ^ {{delta{1'b0}} , IndexNextF[k-1:depth]};
|
assign FinalIndexNextF = IndexNextF[depth-1:0] ^ {{delta{1'b0}} , IndexNextF[k-1:depth]};
|
||||||
assign FinalIndexW = IndexW[depth-1:0] ^ {{delta{1'b0}} , IndexW[k-1:depth]};
|
assign FinalIndexW = IndexW[depth-1:0] ^ {{delta{1'b0}} , IndexW[k-1:depth]};
|
||||||
|
|
||||||
ram2p1r1wbefix #(2**depth, 2) PHT(.clk(clk),
|
ram2p1r1wbe #(2**depth, 2) PHT(.clk(clk),
|
||||||
.ce1(~StallF | reset), .ce2(~StallW & ~FlushW),
|
.ce1(~StallF | reset), .ce2(~StallW & ~FlushW),
|
||||||
.ra1(FinalIndexNextF),
|
.ra1(FinalIndexNextF),
|
||||||
.rd1(TableDirPredictionF),
|
.rd1(TableDirPredictionF),
|
@ -51,7 +51,7 @@ module globalhistory
|
|||||||
logic PCSrcM;
|
logic PCSrcM;
|
||||||
|
|
||||||
|
|
||||||
ram2p1r1wbefix #(2**k, 2) PHT(.clk(clk),
|
ram2p1r1wbe #(2**k, 2) PHT(.clk(clk),
|
||||||
.ce1(~StallF), .ce2(~StallM & ~FlushM),
|
.ce1(~StallF), .ce2(~StallM & ~FlushM),
|
||||||
.ra1(GHR),
|
.ra1(GHR),
|
||||||
.rd1(DirPredictionF),
|
.rd1(DirPredictionF),
|
@ -54,7 +54,7 @@ module gshare
|
|||||||
assign IndexNextF = GHR & {PCNextF[k+1] ^ PCNextF[1], PCNextF[k:2]};
|
assign IndexNextF = GHR & {PCNextF[k+1] ^ PCNextF[1], PCNextF[k:2]};
|
||||||
assign IndexM = GHRM & {PCM[k+1] ^ PCM[1], PCM[k:2]};
|
assign IndexM = GHRM & {PCM[k+1] ^ PCM[1], PCM[k:2]};
|
||||||
|
|
||||||
ram2p1r1wbefix #(2**k, 2) PHT(.clk(clk),
|
ram2p1r1wbe #(2**k, 2) PHT(.clk(clk),
|
||||||
.ce1(~StallF), .ce2(~StallM & ~FlushM),
|
.ce1(~StallF), .ce2(~StallM & ~FlushM),
|
||||||
.ra1(IndexNextF),
|
.ra1(IndexNextF),
|
||||||
.rd1(DirPredictionF),
|
.rd1(DirPredictionF),
|
@ -12,22 +12,18 @@
|
|||||||
//
|
//
|
||||||
// Copyright (C) 2021 Harvey Mudd College & Oklahoma State University
|
// Copyright (C) 2021 Harvey Mudd College & Oklahoma State University
|
||||||
//
|
//
|
||||||
// MIT LICENSE
|
// SPDX-License-Identifier: Apache-2.0 WITH SHL-2.1
|
||||||
// Permission is hereby granted, free of charge, to any person obtaining a copy of this
|
|
||||||
// software and associated documentation files (the "Software"), to deal in the Software
|
|
||||||
// without restriction, including without limitation the rights to use, copy, modify, merge,
|
|
||||||
// publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons
|
|
||||||
// to whom the Software is furnished to do so, subject to the following conditions:
|
|
||||||
//
|
//
|
||||||
// The above copyright notice and this permission notice shall be included in all copies or
|
// Licensed under the Solderpad Hardware License v 2.1 (the “License”); you may not use this file
|
||||||
// substantial portions of the Software.
|
// except in compliance with the License, or, at your option, the Apache License version 2.0. You
|
||||||
|
// may obtain a copy of the License at
|
||||||
//
|
//
|
||||||
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,
|
// https://solderpad.org/licenses/SHL-2.1/
|
||||||
// INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR
|
//
|
||||||
// PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
|
// Unless required by applicable law or agreed to in writing, any work distributed under the
|
||||||
// BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
|
// License is distributed on an “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
|
||||||
// TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE
|
// either express or implied. See the License for the specific language governing permissions
|
||||||
// OR OTHER DEALINGS IN THE SOFTWARE.
|
// and limitations under the License.
|
||||||
////////////////////////////////////////////////////////////////////////////////////////////////
|
////////////////////////////////////////////////////////////////////////////////////////////////
|
||||||
|
|
||||||
`include "wally-config.vh"
|
`include "wally-config.vh"
|
||||||
@ -153,7 +149,7 @@ module optgshare
|
|||||||
assign IndexM = GHRM[k-1:0] ^ {PCM[k+1] ^ PCM[1], PCM[k:2]};
|
assign IndexM = GHRM[k-1:0] ^ {PCM[k+1] ^ PCM[1], PCM[k:2]};
|
||||||
assign IndexW = GHRW[k-1:0] ^ {PCW[k+1] ^ PCW[1], PCW[k:2]};
|
assign IndexW = GHRW[k-1:0] ^ {PCW[k+1] ^ PCW[1], PCW[k:2]};
|
||||||
|
|
||||||
ram2p1r1wbefix #(2**k, 2) PHT(.clk(clk),
|
ram2p1r1wbe #(2**k, 2) PHT(.clk(clk),
|
||||||
.ce1(~StallF | reset), .ce2(~StallW & ~FlushW),
|
.ce1(~StallF | reset), .ce2(~StallW & ~FlushW),
|
||||||
.ra1(IndexNextF),
|
.ra1(IndexNextF),
|
||||||
.rd1(TableDirPredictionF),
|
.rd1(TableDirPredictionF),
|
@ -60,7 +60,7 @@ module speculativeglobalhistory
|
|||||||
logic [1:0] ForwardNewDirPrediction, ForwardDirPredictionF;
|
logic [1:0] ForwardNewDirPrediction, ForwardDirPredictionF;
|
||||||
|
|
||||||
|
|
||||||
ram2p1r1wbefix #(2**k, 2) PHT(.clk(clk),
|
ram2p1r1wbe #(2**k, 2) PHT(.clk(clk),
|
||||||
.ce1(~StallF | reset), .ce2(~StallW & ~FlushW),
|
.ce1(~StallF | reset), .ce2(~StallW & ~FlushW),
|
||||||
.ra1(GHRNextF),
|
.ra1(GHRNextF),
|
||||||
.rd1(TableDirPredictionF),
|
.rd1(TableDirPredictionF),
|
@ -70,7 +70,7 @@ module speculativegshare
|
|||||||
assign IndexE = GHRE[k-1:0] ^ {PCE[k+1] ^ PCE[1], PCE[k:2]};
|
assign IndexE = GHRE[k-1:0] ^ {PCE[k+1] ^ PCE[1], PCE[k:2]};
|
||||||
assign IndexM = GHRM[k-1:0] ^ {PCM[k+1] ^ PCM[1], PCM[k:2]};
|
assign IndexM = GHRM[k-1:0] ^ {PCM[k+1] ^ PCM[1], PCM[k:2]};
|
||||||
|
|
||||||
ram2p1r1wbefix #(2**k, 2) PHT(.clk(clk),
|
ram2p1r1wbe #(2**k, 2) PHT(.clk(clk),
|
||||||
.ce1(~StallF | reset), .ce2(~StallW & ~FlushW),
|
.ce1(~StallF | reset), .ce2(~StallW & ~FlushW),
|
||||||
.ra1(IndexNextF),
|
.ra1(IndexNextF),
|
||||||
.rd1(TableDirPredictionF),
|
.rd1(TableDirPredictionF),
|
@ -56,7 +56,7 @@ module twoBitPredictor
|
|||||||
assign IndexM = {PCM[k+1] ^ PCM[1], PCM[k:2]};
|
assign IndexM = {PCM[k+1] ^ PCM[1], PCM[k:2]};
|
||||||
|
|
||||||
|
|
||||||
ram2p1r1wbefix #(2**k, 2) PHT(.clk(clk),
|
ram2p1r1wbe #(2**k, 2) PHT(.clk(clk),
|
||||||
.ce1(~StallF), .ce2(~StallM & ~FlushM),
|
.ce1(~StallF), .ce2(~StallM & ~FlushM),
|
||||||
.ra1(IndexNextF),
|
.ra1(IndexNextF),
|
||||||
.rd1(DirPredictionF),
|
.rd1(DirPredictionF),
|
@ -1,123 +0,0 @@
|
|||||||
///////////////////////////////////////////
|
|
||||||
// globalHistoryPredictor.sv
|
|
||||||
//
|
|
||||||
// Written: Shreya Sanghai
|
|
||||||
// Email: ssanghai@hmc.edu
|
|
||||||
// Created: March 16, 2021
|
|
||||||
// Modified:
|
|
||||||
//
|
|
||||||
// Purpose: Global History Branch predictor with parameterized global history register
|
|
||||||
//
|
|
||||||
// A component of the CORE-V-WALLY configurable RISC-V project.
|
|
||||||
//
|
|
||||||
// Copyright (C) 2021-23 Harvey Mudd College & Oklahoma State University
|
|
||||||
//
|
|
||||||
// SPDX-License-Identifier: Apache-2.0 WITH SHL-2.1
|
|
||||||
//
|
|
||||||
// Licensed under the Solderpad Hardware License v 2.1 (the “License”); you may not use this file
|
|
||||||
// except in compliance with the License, or, at your option, the Apache License version 2.0. You
|
|
||||||
// may obtain a copy of the License at
|
|
||||||
//
|
|
||||||
// https://solderpad.org/licenses/SHL-2.1/
|
|
||||||
//
|
|
||||||
// Unless required by applicable law or agreed to in writing, any work distributed under the
|
|
||||||
// License is distributed on an “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
|
|
||||||
// either express or implied. See the License for the specific language governing permissions
|
|
||||||
// and limitations under the License.
|
|
||||||
////////////////////////////////////////////////////////////////////////////////////////////////
|
|
||||||
|
|
||||||
`include "wally-config.vh"
|
|
||||||
|
|
||||||
// Global-history direction predictor.
// Keeps a (k+2)-bit global history register (GHR) and a ram2p1r1wb table (PHT) of 2-bit
// entries addressed by a k-bit slice of that history. The GHR next-state is picked by the
// GHRMuxSel select vector computed from bit 0 of the predicted and actual instruction classes.
module globalHistoryPredictor
|
|
||||||
#(parameter int k = 10
|
|
||||||
)
|
|
||||||
(input logic clk,
|
|
||||||
input logic reset,
|
|
||||||
input logic StallF, StallE,
|
|
||||||
// PCNextF is not referenced anywhere in this module's body.
input logic [`XLEN-1:0] PCNextF,
|
|
||||||
// PHT read data; bit 1 is also shifted into the GHR on the speculative-update select.
output logic [1:0] BPPredF,
|
|
||||||
// update
|
|
||||||
// Only bit 0 of each 5-bit class vector is used in this module.
// NOTE(review): bit 0 presumably marks a conditional branch; InstrClassE looks like the
// resolved class and the BPInstrClass* vectors the predicted class per stage -- confirm.
input logic [4:0] InstrClassE,
|
|
||||||
input logic [4:0] BPInstrClassE,
|
|
||||||
input logic [4:0] BPInstrClassD,
|
|
||||||
input logic [4:0] BPInstrClassF,
|
|
||||||
input logic BPPredDirWrongE,
|
|
||||||
|
|
||||||
// PCE is not referenced anywhere in this module's body.
input logic [`XLEN-1:0] PCE,
|
|
||||||
// Shifted into the GHR on the branch-update selects.
input logic PCSrcE,
|
|
||||||
// Data written into the PHT on an update.
input logic [1:0] UpdateBPPredE
|
|
||||||
|
|
||||||
);
|
|
||||||
// GHR is two bits wider than the PHT index so the update address can be taken from a
// window shifted by up to two positions (see PHTUpdateAdr below).
logic [k+1:0] GHR, GHRNext;
|
|
||||||
logic [k-1:0] PHTUpdateAdr, PHTUpdateAdr0, PHTUpdateAdr1;
|
|
||||||
logic PHTUpdateEN;
|
|
||||||
logic BPClassWrongNonCFI;
|
|
||||||
logic BPClassWrongCFI;
|
|
||||||
logic BPClassRightNonCFI;
|
|
||||||
logic BPClassRightBPWrong;
|
|
||||||
logic BPClassRightBPRight;
|
|
||||||
|
|
||||||
logic [6:0] GHRMuxSel;
|
|
||||||
logic GHRUpdateEN;
|
|
||||||
logic [k-1:0] GHRLookup;
|
|
||||||
|
|
||||||
// Classification of the E-stage outcome from bit 0 of BPInstrClassE versus InstrClassE:
// both clear, only InstrClassE set, only BPInstrClassE set, or both set (the last case is
// split by BPPredDirWrongE).
assign BPClassRightNonCFI = ~BPInstrClassE[0] & ~InstrClassE[0];
|
|
||||||
assign BPClassWrongCFI = ~BPInstrClassE[0] & InstrClassE[0];
|
|
||||||
assign BPClassWrongNonCFI = BPInstrClassE[0] & ~InstrClassE[0];
|
|
||||||
assign BPClassRightBPWrong = BPInstrClassE[0] & InstrClassE[0] & BPPredDirWrongE;
|
|
||||||
assign BPClassRightBPRight = BPInstrClassE[0] & InstrClassE[0] & ~BPPredDirWrongE;
|
|
||||||
|
|
||||||
|
|
||||||
// GHR update selection, 1 hot encoded.
|
|
||||||
assign GHRMuxSel[0] = ~BPInstrClassF[0] & (BPClassRightNonCFI | BPClassRightBPRight);
|
|
||||||
assign GHRMuxSel[1] = BPClassWrongCFI & ~BPInstrClassD[0];
|
|
||||||
assign GHRMuxSel[2] = BPClassWrongNonCFI & ~BPInstrClassD[0];
|
|
||||||
assign GHRMuxSel[3] = (BPClassRightBPWrong & ~BPInstrClassD[0]) | (BPClassWrongCFI & BPInstrClassD[0]);
|
|
||||||
assign GHRMuxSel[4] = BPClassWrongNonCFI & BPInstrClassD[0];
|
|
||||||
assign GHRMuxSel[5] = InstrClassE[0] & BPClassRightBPWrong & BPInstrClassD[0];
|
|
||||||
assign GHRMuxSel[6] = BPInstrClassF[0] & (BPClassRightNonCFI | (InstrClassE[0] & BPClassRightBPRight));
|
|
||||||
// Selects 1..5 load the GHR only when E is not stalled; select 6 only when F is not stalled.
// Select 0 ("no change") never enables the register.
assign GHRUpdateEN = (| GHRMuxSel[5:1] & ~StallE) | GHRMuxSel[6] & ~StallF;
|
|
||||||
|
|
||||||
// Hoping this synthesizes to an AND-OR mux.
// Any select pattern other than the seven listed below falls through to default (hold).
|
|
||||||
always_comb begin
|
|
||||||
case (GHRMuxSel)
|
|
||||||
7'b000_0001: GHRNext = GHR[k-1+2:0]; // no change
|
|
||||||
7'b000_0010: GHRNext = {GHR[k-2+2:0], PCSrcE}; // branch update
|
|
||||||
7'b000_0100: GHRNext = {1'b0, GHR[k+1:1]}; // repair 1
|
|
||||||
7'b000_1000: GHRNext = {GHR[k-1+2:1], PCSrcE}; // branch update with mis prediction correction
|
|
||||||
7'b001_0000: GHRNext = {2'b00, GHR[k+1:2]}; // repair 2
|
|
||||||
7'b010_0000: GHRNext = {1'b0, GHR[k+1:2], PCSrcE}; // branch update + repair 1
|
|
||||||
7'b100_0000: GHRNext = {GHR[k-2+2:0], BPPredF[1]}; // speculative update
|
|
||||||
default: GHRNext = GHR[k-1+2:0];
|
|
||||||
endcase
|
|
||||||
end
|
|
||||||
|
|
||||||
flopenr #(k+2) GlobalHistoryRegister(.clk(clk),
|
|
||||||
.reset(reset),
|
|
||||||
.en((GHRUpdateEN)),
|
|
||||||
.d(GHRNext),
|
|
||||||
.q(GHR));
|
|
||||||
|
|
||||||
// if actively updating the GHR at the time of prediction we want to use
|
|
||||||
// GHRNext as the lookup rather than GHR.
|
|
||||||
|
|
||||||
// PHT write address: a k-bit window of GHR whose starting bit is shifted up by one for
// each of InstrClassE[0] and BPInstrClassD[0] that is set (window starts at bit 0, 1 or 2).
assign PHTUpdateAdr0 = InstrClassE[0] ? GHR[k:1] : GHR[k-1:0];
|
|
||||||
assign PHTUpdateAdr1 = InstrClassE[0] ? GHR[k+1:2] : GHR[k:1];
|
|
||||||
assign PHTUpdateAdr = BPInstrClassD[0] ? PHTUpdateAdr1 : PHTUpdateAdr0;
|
|
||||||
assign PHTUpdateEN = InstrClassE[0] & ~StallE;
|
|
||||||
|
|
||||||
// Read index: low k bits of GHRNext when any of selects 1..6 is set, else low k bits of GHR.
assign GHRLookup = |GHRMuxSel[6:1] ? GHRNext[k-1:0] : GHR[k-1:0];
|
|
||||||
|
|
||||||
// Make Prediction by reading the correct address in the PHT and also update the new address in the PHT
// Positional parameters (k, 2): k address bits, 2-bit entries; bwe2 = 2'b11 enables both bits.
|
|
||||||
ram2p1r1wb #(k, 2) PHT(.clk(clk),
|
|
||||||
.reset(reset),
|
|
||||||
//.RA1(GHR[k-1:0]),
|
|
||||||
.ra1(GHRLookup),
|
|
||||||
.rd1(BPPredF),
|
|
||||||
.ren1(~StallF),
|
|
||||||
.wa2(PHTUpdateAdr),
|
|
||||||
.wd2(UpdateBPPredE),
|
|
||||||
.wen2(PHTUpdateEN),
|
|
||||||
.bwe2(2'b11));
|
|
||||||
|
|
||||||
endmodule
|
|
@ -1,130 +0,0 @@
|
|||||||
///////////////////////////////////////////
|
|
||||||
// globalHistoryPredictor.sv
|
|
||||||
//
|
|
||||||
// Written: Shreya Sanghai
|
|
||||||
// Email: ssanghai@hmc.edu
|
|
||||||
// Created: March 16, 2021
|
|
||||||
// Modified:
|
|
||||||
//
|
|
||||||
// Purpose: Gshare predictor with parameterized global history register
|
|
||||||
//
|
|
||||||
// A component of the CORE-V-WALLY configurable RISC-V project.
|
|
||||||
//
|
|
||||||
// Copyright (C) 2021-23 Harvey Mudd College & Oklahoma State University
|
|
||||||
//
|
|
||||||
// SPDX-License-Identifier: Apache-2.0 WITH SHL-2.1
|
|
||||||
//
|
|
||||||
// Licensed under the Solderpad Hardware License v 2.1 (the “License”); you may not use this file
|
|
||||||
// except in compliance with the License, or, at your option, the Apache License version 2.0. You
|
|
||||||
// may obtain a copy of the License at
|
|
||||||
//
|
|
||||||
// https://solderpad.org/licenses/SHL-2.1/
|
|
||||||
//
|
|
||||||
// Unless required by applicable law or agreed to in writing, any work distributed under the
|
|
||||||
// License is distributed on an “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
|
|
||||||
// either express or implied. See the License for the specific language governing permissions
|
|
||||||
// and limitations under the License.
|
|
||||||
////////////////////////////////////////////////////////////////////////////////////////////////
|
|
||||||
|
|
||||||
`include "wally-config.vh"
|
|
||||||
// Older gshare-style direction predictor.
// Keeps a (`BPRED_SIZE+2)-bit global history register (GHR) and a ram2p1r1wb table (PHT) of
// 2-bit entries. Both the read and the write index are a history slice XORed with PC bits.
// The prediction is pipelined F -> D -> E, where it is compared with PCSrcE and fed through
// satCounter2 to produce the value written back to the PHT.
module oldgsharepredictor
|
|
||||||
(input logic clk,
|
|
||||||
input logic reset,
|
|
||||||
// Only StallF, StallD and StallE are referenced in this module's body; StallM and StallW are unused.
input logic StallF, StallD, StallE, StallM, StallW,
|
|
||||||
// None of the Flush* inputs is referenced in this module's body.
input logic FlushD, FlushE, FlushM, FlushW,
|
|
||||||
// Only PCNextF and PCE are referenced in this module's body; PCF, PCD and PCM are unused.
input logic [`XLEN-1:0] PCNextF, PCF, PCD, PCE, PCM,
|
|
||||||
// PHT read data; bit 1 is also shifted into the GHR on the speculative-update select.
output logic [1:0] DirPredictionF,
|
|
||||||
// update
|
|
||||||
// Only bit 0 of each 5-bit class vector is used in this module.
// NOTE(review): bit 0 presumably marks a conditional branch; InstrClassE looks like the
// resolved class and the BPInstrClass* vectors the predicted class per stage -- confirm.
input logic [4:0] InstrClassE,
|
|
||||||
input logic [4:0] BPInstrClassE,
|
|
||||||
input logic [4:0] BPInstrClassD,
|
|
||||||
input logic [4:0] BPInstrClassF,
|
|
||||||
// High when PCSrcE differs from DirPredictionE[1] and InstrClassE[0] is set.
output logic DirPredictionWrongE,
|
|
||||||
|
|
||||||
// Shifted into the GHR on the branch-update selects and used as BrDir for satCounter2.
input logic PCSrcE
|
|
||||||
|
|
||||||
);
|
|
||||||
// GHR is two bits wider than the PHT index so the update address can be taken from a
// window shifted by up to two positions (see PHTUpdateAdr below).
logic [`BPRED_SIZE+1:0] GHR, GHRNext;
|
|
||||||
logic [`BPRED_SIZE-1:0] PHTUpdateAdr, PHTUpdateAdr0, PHTUpdateAdr1;
|
|
||||||
logic PHTUpdateEN;
|
|
||||||
logic BPClassWrongNonCFI;
|
|
||||||
logic BPClassWrongCFI;
|
|
||||||
logic BPClassRightNonCFI;
|
|
||||||
logic BPClassRightBPWrong;
|
|
||||||
logic BPClassRightBPRight;
|
|
||||||
// F-stage prediction delayed to D and E.
logic [1:0] DirPredictionD, DirPredictionE;
|
|
||||||
// satCounter2 output; written back to the PHT.
logic [1:0] NewDirPredictionE;
|
|
||||||
|
|
||||||
logic [6:0] GHRMuxSel;
|
|
||||||
logic GHRUpdateEN;
|
|
||||||
logic [`BPRED_SIZE-1:0] GHRLookup;
|
|
||||||
|
|
||||||
// Classification of the E-stage outcome from bit 0 of BPInstrClassE versus InstrClassE:
// both clear, only InstrClassE set, only BPInstrClassE set, or both set (the last case is
// split by DirPredictionWrongE).
assign BPClassRightNonCFI = ~BPInstrClassE[0] & ~InstrClassE[0];
|
|
||||||
assign BPClassWrongCFI = ~BPInstrClassE[0] & InstrClassE[0];
|
|
||||||
assign BPClassWrongNonCFI = BPInstrClassE[0] & ~InstrClassE[0];
|
|
||||||
assign BPClassRightBPWrong = BPInstrClassE[0] & InstrClassE[0] & DirPredictionWrongE;
|
|
||||||
assign BPClassRightBPRight = BPInstrClassE[0] & InstrClassE[0] & ~DirPredictionWrongE;
|
|
||||||
|
|
||||||
|
|
||||||
// GHR update selection, 1 hot encoded.
|
|
||||||
assign GHRMuxSel[0] = ~BPInstrClassF[0] & (BPClassRightNonCFI | BPClassRightBPRight);
|
|
||||||
assign GHRMuxSel[1] = BPClassWrongCFI & ~BPInstrClassD[0];
|
|
||||||
assign GHRMuxSel[2] = BPClassWrongNonCFI & ~BPInstrClassD[0];
|
|
||||||
assign GHRMuxSel[3] = (BPClassRightBPWrong & ~BPInstrClassD[0]) | (BPClassWrongCFI & BPInstrClassD[0]);
|
|
||||||
assign GHRMuxSel[4] = BPClassWrongNonCFI & BPInstrClassD[0];
|
|
||||||
assign GHRMuxSel[5] = InstrClassE[0] & BPClassRightBPWrong & BPInstrClassD[0];
|
|
||||||
assign GHRMuxSel[6] = BPInstrClassF[0] & (BPClassRightNonCFI | (InstrClassE[0] & BPClassRightBPRight));
|
|
||||||
// Selects 1..5 load the GHR only when E is not stalled; select 6 only when F is not stalled.
// Select 0 ("no change") never enables the register.
assign GHRUpdateEN = (| GHRMuxSel[5:1] & ~StallE) | GHRMuxSel[6] & ~StallF;
|
|
||||||
|
|
||||||
// Hoping this synthesizes to an AND-OR mux.
// Any select pattern other than the seven listed below falls through to default (hold).
|
|
||||||
always_comb begin
|
|
||||||
case (GHRMuxSel)
|
|
||||||
7'b000_0001: GHRNext = GHR[`BPRED_SIZE-1+2:0]; // no change
|
|
||||||
7'b000_0010: GHRNext = {GHR[`BPRED_SIZE-2+2:0], PCSrcE}; // branch update
|
|
||||||
7'b000_0100: GHRNext = {1'b0, GHR[`BPRED_SIZE+1:1]}; // repair 1
|
|
||||||
7'b000_1000: GHRNext = {GHR[`BPRED_SIZE-1+2:1], PCSrcE}; // branch update with mis prediction correction
|
|
||||||
7'b001_0000: GHRNext = {2'b00, GHR[`BPRED_SIZE+1:2]}; // repair 2
|
|
||||||
7'b010_0000: GHRNext = {1'b0, GHR[`BPRED_SIZE+1:2], PCSrcE}; // branch update + repair 1
|
|
||||||
7'b100_0000: GHRNext = {GHR[`BPRED_SIZE-2+2:0], DirPredictionF[1]}; // speculative update
|
|
||||||
default: GHRNext = GHR[`BPRED_SIZE-1+2:0];
|
|
||||||
endcase
|
|
||||||
end
|
|
||||||
|
|
||||||
flopenr #(`BPRED_SIZE+2) GlobalHistoryRegister(.clk(clk),
|
|
||||||
.reset(reset),
|
|
||||||
.en((GHRUpdateEN)),
|
|
||||||
.d(GHRNext),
|
|
||||||
.q(GHR));
|
|
||||||
|
|
||||||
// if actively updating the GHR at the time of prediction we want to use
|
|
||||||
// GHRNext as the lookup rather than GHR.
|
|
||||||
|
|
||||||
// History part of the PHT write address: a `BPRED_SIZE-bit window of GHR whose starting bit
// is shifted up by one for each of InstrClassE[0] and BPInstrClassD[0] that is set.
assign PHTUpdateAdr0 = InstrClassE[0] ? GHR[`BPRED_SIZE:1] : GHR[`BPRED_SIZE-1:0];
|
|
||||||
assign PHTUpdateAdr1 = InstrClassE[0] ? GHR[`BPRED_SIZE+1:2] : GHR[`BPRED_SIZE:1];
|
|
||||||
assign PHTUpdateAdr = BPInstrClassD[0] ? PHTUpdateAdr1 : PHTUpdateAdr0;
|
|
||||||
assign PHTUpdateEN = InstrClassE[0] & ~StallE;
|
|
||||||
|
|
||||||
// History part of the read index: low bits of GHRNext when any of selects 1..6 is set,
// else low bits of GHR.
assign GHRLookup = |GHRMuxSel[6:1] ? GHRNext[`BPRED_SIZE-1:0] : GHR[`BPRED_SIZE-1:0];
|
|
||||||
|
|
||||||
// Make Prediction by reading the correct address in the PHT and also update the new address in the PHT
// Read index is GHRLookup XOR PCNextF[`BPRED_SIZE:1]; write index is PHTUpdateAdr XOR
// PCE[`BPRED_SIZE:1]. bwe2 = 2'b11 enables both bits of the 2-bit entry.
|
|
||||||
ram2p1r1wb #(`BPRED_SIZE, 2) PHT(.clk(clk),
|
|
||||||
.reset(reset),
|
|
||||||
//.RA1(GHR[`BPRED_SIZE-1:0]),
|
|
||||||
.ra1(GHRLookup ^ PCNextF[`BPRED_SIZE:1]),
|
|
||||||
.rd1(DirPredictionF),
|
|
||||||
.ren1(~StallF),
|
|
||||||
.wa2(PHTUpdateAdr ^ PCE[`BPRED_SIZE:1]),
|
|
||||||
.wd2(NewDirPredictionE),
|
|
||||||
.wen2(PHTUpdateEN),
|
|
||||||
.bwe2(2'b11));
|
|
||||||
|
|
||||||
// DirPrediction pipeline: carry the F-stage PHT read data to D and then E
|
|
||||||
flopenr #(2) PredictionRegD(clk, reset, ~StallD, DirPredictionF, DirPredictionD);
|
|
||||||
flopenr #(2) PredictionRegE(clk, reset, ~StallE, DirPredictionD, DirPredictionE);
|
|
||||||
|
|
||||||
// New prediction pipeline
// NOTE(review): satCounter2 is defined elsewhere -- presumably a 2-bit saturating counter
// stepped by BrDir; confirm.
|
|
||||||
satCounter2 BPDirUpdateE(.BrDir(PCSrcE), .OldState(DirPredictionE), .NewState(NewDirPredictionE));
|
|
||||||
|
|
||||||
// != binds tighter than &, so this is (PCSrcE != DirPredictionE[1]) & InstrClassE[0].
assign DirPredictionWrongE = PCSrcE != DirPredictionE[1] & InstrClassE[0];
|
|
||||||
|
|
||||||
endmodule // oldgsharepredictor
|
|
@ -1,130 +0,0 @@
|
|||||||
///////////////////////////////////////////
|
|
||||||
// globalHistoryPredictor.sv
|
|
||||||
//
|
|
||||||
// Written: Shreya Sanghai
|
|
||||||
// Email: ssanghai@hmc.edu
|
|
||||||
// Created: March 16, 2021
|
|
||||||
// Modified:
|
|
||||||
//
|
|
||||||
// Purpose: Gshare predictor with parameterized global history register
|
|
||||||
//
|
|
||||||
// A component of the CORE-V-WALLY configurable RISC-V project.
|
|
||||||
//
|
|
||||||
// Copyright (C) 2021-23 Harvey Mudd College & Oklahoma State University
|
|
||||||
//
|
|
||||||
// SPDX-License-Identifier: Apache-2.0 WITH SHL-2.1
|
|
||||||
//
|
|
||||||
// Licensed under the Solderpad Hardware License v 2.1 (the “License”); you may not use this file
|
|
||||||
// except in compliance with the License, or, at your option, the Apache License version 2.0. You
|
|
||||||
// may obtain a copy of the License at
|
|
||||||
//
|
|
||||||
// https://solderpad.org/licenses/SHL-2.1/
|
|
||||||
//
|
|
||||||
// Unless required by applicable law or agreed to in writing, any work distributed under the
|
|
||||||
// License is distributed on an “AS IS” BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
|
|
||||||
// either express or implied. See the License for the specific language governing permissions
|
|
||||||
// and limitations under the License.
|
|
||||||
////////////////////////////////////////////////////////////////////////////////////////////////
|
|
||||||
|
|
||||||
`include "wally-config.vh"
|
|
||||||
// oldgsharepredictor2
//
// Direction predictor built from a global history register (GHR) and a
// pattern history table (PHT) of 2-bit counters.  The PHT is read with
// (history XOR PCNextF bits) and written with (history XOR PCE bits).
//
// The GHR is `BPRED_SIZE+2 bits wide, i.e. two bits wider than the PHT index,
// so that the history can be shifted back ("repaired") by one or two positions.
//
// Only bit 0 of each instruction-class vector is examined here.
// NOTE(review): bit 0 presumably flags a conditional branch - confirm against
// the class encoding used by the rest of the branch predictor.
//
// StallM, StallW, FlushD/E/M/W, PCF, PCD and PCM are part of the port list but
// are not referenced inside this module.
module oldgsharepredictor2 (
  input  logic             clk,
  input  logic             reset,
  input  logic             StallF, StallD, StallE, StallM, StallW,
  input  logic             FlushD, FlushE, FlushM, FlushW,
  input  logic [`XLEN-1:0] PCNextF, PCF, PCD, PCE, PCM,
  output logic [1:0]       DirPredictionF,
  // update
  input  logic [4:0]       InstrClassE,
  input  logic [4:0]       BPInstrClassE,
  input  logic [4:0]       BPInstrClassD,
  input  logic [4:0]       BPInstrClassF,
  output logic             DirPredictionWrongE,
  input  logic             PCSrcE
);

  // Global history: current value, next value and the slice used for lookup.
  logic [`BPRED_SIZE+1:0] GHR, GHRNext;
  logic [`BPRED_SIZE-1:0] GHRLookup;
  logic [6:0]             GHRMuxSel;
  logic                   GHRUpdateEN;

  // Pattern history table addressing.
  logic [`BPRED_SIZE-1:0] PHTUpdateAdr, PHTUpdateAdr0, PHTUpdateAdr1;
  logic [`BPRED_SIZE-1:0] PHTReadAdr, PHTWriteAdr;
  logic                   PHTUpdateEN;

  // Comparison of the predicted class (BPInstrClassE[0]) with the actual
  // class (InstrClassE[0]) in the E stage.
  logic                   BPClassRightNonCFI;
  logic                   BPClassWrongCFI;
  logic                   BPClassWrongNonCFI;
  logic                   BPClassRightBPWrong;
  logic                   BPClassRightBPRight;

  // Counter values travelling down the pipeline and the updated counter.
  logic [1:0]             DirPredictionD, DirPredictionE;
  logic [1:0]             NewDirPredictionE;

  // The prediction is wrong when the resolved direction differs from the MSB
  // of the counter read for this instruction (1-bit XOR == 1-bit inequality).
  assign DirPredictionWrongE = (PCSrcE ^ DirPredictionE[1]) & InstrClassE[0];

  // Four class outcomes; the "both set" outcome is split by direction result.
  assign BPClassRightNonCFI  = ~(BPInstrClassE[0] | InstrClassE[0]);
  assign BPClassWrongCFI     = InstrClassE[0]   & ~BPInstrClassE[0];
  assign BPClassWrongNonCFI  = BPInstrClassE[0] & ~InstrClassE[0];
  assign BPClassRightBPWrong = BPInstrClassE[0] & InstrClassE[0] &  DirPredictionWrongE;
  assign BPClassRightBPRight = BPInstrClassE[0] & InstrClassE[0] & ~DirPredictionWrongE;

  // GHR update selection, 1 hot encoded.  Listed MSB first.
  assign GHRMuxSel = {
    BPInstrClassF[0] & (BPClassRightNonCFI | (InstrClassE[0] & BPClassRightBPRight)), // [6] speculative update
    InstrClassE[0] & BPClassRightBPWrong & BPInstrClassD[0],                          // [5] branch update + repair 1
    BPClassWrongNonCFI & BPInstrClassD[0],                                            // [4] repair 2
    (BPClassRightBPWrong & ~BPInstrClassD[0]) | (BPClassWrongCFI & BPInstrClassD[0]), // [3] branch update with correction
    BPClassWrongNonCFI & ~BPInstrClassD[0],                                           // [2] repair 1
    BPClassWrongCFI & ~BPInstrClassD[0],                                              // [1] branch update
    ~BPInstrClassF[0] & (BPClassRightNonCFI | BPClassRightBPRight)                    // [0] no change
  };

  // Selects 5:1 are gated by the E-stage stall, select 6 by the F-stage stall.
  assign GHRUpdateEN = ((|GHRMuxSel[5:1]) & ~StallE) | (GHRMuxSel[6] & ~StallF);

  // Next-history mux.  Holding the current value is the fall-back, which also
  // covers the "no change" select (7'b000_0001) and any non-one-hot pattern.
  always_comb begin
    GHRNext = GHR;
    case (GHRMuxSel)
      7'b100_0000: GHRNext = {GHR[`BPRED_SIZE:0], DirPredictionF[1]};     // speculative update
      7'b010_0000: GHRNext = {1'b0, GHR[`BPRED_SIZE+1:2], PCSrcE};        // branch update + repair 1
      7'b001_0000: GHRNext = {2'b00, GHR[`BPRED_SIZE+1:2]};               // repair 2
      7'b000_1000: GHRNext = {GHR[`BPRED_SIZE+1:1], PCSrcE};              // branch update with mis prediction correction
      7'b000_0100: GHRNext = {1'b0, GHR[`BPRED_SIZE+1:1]};                // repair 1
      7'b000_0010: GHRNext = {GHR[`BPRED_SIZE:0], PCSrcE};                // branch update
      default: ;                                                          // keep GHR
    endcase
  end

  flopenr #(`BPRED_SIZE+2) GlobalHistoryRegister(
    .clk(clk),
    .reset(reset),
    .en(GHRUpdateEN),
    .d(GHRNext),
    .q(GHR));

  // Write-side history: the GHR window is taken one position higher when
  // InstrClassE[0] is set and one more position higher when BPInstrClassD[0]
  // is set.
  assign PHTUpdateAdr0 = InstrClassE[0]   ? GHR[`BPRED_SIZE:1]   : GHR[`BPRED_SIZE-1:0];
  assign PHTUpdateAdr1 = InstrClassE[0]   ? GHR[`BPRED_SIZE+1:2] : GHR[`BPRED_SIZE:1];
  assign PHTUpdateAdr  = BPInstrClassD[0] ? PHTUpdateAdr1        : PHTUpdateAdr0;
  assign PHTUpdateEN   = InstrClassE[0] & ~StallE;

  // If the GHR is actively being updated at the time of prediction we want to
  // use GHRNext as the lookup rather than GHR.
  assign GHRLookup = (|GHRMuxSel[6:1]) ? GHRNext[`BPRED_SIZE-1:0] : GHR[`BPRED_SIZE-1:0];

  // PHT indexes: history XORed with PC bits [`BPRED_SIZE:1].
  assign PHTReadAdr  = GHRLookup    ^ PCNextF[`BPRED_SIZE:1];
  assign PHTWriteAdr = PHTUpdateAdr ^ PCE[`BPRED_SIZE:1];

  // Make the prediction by reading the PHT at the lookup index and, on the
  // second port, write the updated counter for the instruction in E.
  ram2p1r1wb #(`BPRED_SIZE, 2) PHT(
    .clk(clk),
    .reset(reset),
    .ra1(PHTReadAdr),
    .rd1(DirPredictionF),
    .ren1(~StallF),
    .wa2(PHTWriteAdr),
    .wd2(NewDirPredictionE),
    .wen2(PHTUpdateEN),
    .bwe2(2'b11));

  // DirPrediction pipeline: carry the counter that was read in F down to E.
  flopenr #(2) PredictionRegD(.clk(clk), .reset(reset), .en(~StallD), .d(DirPredictionF), .q(DirPredictionD));
  flopenr #(2) PredictionRegE(.clk(clk), .reset(reset), .en(~StallE), .d(DirPredictionD), .q(DirPredictionE));

  // New prediction: next counter state given the resolved direction.
  satCounter2 BPDirUpdateE(
    .BrDir(PCSrcE),
    .OldState(DirPredictionE),
    .NewState(NewDirPredictionE));

endmodule // oldgsharepredictor2
|
|
@ -8,6 +8,7 @@ NAME := synth
|
|||||||
export DESIGN ?= wallypipelinedcore
|
export DESIGN ?= wallypipelinedcore
|
||||||
export FREQ ?= 3000
|
export FREQ ?= 3000
|
||||||
export CONFIG ?= rv32e
|
export CONFIG ?= rv32e
|
||||||
|
export MOD ?= orig
|
||||||
# title to add a note in the synth's directory name
|
# title to add a note in the synth's directory name
|
||||||
TITLE =
|
TITLE =
|
||||||
# tsmc28, sky130, and sky90 presently supported
|
# tsmc28, sky130, and sky90 presently supported
|
||||||
@ -22,13 +23,15 @@ export DRIVE ?= FLOP
|
|||||||
|
|
||||||
time := $(shell date +%F-%H-%M)
|
time := $(shell date +%F-%H-%M)
|
||||||
hash := $(shell git rev-parse --short HEAD)
|
hash := $(shell git rev-parse --short HEAD)
|
||||||
export OUTPUTDIR := runs/$(DESIGN)_$(CONFIG)_$(TECH)nm_$(FREQ)_MHz_$(time)_$(TITLE)_$(hash)
|
export OUTPUTDIR := runs/$(DESIGN)_$(CONFIG)_$(MOD)_$(TECH)nm_$(FREQ)_MHz_$(time)_$(TITLE)_$(hash)
|
||||||
export SAIFPOWER ?= 0
|
export SAIFPOWER ?= 0
|
||||||
|
|
||||||
CONFIGDIR ?= ${WALLY}/pipelined/config
|
configAsList := $(subst _, ,$(CONFIG))
|
||||||
|
BASECONFIG := $(word 1, $(configAsList))
|
||||||
|
OLDCONFIGDIR ?= ${WALLY}/pipelined/config
|
||||||
|
CONFIGDIR ?= $(OUTPUTDIR)/hdl/config
|
||||||
CONFIGFILES ?= $(shell find $(CONFIGDIR) -name rv*_*)
|
CONFIGFILES ?= $(shell find $(CONFIGDIR) -name rv*_*)
|
||||||
CONFIGFILESTRIM = $(notdir $(CONFIGFILES))
|
CONFIGFILESTRIM = $(notdir $(CONFIGFILES))
|
||||||
# FREQS = 25 50 100 150 200 250 300 350 400
|
|
||||||
# k = 3 6
|
# k = 3 6
|
||||||
|
|
||||||
print:
|
print:
|
||||||
@ -42,8 +45,8 @@ default:
|
|||||||
@echo "Use wallySynth.py to run a concurrent sweep "
|
@echo "Use wallySynth.py to run a concurrent sweep "
|
||||||
|
|
||||||
|
|
||||||
DIRS32 = rv32e rv32gc rv32ic
|
DIRS32 = rv32e rv32gc rv32ic rv32i
|
||||||
DIRS64 = rv64ic rv64gc
|
DIRS64 = rv64i rv64gc
|
||||||
DIRS = $(DIRS32) $(DIRS64)
|
DIRS = $(DIRS32) $(DIRS64)
|
||||||
|
|
||||||
# bpred:
|
# bpred:
|
||||||
@ -51,73 +54,72 @@ DIRS = $(DIRS32) $(DIRS64)
|
|||||||
# @$(foreach kval, $(k), cp -r $(CONFIGDIR)/rv64gc $(CONFIGDIR)/rv64gc_bpred_$(kval);)
|
# @$(foreach kval, $(k), cp -r $(CONFIGDIR)/rv64gc $(CONFIGDIR)/rv64gc_bpred_$(kval);)
|
||||||
# @$(foreach kval, $(k), sed -i 's/BPRED_SIZE.*/BPRED_SIZE $(kval)/g' $(CONFIGDIR)/rv64gc_bpred_$(kval)/wally-config.vh;)
|
# @$(foreach kval, $(k), sed -i 's/BPRED_SIZE.*/BPRED_SIZE $(kval)/g' $(CONFIGDIR)/rv64gc_bpred_$(kval)/wally-config.vh;)
|
||||||
# @$(foreach kval, $(k), make synth DESIGN=wallypipelinedcore CONFIG=rv64gc_bpred_$(kval) TECH=sky90 FREQ=500 MAXCORES=4 --jobs;)
|
# @$(foreach kval, $(k), make synth DESIGN=wallypipelinedcore CONFIG=rv64gc_bpred_$(kval) TECH=sky90 FREQ=500 MAXCORES=4 --jobs;)
|
||||||
copy:
|
|
||||||
# remove old config files
|
|
||||||
rm -rf $(CONFIGDIR)/*_*
|
|
||||||
|
|
||||||
@$(foreach dir, $(DIRS), rm -rf $(CONFIGDIR)/$(dir)_orig;)
|
configs: $(BASECONFIG)
|
||||||
@$(foreach dir, $(DIRS), cp -r $(CONFIGDIR)/$(dir) $(CONFIGDIR)/$(dir)_orig;)
|
$(BASECONFIG):
|
||||||
@$(foreach dir, $(DIRS), sed -i 's/WAYSIZEINBYTES.*/WAYSIZEINBYTES 512/g' $(CONFIGDIR)/$(dir)_orig/wally-config.vh;)
|
@echo $(BASECONFIG)
|
||||||
@$(foreach dir, $(DIRS), sed -i 's/NUMWAYS.*/NUMWAYS 1/g' $(CONFIGDIR)/$(dir)_orig/wally-config.vh;)
|
cp -r $(OLDCONFIGDIR)/$(BASECONFIG) $(CONFIGDIR)/$(BASECONFIG)_orig
|
||||||
@$(foreach dir, $(DIRS), sed -i 's/BPRED_SIZE.*/BPRED_SIZE 4/g' $(CONFIGDIR)/$(dir)_orig/wally-config.vh;)
|
sed -i 's/WAYSIZEINBYTES.*/WAYSIZEINBYTES 512/g' $(CONFIGDIR)/$(BASECONFIG)_orig/wally-config.vh
|
||||||
|
sed -i 's/NUMWAYS.*/NUMWAYS 1/g' $(CONFIGDIR)/$(BASECONFIG)_orig/wally-config.vh
|
||||||
|
sed -i 's/BPRED_SIZE.*/BPRED_SIZE 4/g' $(CONFIGDIR)/$(BASECONFIG)_orig/wally-config.vh
|
||||||
|
|
||||||
@$(foreach dir, $(DIRS32), sed -i "s/RAM_RANGE.*/RAM_RANGE 34\'h01FF/g" $(CONFIGDIR)/$(dir)_orig/wally-config.vh ;)
|
ifneq ($(filter $ $(BASECONFIG), $(DIRS32)),)
|
||||||
@$(foreach dir, $(DIRS64), sed -i "s/RAM_RANGE.*/RAM_RANGE 56\'h01FF/g" $(CONFIGDIR)/$(dir)_orig/wally-config.vh ;)
|
sed -i "s/RAM_RANGE.*/RAM_RANGE 34\'h01FF/g" $(CONFIGDIR)/$(BASECONFIG)_orig/wally-config.vh
|
||||||
|
else ifneq ($(filter $ $(BASECONFIG), $(DIRS64)),)
|
||||||
configs: $(DIRS)
|
sed -i "s/RAM_RANGE.*/RAM_RANGE 56\'h01FF/g" $(CONFIGDIR)/$(BASECONFIG)_orig/wally-config.vh
|
||||||
$(DIRS):
|
else
|
||||||
|
$(info $(BASECONFIG) does not exist in $(DIRS32) or $(DIRS64))
|
||||||
|
@echo "Config not in list, RAM_RANGE will be unmodified"
|
||||||
|
endif
|
||||||
|
|
||||||
# turn off FPU
|
# turn off FPU
|
||||||
rm -rf $(CONFIGDIR)/$@_FPUoff
|
|
||||||
cp -r $(CONFIGDIR)/$@_orig $(CONFIGDIR)/$@_FPUoff
|
cp -r $(CONFIGDIR)/$@_orig $(CONFIGDIR)/$@_FPUoff
|
||||||
sed -i 's/1 *<< *3/0 << 3/' $(CONFIGDIR)/$@_FPUoff/wally-config.vh
|
sed -i 's/1 *<< *3/0 << 3/' $(CONFIGDIR)/$@_FPUoff/wally-config.vh
|
||||||
sed -i 's/1 *<< *5/0 << 5/' $(CONFIGDIR)/$@_FPUoff/wally-config.vh
|
sed -i 's/1 *<< *5/0 << 5/' $(CONFIGDIR)/$@_FPUoff/wally-config.vh
|
||||||
|
|
||||||
# PMP 16
|
# PMP 16
|
||||||
rm -rf $(CONFIGDIR)/$@_PMP16
|
|
||||||
cp -r $(CONFIGDIR)/$@_FPUoff $(CONFIGDIR)/$@_PMP16
|
cp -r $(CONFIGDIR)/$@_FPUoff $(CONFIGDIR)/$@_PMP16
|
||||||
sed -i 's/PMP_ENTRIES \(64\|16\|0\)/PMP_ENTRIES 16/' $(CONFIGDIR)/$@_PMP16/wally-config.vh
|
sed -i 's/PMP_ENTRIES \(64\|16\|0\)/PMP_ENTRIES 16/' $(CONFIGDIR)/$@_PMP16/wally-config.vh
|
||||||
|
|
||||||
# PMP 0
|
# PMP 0
|
||||||
rm -rf $(CONFIGDIR)/$@_PMP0
|
|
||||||
cp -r $(CONFIGDIR)/$@_FPUoff $(CONFIGDIR)/$@_PMP0
|
cp -r $(CONFIGDIR)/$@_FPUoff $(CONFIGDIR)/$@_PMP0
|
||||||
sed -i 's/PMP_ENTRIES \(64\|16\|0\)/PMP_ENTRIES 0/' $(CONFIGDIR)/$@_PMP0/wally-config.vh
|
sed -i 's/PMP_ENTRIES \(64\|16\|0\)/PMP_ENTRIES 0/' $(CONFIGDIR)/$@_PMP0/wally-config.vh
|
||||||
|
|
||||||
# no muldiv
|
# no muldiv
|
||||||
rm -rf $(CONFIGDIR)/$@_noMulDiv
|
|
||||||
cp -r $(CONFIGDIR)/$@_PMP0 $(CONFIGDIR)/$@_noMulDiv
|
cp -r $(CONFIGDIR)/$@_PMP0 $(CONFIGDIR)/$@_noMulDiv
|
||||||
sed -i 's/1 *<< *12/0 << 12/' $(CONFIGDIR)/$@_noMulDiv/wally-config.vh
|
sed -i 's/1 *<< *12/0 << 12/' $(CONFIGDIR)/$@_noMulDiv/wally-config.vh
|
||||||
|
|
||||||
# no priv
|
# no priv
|
||||||
rm -rf $(CONFIGDIR)/$@_noPriv
|
|
||||||
cp -r $(CONFIGDIR)/$@_noMulDiv $(CONFIGDIR)/$@_noPriv
|
cp -r $(CONFIGDIR)/$@_noMulDiv $(CONFIGDIR)/$@_noPriv
|
||||||
sed -i 's/ZICSR_SUPPORTED *1/ZICSR_SUPPORTED 0/' $(CONFIGDIR)/$@_noPriv/wally-config.vh
|
sed -i 's/ZICSR_SUPPORTED *1/ZICSR_SUPPORTED 0/' $(CONFIGDIR)/$@_noPriv/wally-config.vh
|
||||||
|
|
||||||
|
ifeq ($(SAIFPOWER), 1)
|
||||||
|
cp -f ../pipelined/regression/power.saif .
|
||||||
|
endif
|
||||||
|
|
||||||
freqs:
|
freqs:
|
||||||
@$(foreach freq, $(FREQS), make synth DESIGN=wallypipelinedcore CONFIG=rv32e FREQ=$(freq) MAXCORES=1;)
|
@$(foreach freq, $(FREQS), make synth DESIGN=wallypipelinedcore CONFIG=rv32e FREQ=$(freq) MAXCORES=1;)
|
||||||
|
|
||||||
synth:
|
mkdirecs:
|
||||||
@echo "DC Synthesis"
|
@echo "DC Synthesis"
|
||||||
@mkdir -p $(OUTPUTDIR)
|
@mkdir -p $(OUTPUTDIR)
|
||||||
@mkdir -p $(OUTPUTDIR)/hdl
|
@mkdir -p $(OUTPUTDIR)/hdl/config
|
||||||
@mkdir -p $(OUTPUTDIR)/reports
|
@mkdir -p $(OUTPUTDIR)/reports
|
||||||
@mkdir -p $(OUTPUTDIR)/mapped
|
@mkdir -p $(OUTPUTDIR)/mapped
|
||||||
@mkdir -p $(OUTPUTDIR)/unmapped
|
@mkdir -p $(OUTPUTDIR)/unmapped
|
||||||
ifeq ($(SAIFPOWER), 1)
|
|
||||||
cp -f ../pipelined/regression/power.saif .
|
synth: mkdirecs configs rundc clean
|
||||||
endif
|
|
||||||
|
rundc:
|
||||||
dc_shell-xg-t -64bit -f scripts/$(NAME).tcl | tee $(OUTPUTDIR)/$(NAME).out
|
dc_shell-xg-t -64bit -f scripts/$(NAME).tcl | tee $(OUTPUTDIR)/$(NAME).out
|
||||||
# rm -rf $(OUTPUTDIR)/hdl
|
|
||||||
|
clean:
|
||||||
|
rm -rf $(OUTPUTDIR)/hdl
|
||||||
rm -rf $(OUTPUTDIR)/WORK
|
rm -rf $(OUTPUTDIR)/WORK
|
||||||
rm -rf $(OUTPUTDIR)/alib-52
|
rm -rf $(OUTPUTDIR)/alib-52
|
||||||
|
|
||||||
clean:
|
|
||||||
rm -f default.svf
|
rm -f default.svf
|
||||||
rm -f command.log
|
rm -f command.log
|
||||||
rm -f filenames*.log
|
rm -f filenames*.log
|
||||||
rm -f power.saif
|
rm -f power.saif
|
||||||
rm -f Synopsys_stack_trace_*.txt
|
rm -f Synopsys_stack_trace_*.txt
|
||||||
rm -f crte_*.txt
|
rm -f crte_*.txt
|
||||||
|
|
||||||
fresh: clean copy configs
|
|
||||||
@echo "synth directory cleaned and fresh config files written"
|
|
@ -28,16 +28,16 @@ def synthsintocsv():
|
|||||||
|
|
||||||
file = open("Summary.csv", "w")
|
file = open("Summary.csv", "w")
|
||||||
writer = csv.writer(file)
|
writer = csv.writer(file)
|
||||||
writer.writerow(['Width', 'Config', 'Special', 'Tech', 'Target Freq', 'Delay', 'Area'])
|
writer.writerow(['Width', 'Config', 'Mod', 'Tech', 'Target Freq', 'Delay', 'Area'])
|
||||||
|
|
||||||
for oneSynth in allSynths:
|
for oneSynth in allSynths:
|
||||||
descrip = specReg.findall(oneSynth)
|
descrip = specReg.findall(oneSynth)
|
||||||
width = descrip[2][:4]
|
width = descrip[2][:4]
|
||||||
config = descrip[2][4:]
|
config = descrip[2][4:]
|
||||||
if descrip[3][-2:] == 'nm':
|
if descrip[3][-2:] == 'nm':
|
||||||
special = ''
|
mod = ''
|
||||||
else:
|
else:
|
||||||
special = descrip[3]
|
mod = descrip[3]
|
||||||
descrip = descrip[1:]
|
descrip = descrip[1:]
|
||||||
tech = descrip[3][:-2]
|
tech = descrip[3][:-2]
|
||||||
freq = descrip[4]
|
freq = descrip[4]
|
||||||
@ -57,12 +57,12 @@ def synthsintocsv():
|
|||||||
else:
|
else:
|
||||||
delay = 1000/int(freq) - metrics[0]
|
delay = 1000/int(freq) - metrics[0]
|
||||||
area = metrics[1]
|
area = metrics[1]
|
||||||
writer.writerow([width, config, special, tech, freq, delay, area])
|
writer.writerow([width, config, mod, tech, freq, delay, area])
|
||||||
file.close()
|
file.close()
|
||||||
|
|
||||||
|
|
||||||
def synthsfromcsv(filename):
|
def synthsfromcsv(filename):
|
||||||
Synth = namedtuple("Synth", "width config special tech freq delay area")
|
Synth = namedtuple("Synth", "width config mod tech freq delay area")
|
||||||
with open(filename, newline='') as csvfile:
|
with open(filename, newline='') as csvfile:
|
||||||
csvreader = csv.reader(csvfile)
|
csvreader = csv.reader(csvfile)
|
||||||
global allSynths
|
global allSynths
|
||||||
@ -81,14 +81,9 @@ def freqPlot(tech, width, config):
|
|||||||
''' plots delay, area for syntheses with specified tech, module, width
|
''' plots delay, area for syntheses with specified tech, module, width
|
||||||
'''
|
'''
|
||||||
|
|
||||||
current_directory = os.getcwd()
|
|
||||||
final_directory = os.path.join(current_directory, 'plots/wally')
|
|
||||||
if not os.path.exists(final_directory):
|
|
||||||
os.makedirs(final_directory)
|
|
||||||
|
|
||||||
freqsL, delaysL, areasL = ([[], []] for i in range(3))
|
freqsL, delaysL, areasL = ([[], []] for i in range(3))
|
||||||
for oneSynth in allSynths:
|
for oneSynth in allSynths:
|
||||||
if (width == oneSynth.width) & (config == oneSynth.config) & (tech == oneSynth.tech) & ('' == oneSynth.special):
|
if (width == oneSynth.width) & (config == oneSynth.config) & (tech == oneSynth.tech) & ('orig' == oneSynth.mod):
|
||||||
ind = (1000/oneSynth.delay < oneSynth.freq) # when delay is within target clock period
|
ind = (1000/oneSynth.delay < oneSynth.freq) # when delay is within target clock period
|
||||||
freqsL[ind] += [oneSynth.freq]
|
freqsL[ind] += [oneSynth.freq]
|
||||||
delaysL[ind] += [oneSynth.delay]
|
delaysL[ind] += [oneSynth.delay]
|
||||||
@ -130,7 +125,7 @@ def freqPlot(tech, width, config):
|
|||||||
ax2.yaxis.set_major_formatter(ticker.StrMethodFormatter('{x:,.0f}'))
|
ax2.yaxis.set_major_formatter(ticker.StrMethodFormatter('{x:,.0f}'))
|
||||||
addFO4axis(fig, ax1, tech)
|
addFO4axis(fig, ax1, tech)
|
||||||
|
|
||||||
plt.savefig('./plots/wally/freqSweep_' + tech + '_' + width + config + '.png')
|
plt.savefig(final_directory + '/freqSweep_' + tech + '_' + width + config + '.png')
|
||||||
|
|
||||||
|
|
||||||
def areaDelay(tech, delays, areas, labels, fig, ax, norm=False):
|
def areaDelay(tech, delays, areas, labels, fig, ax, norm=False):
|
||||||
@ -168,7 +163,7 @@ def plotFeatures(tech, width, config):
|
|||||||
if (oneSynth.config == config) & (width == oneSynth.width):
|
if (oneSynth.config == config) & (width == oneSynth.width):
|
||||||
delays += [oneSynth.delay]
|
delays += [oneSynth.delay]
|
||||||
areas += [oneSynth.area]
|
areas += [oneSynth.area]
|
||||||
labels += [oneSynth.special]
|
labels += [oneSynth.mod]
|
||||||
|
|
||||||
fig, (ax) = plt.subplots(1, 1)
|
fig, (ax) = plt.subplots(1, 1)
|
||||||
|
|
||||||
@ -176,28 +171,28 @@ def plotFeatures(tech, width, config):
|
|||||||
|
|
||||||
titlestr = tech+'_'+width+config
|
titlestr = tech+'_'+width+config
|
||||||
plt.title(titlestr)
|
plt.title(titlestr)
|
||||||
plt.savefig('./plots/wally/features_'+titlestr+'.png')
|
plt.savefig(final_directory + '/features_'+titlestr+'.png')
|
||||||
|
|
||||||
|
|
||||||
def plotConfigs(tech, special=''):
|
def plotConfigs(tech, mod=''):
|
||||||
delays, areas, labels = ([] for i in range(3))
|
delays, areas, labels = ([] for i in range(3))
|
||||||
freq = techdict[tech].targfreq
|
freq = techdict[tech].targfreq
|
||||||
for oneSynth in allSynths:
|
for oneSynth in allSynths:
|
||||||
if (tech == oneSynth.tech) & (freq == oneSynth.freq) & (oneSynth.special == special):
|
if (tech == oneSynth.tech) & (freq == oneSynth.freq) & (oneSynth.mod == mod):
|
||||||
delays += [oneSynth.delay]
|
delays += [oneSynth.delay]
|
||||||
areas += [oneSynth.area]
|
areas += [oneSynth.area]
|
||||||
labels += [oneSynth.width + oneSynth.config]
|
labels += [oneSynth.width + oneSynth.config]
|
||||||
|
|
||||||
fig, (ax) = plt.subplots(1, 1)
|
fig, (ax) = plt.subplots(1, 1)
|
||||||
|
|
||||||
fig = areaDelay(tech, delays, areas, labels, fig, ax)
|
fig = areaDelay(tech, delays, areas, labels, fig, ax)
|
||||||
|
|
||||||
titleStr = tech+'_'+special
|
titleStr = tech+'_'+mod
|
||||||
plt.title(titleStr)
|
plt.title(titleStr)
|
||||||
plt.savefig('./plots/wally/configs_' + titleStr + '.png')
|
plt.savefig(final_directory + '/configs_' + titleStr + '.png')
|
||||||
|
|
||||||
|
|
||||||
def normAreaDelay(special=''):
|
def normAreaDelay(mod=''):
|
||||||
fig, (ax) = plt.subplots(1, 1)
|
fig, (ax) = plt.subplots(1, 1)
|
||||||
fullLeg = []
|
fullLeg = []
|
||||||
for tech in list(techdict.keys()):
|
for tech in list(techdict.keys()):
|
||||||
@ -205,7 +200,7 @@ def normAreaDelay(special=''):
|
|||||||
spec = techdict[tech]
|
spec = techdict[tech]
|
||||||
freq = spec.targfreq
|
freq = spec.targfreq
|
||||||
for oneSynth in allSynths:
|
for oneSynth in allSynths:
|
||||||
if (tech == oneSynth.tech) & (freq == oneSynth.freq) & (oneSynth.special == special):
|
if (tech == oneSynth.tech) & (freq == oneSynth.freq) & (oneSynth.mod == mod):
|
||||||
delays += [oneSynth.delay]
|
delays += [oneSynth.delay]
|
||||||
areas += [oneSynth.area]
|
areas += [oneSynth.area]
|
||||||
labels += [oneSynth.width + oneSynth.config]
|
labels += [oneSynth.width + oneSynth.config]
|
||||||
@ -216,7 +211,7 @@ def normAreaDelay(special=''):
|
|||||||
ax.set_xlabel('Cycle Time (FO4)')
|
ax.set_xlabel('Cycle Time (FO4)')
|
||||||
ax.set_ylabel('Area (add32)')
|
ax.set_ylabel('Area (add32)')
|
||||||
ax.legend(handles = fullLeg, loc='upper left')
|
ax.legend(handles = fullLeg, loc='upper left')
|
||||||
plt.savefig('./plots/wally/normAreaDelay.png')
|
plt.savefig(final_directory + '/normAreaDelay.png')
|
||||||
|
|
||||||
|
|
||||||
def addFO4axis(fig, ax, tech):
|
def addFO4axis(fig, ax, tech):
|
||||||
@ -254,12 +249,17 @@ if __name__ == '__main__':
|
|||||||
techdict['sky90'] = TechSpec('green', 'o', args.skyfreq, 43.2e-3, 1440.600027, 714.057, 0.658023)
|
techdict['sky90'] = TechSpec('green', 'o', args.skyfreq, 43.2e-3, 1440.600027, 714.057, 0.658023)
|
||||||
techdict['tsmc28'] = TechSpec('blue', 's', args.tsmcfreq, 12.2e-3, 209.286002, 1060.0, .081533)
|
techdict['tsmc28'] = TechSpec('blue', 's', args.tsmcfreq, 12.2e-3, 209.286002, 1060.0, .081533)
|
||||||
|
|
||||||
|
current_directory = os.getcwd()
|
||||||
|
final_directory = os.path.join(current_directory, 'wallyplots')
|
||||||
|
if not os.path.exists(final_directory):
|
||||||
|
os.makedirs(final_directory)
|
||||||
|
|
||||||
synthsintocsv()
|
synthsintocsv()
|
||||||
synthsfromcsv('Summary.csv')
|
synthsfromcsv('Summary.csv')
|
||||||
freqPlot('tsmc28', 'rv32', 'e')
|
freqPlot('tsmc28', 'rv32', 'e')
|
||||||
freqPlot('sky90', 'rv32', 'e')
|
freqPlot('sky90', 'rv32', 'e')
|
||||||
plotFeatures('sky90', 'rv64', 'gc')
|
plotFeatures('sky90', 'rv64', 'gc')
|
||||||
plotFeatures('tsmc28', 'rv64', 'gc')
|
plotFeatures('tsmc28', 'rv64', 'gc')
|
||||||
plotConfigs('sky90', special='orig')
|
plotConfigs('sky90', mod='orig')
|
||||||
plotConfigs('tsmc28', special='orig')
|
plotConfigs('tsmc28', mod='orig')
|
||||||
normAreaDelay(special='orig')
|
normAreaDelay(mod='orig')
|
||||||
|
@ -5,20 +5,14 @@ import subprocess
|
|||||||
from multiprocessing import Pool
|
from multiprocessing import Pool
|
||||||
import argparse
|
import argparse
|
||||||
|
|
||||||
def runSynth(config, tech, freq, maxopt):
|
def runSynth(config, mod, tech, freq, maxopt):
|
||||||
global pool
|
global pool
|
||||||
command = "make synth DESIGN=wallypipelinedcore CONFIG={} TECH={} DRIVE=FLOP FREQ={} MAXOPT={} MAXCORES=1".format(config, tech, freq, maxopt)
|
command = "make synth DESIGN=wallypipelinedcore CONFIG={} MOD={} TECH={} DRIVE=FLOP FREQ={} MAXOPT={} MAXCORES=1".format(config, mod, tech, freq, maxopt)
|
||||||
pool.map(mask, [command])
|
pool.map(mask, [command])
|
||||||
|
|
||||||
def mask(command):
|
def mask(command):
|
||||||
subprocess.Popen(command, shell=True)
|
subprocess.Popen(command, shell=True)
|
||||||
|
|
||||||
def freshStart():
|
|
||||||
out = subprocess.check_output(['bash','-c', 'make fresh'])
|
|
||||||
for x in out.decode("utf-8").split('\n')[:-1]:
|
|
||||||
print(x)
|
|
||||||
return
|
|
||||||
|
|
||||||
|
|
||||||
if __name__ == '__main__':
|
if __name__ == '__main__':
|
||||||
|
|
||||||
@ -41,24 +35,21 @@ if __name__ == '__main__':
|
|||||||
|
|
||||||
args = parser.parse_args()
|
args = parser.parse_args()
|
||||||
|
|
||||||
freq = args.targetfreq if args.targetfreq else 3000
|
|
||||||
tech = args.tech if args.tech else 'sky90'
|
tech = args.tech if args.tech else 'sky90'
|
||||||
|
defaultfreq = 3000 if tech == 'sky90' else 10000
|
||||||
|
freq = args.targetfreq if args.targetfreq else defaultfreq
|
||||||
maxopt = int(args.maxopt)
|
maxopt = int(args.maxopt)
|
||||||
|
mod = 'orig' # until memory integrated
|
||||||
|
|
||||||
if args.freqsweep:
|
if args.freqsweep:
|
||||||
sc = args.freqsweep
|
sc = args.freqsweep
|
||||||
config = args.version if args.version else 'rv32e'
|
config = args.version if args.version else 'rv32e'
|
||||||
freshStart()
|
|
||||||
for freq in [round(sc+sc*x/100) for x in freqVaryPct]: # rv32e freq sweep
|
for freq in [round(sc+sc*x/100) for x in freqVaryPct]: # rv32e freq sweep
|
||||||
runSynth(config, tech, freq, maxopt)
|
runSynth(config, mod, tech, freq, maxopt)
|
||||||
if args.configsweep:
|
if args.configsweep:
|
||||||
freshStart()
|
for config in ['rv32i', 'rv64gc', 'rv64i', 'rv32gc', 'rv32ic', 'rv32e']: #configs
|
||||||
for config in ['rv32gc', 'rv32ic', 'rv64gc', 'rv64ic', 'rv32e']: # configs
|
runSynth(config, mod, tech, freq, maxopt)
|
||||||
config = config + '_orig' # until memory integrated
|
|
||||||
runSynth(config, tech, freq, maxopt)
|
|
||||||
if args.featuresweep:
|
if args.featuresweep:
|
||||||
freshStart()
|
config = args.version if args.version else 'rv64gc'
|
||||||
v = args.version if args.version else 'rv64gc'
|
for mod in ['FPUoff', 'noMulDiv', 'noPriv', 'PMP0', 'PMP16']: # rv64gc path variations 'orig',
|
||||||
for mod in ['FPUoff', 'noMulDiv', 'noPriv', 'PMP0', 'PMP16']: # rv64gc path variations
|
runSynth(config, mod, tech, freq, maxopt)
|
||||||
config = v + '_' + mod
|
|
||||||
runSynth(config, tech, freq, maxopt)
|
|
||||||
|
Loading…
Reference in New Issue
Block a user