mirror of
https://github.com/openhwgroup/cvw
synced 2025-02-11 06:05:49 +00:00
221 lines
11 KiB
Systemverilog
221 lines
11 KiB
Systemverilog
///////////////////////////////////////////
|
|
// cache (data cache)
|
|
//
|
|
// Written: ross1728@gmail.com July 07, 2021
|
|
// Implements the L1 data cache
|
|
//
|
|
// Purpose: Storage for data and meta data.
|
|
//
|
|
// A component of the Wally configurable RISC-V project.
|
|
//
|
|
// Copyright (C) 2021 Harvey Mudd College & Oklahoma State University
|
|
//
|
|
// MIT LICENSE
|
|
// Permission is hereby granted, free of charge, to any person obtaining a copy of this
|
|
// software and associated documentation files (the "Software"), to deal in the Software
|
|
// without restriction, including without limitation the rights to use, copy, modify, merge,
|
|
// publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons
|
|
// to whom the Software is furnished to do so, subject to the following conditions:
|
|
//
|
|
// The above copyright notice and this permission notice shall be included in all copies or
|
|
// substantial portions of the Software.
|
|
//
|
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED,
|
|
// INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR
|
|
// PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
|
|
// BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
|
|
// TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE
|
|
// OR OTHER DEALINGS IN THE SOFTWARE.
|
|
////////////////////////////////////////////////////////////////////////////////////////////////
|
|
|
|
`include "wally-config.vh"
|
|
|
|
module cache #(parameter LINELEN, NUMLINES, NUMWAYS, LOGBWPL, WORDLEN, MUXINTERVAL, DCACHE) (
|
|
input logic clk,
|
|
input logic reset,
|
|
// cpu side
|
|
input logic FlushStage,
|
|
input logic CPUBusy,
|
|
input logic [1:0] CacheRW,
|
|
input logic [1:0] CacheAtomic,
|
|
input logic FlushCache,
|
|
input logic InvalidateCache,
|
|
input logic [11:0] NextAdr, // virtual address, but we only use the lower 12 bits.
|
|
input logic [`PA_BITS-1:0] PAdr, // physical address
|
|
input logic [(WORDLEN-1)/8:0] ByteMask,
|
|
input logic [WORDLEN-1:0] CacheWriteData,
|
|
output logic CacheCommitted,
|
|
output logic CacheStall,
|
|
// to performance counters to cpu
|
|
output logic CacheMiss,
|
|
output logic CacheAccess,
|
|
// lsu control
|
|
input logic SelHPTW,
|
|
// Bus fsm interface
|
|
output logic [1:0] CacheBusRW,
|
|
input logic CacheBusAck,
|
|
input logic SelBusBeat,
|
|
input logic [LOGBWPL-1:0] BeatCount,
|
|
input logic [LINELEN-1:0] FetchBuffer,
|
|
output logic [`PA_BITS-1:0] CacheBusAdr,
|
|
output logic [WORDLEN-1:0] ReadDataWord);
|
|
|
|
// Cache parameters
|
|
localparam LINEBYTELEN = LINELEN/8;
|
|
localparam OFFSETLEN = $clog2(LINEBYTELEN);
|
|
localparam SETLEN = $clog2(NUMLINES);
|
|
localparam SETTOP = SETLEN+OFFSETLEN;
|
|
localparam TAGLEN = `PA_BITS - SETTOP;
|
|
localparam WORDSPERLINE = LINELEN/WORDLEN;
|
|
localparam FlushAdrThreshold = NUMLINES - 1;
|
|
|
|
logic SelAdr;
|
|
logic [SETLEN-1:0] CAdr;
|
|
logic [LINELEN-1:0] LineWriteData;
|
|
logic ClearValid;
|
|
logic ClearDirty;
|
|
logic [LINELEN-1:0] ReadDataLineWay [NUMWAYS-1:0];
|
|
logic [NUMWAYS-1:0] HitWay, ValidWay;
|
|
logic CacheHit;
|
|
logic SetDirty;
|
|
logic SetValid;
|
|
logic [NUMWAYS-1:0] VictimWay;
|
|
logic [NUMWAYS-1:0] VictimDirtyWay;
|
|
logic VictimDirty;
|
|
logic [TAGLEN-1:0] VictimTagWay [NUMWAYS-1:0];
|
|
logic [TAGLEN-1:0] VictimTag;
|
|
logic [SETLEN-1:0] FlushAdr;
|
|
logic [SETLEN-1:0] FlushAdrP1;
|
|
logic FlushAdrCntEn;
|
|
logic FlushAdrCntRst;
|
|
logic FlushAdrFlag;
|
|
logic FlushWayFlag;
|
|
logic [NUMWAYS-1:0] FlushWay;
|
|
logic [NUMWAYS-1:0] NextFlushWay;
|
|
logic FlushWayCntEn;
|
|
logic FlushWayCntRst;
|
|
logic SelEvict;
|
|
logic LRUWriteEn;
|
|
logic SelFlush;
|
|
logic ResetOrFlushAdr, ResetOrFlushWay;
|
|
logic [NUMWAYS-1:0] SelectedWay;
|
|
logic [NUMWAYS-1:0] SetValidWay, ClearValidWay, SetDirtyWay, ClearDirtyWay;
|
|
logic [LINELEN-1:0] ReadDataLine, ReadDataLineCache;
|
|
logic [$clog2(LINELEN/8) - $clog2(MUXINTERVAL/8) - 1:0] WordOffsetAddr;
|
|
logic SelBusBuffer;
|
|
logic ce;
|
|
|
|
localparam LOGLLENBYTES = $clog2(WORDLEN/8);
|
|
localparam CACHEWORDSPERLINE = `DCACHE_LINELENINBITS/WORDLEN;
|
|
localparam LOGCWPL = $clog2(CACHEWORDSPERLINE);
|
|
logic [CACHEWORDSPERLINE-1:0] MemPAdrDecoded;
|
|
logic [LINELEN/8-1:0] LineByteMask, DemuxedByteMask, FetchBufferByteSel;
|
|
genvar index;
|
|
|
|
/////////////////////////////////////////////////////////////////////////////////////////////
|
|
// Read Path
|
|
/////////////////////////////////////////////////////////////////////////////////////////////
|
|
|
|
// Choose read address (CAdr). Normally use NextAdr, but use PAdr during stalls
|
|
// and FlushAdr when handling D$ flushes
|
|
// The icache must update to the newest PCNextF on flush as it is probably a trap. Trap
|
|
// sets PCNextF to XTVEC and the icache must start reading the instruction.
|
|
mux3 #(SETLEN) AdrSelMux(
|
|
.d0(NextAdr[SETTOP-1:OFFSETLEN]), .d1(PAdr[SETTOP-1:OFFSETLEN]), .d2(FlushAdr),
|
|
.s({SelFlush, ((SelAdr | SelHPTW) & ~((DCACHE == 0) & FlushStage))}), .y(CAdr));
|
|
|
|
// Array of cache ways, along with victim, hit, dirty, and read merging logic
|
|
cacheway #(NUMLINES, LINELEN, TAGLEN, OFFSETLEN, SETLEN, DCACHE)
|
|
CacheWays[NUMWAYS-1:0](.clk, .reset, .ce, .CAdr, .PAdr, .LineWriteData, .LineByteMask,
|
|
.SetValid, .ClearValid, .SetDirty, .ClearDirty, .SelEvict, .VictimWay,
|
|
.FlushWay, .SelFlush, .ReadDataLineWay, .HitWay, .ValidWay, .VictimDirtyWay, .VictimTagWay, .FlushStage, .InvalidateCache);
|
|
if(NUMWAYS > 1) begin:vict
|
|
cacheLRU #(NUMWAYS, SETLEN, OFFSETLEN, NUMLINES) cacheLRU(
|
|
.clk, .reset, .ce, .FlushStage, .HitWay, .ValidWay, .VictimWay, .CAdr, .LRUWriteEn(LRUWriteEn & ~FlushStage),
|
|
.SetValid, .PAdr(PAdr[SETTOP-1:OFFSETLEN]), .InvalidateCache, .FlushCache);
|
|
end else assign VictimWay = 1'b1; // one hot.
|
|
assign CacheHit = | HitWay;
|
|
assign VictimDirty = | VictimDirtyWay;
|
|
// ReadDataLineWay is a 2d array of cache line len by number of ways.
|
|
// Need to OR together each way in a bitwise manner.
|
|
// Final part of the AO Mux. First is the AND in the cacheway.
|
|
or_rows #(NUMWAYS, LINELEN) ReadDataAOMux(.a(ReadDataLineWay), .y(ReadDataLineCache));
|
|
or_rows #(NUMWAYS, TAGLEN) VictimTagAOMux(.a(VictimTagWay), .y(VictimTag));
|
|
|
|
// like to fix this.
|
|
if(DCACHE)
|
|
mux2 #(LOGBWPL) WordAdrrMux(.d0(PAdr[$clog2(LINELEN/8) - 1 : $clog2(MUXINTERVAL/8)]),
|
|
.d1(BeatCount), .s(SelBusBeat),
|
|
.y(WordOffsetAddr));
|
|
else assign WordOffsetAddr = PAdr[$clog2(LINELEN/8) - 1 : $clog2(MUXINTERVAL/8)];
|
|
|
|
mux2 #(LINELEN) EarlyReturnMux(ReadDataLineCache, FetchBuffer, SelBusBuffer, ReadDataLine);
|
|
|
|
subcachelineread #(LINELEN, WORDLEN, MUXINTERVAL) subcachelineread(
|
|
.PAdr(WordOffsetAddr),
|
|
.ReadDataLine, .ReadDataWord);
|
|
|
|
/////////////////////////////////////////////////////////////////////////////////////////////
|
|
// Write Path: Write data and address. Muxes between writes from bus and writes from CPU.
|
|
/////////////////////////////////////////////////////////////////////////////////////////////
|
|
onehotdecoder #(LOGCWPL) adrdec(
|
|
.bin(PAdr[LOGCWPL+LOGLLENBYTES-1:LOGLLENBYTES]), .decoded(MemPAdrDecoded));
|
|
for(index = 0; index < 2**LOGCWPL; index++) begin
|
|
assign DemuxedByteMask[(index+1)*(WORDLEN/8)-1:index*(WORDLEN/8)] = MemPAdrDecoded[index] ? ByteMask : '0;
|
|
end
|
|
|
|
assign FetchBufferByteSel = SetValid & ~SetDirty ? '1 : ~DemuxedByteMask; // If load miss set all muxes to 1.
|
|
assign LineByteMask = ~SetValid & ~SetDirty ? '0 : ~SetValid & SetDirty ? DemuxedByteMask : '1; // if store hit only enable the word and subword bytes, else write all bytes.
|
|
|
|
for(index = 0; index < LINELEN/8; index++) begin
|
|
mux2 #(8) WriteDataMux(.d0(CacheWriteData[(8*index)%WORDLEN+7:(8*index)%WORDLEN]),
|
|
.d1(FetchBuffer[8*index+7:8*index]), .s(FetchBufferByteSel[index]), .y(LineWriteData[8*index+7:8*index]));
|
|
end
|
|
|
|
mux3 #(`PA_BITS) CacheBusAdrMux(.d0({PAdr[`PA_BITS-1:OFFSETLEN], {OFFSETLEN{1'b0}}}),
|
|
.d1({VictimTag, PAdr[SETTOP-1:OFFSETLEN], {OFFSETLEN{1'b0}}}),
|
|
.d2({VictimTag, FlushAdr, {OFFSETLEN{1'b0}}}),
|
|
.s({SelFlush, SelEvict}), .y(CacheBusAdr));
|
|
|
|
/////////////////////////////////////////////////////////////////////////////////////////////
|
|
// Flush address and way generation during flush
|
|
/////////////////////////////////////////////////////////////////////////////////////////////
|
|
assign ResetOrFlushAdr = reset | FlushAdrCntRst;
|
|
flopenr #(SETLEN) FlushAdrReg(.clk, .reset(ResetOrFlushAdr), .en(FlushAdrCntEn),
|
|
.d(FlushAdrP1), .q(FlushAdr));
|
|
assign FlushAdrP1 = FlushAdr + 1'b1;
|
|
assign FlushAdrFlag = (FlushAdr == FlushAdrThreshold[SETLEN-1:0]);
|
|
assign ResetOrFlushWay = reset | FlushWayCntRst;
|
|
flopenl #(NUMWAYS) FlushWayReg(.clk, .load(ResetOrFlushWay), .en(FlushWayCntEn),
|
|
.val({{NUMWAYS-1{1'b0}}, 1'b1}), .d(NextFlushWay), .q(FlushWay));
|
|
assign FlushWayFlag = FlushWay[NUMWAYS-1];
|
|
if(NUMWAYS > 1) assign NextFlushWay = {FlushWay[NUMWAYS-2:0], FlushWay[NUMWAYS-1]};
|
|
else assign NextFlushWay = FlushWay[NUMWAYS-1];
|
|
|
|
/////////////////////////////////////////////////////////////////////////////////////////////
|
|
// Write Path: Write Enables
|
|
/////////////////////////////////////////////////////////////////////////////////////////////
|
|
/* -----\/----- EXCLUDED -----\/-----
|
|
mux3 #(NUMWAYS) selectwaymux(HitWay, VictimWay, FlushWay, {SelFlush, SetValid}, SelectedWay);
|
|
assign SetValidWay = SetValid ? SelectedWay : '0;
|
|
assign ClearValidWay = ClearValid ? SelectedWay : '0;
|
|
assign SetDirtyWay = SetDirty ? SelectedWay : '0;
|
|
assign ClearDirtyWay = ClearDirty ? SelectedWay : '0;
|
|
-----/\----- EXCLUDED -----/\----- */
|
|
|
|
/////////////////////////////////////////////////////////////////////////////////////////////
|
|
// Cache FSM
|
|
/////////////////////////////////////////////////////////////////////////////////////////////
|
|
cachefsm cachefsm(.clk, .reset, .CacheBusRW, .CacheBusAck,
|
|
.FlushStage, .CacheRW, .CacheAtomic, .CPUBusy,
|
|
.CacheHit, .VictimDirty, .CacheStall, .CacheCommitted,
|
|
.CacheMiss, .CacheAccess, .SelAdr,
|
|
.ClearValid, .ClearDirty, .SetDirty,
|
|
.SetValid, .SelEvict, .SelFlush,
|
|
.FlushAdrCntEn, .FlushWayCntEn, .FlushAdrCntRst,
|
|
.FlushWayCntRst, .FlushAdrFlag, .FlushWayFlag, .FlushCache, .SelBusBuffer,
|
|
.InvalidateCache,
|
|
.ce,
|
|
.LRUWriteEn);
|
|
endmodule
|