Mercurial > pygar
view modules/bluespec/Pygar/core/Processor.bsv @ 38:05598d745f99 pygar svn.39
[svn r39] fixed audiocorepipe
author | punk |
---|---|
date | Tue, 04 May 2010 19:27:38 -0400 |
parents | 0475235d1513 |
children | ced2ebd41347 |
line wrap: on
line source
/// The MIT License

// Copyright (c) 2009 Massachusetts Institute of Technology

// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:

// The above copyright notice and this permission notice shall be included in
// all copies or substantial portions of the Software.

// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
// THE SOFTWARE.

import Connectable::*;
import GetPut::*;
import ClientServer::*;
import RegFile::*;

import FIFO::*;
import FIFOF::*;
import SFIFO::*;
import RWire::*;

import Trace::*;
import BFIFO::*;
import MemTypes::*;
import ProcTypes::*;
import BRegFile::*;
import BranchPred::*;
//import PathTypes::*;  This is only there to force the debugging

//AWB includes
`include "asim/provides/low_level_platform_interface.bsh"
`include "asim/provides/soft_connections.bsh"
`include "asim/provides/common_services.bsh"

// Local includes
//`include "asim/provides/processor_library.bsh" (included above directly)

`include "asim/provides/common_services.bsh"
`include "asim/dict/STATS_PROCESSOR.bsh"
`include "asim/provides/processor_library.bsh"

// Local includes. Look for the correspondingly named .awb files
// workspace/labs/src/mit-6.375/modules/bluespec/mit-6.375/common/
// to find the actual Bluespec files which are used to generate
// these includes.  These files are specific to this audio processing
// pipeline

`include "asim/provides/audio_pipe_types.bsh"

//interface CPUToHost;
//  method Bit#(32) cpuToHost(int req);
//endinterface

// Top-level interface of the processor core: two memory clients, a
// statistics-enable output, and a pair of audio sample ports.
interface Proc;

  // Interface from processor to caches
  interface Client#(DataReq,DataResp) dmem_client;
  interface Client#(InstReq,InstResp) imem_client;

  // Interface for enabling/disabling statistics on the rest of the core
  interface Get#(Bool) statsEn_get;

  //  // Interface to host
  //  interface CPUToHost tohost;

  // Interface to Audio Pipeline
  interface Get#(AudioProcessorUnit) sampleOutput;
  interface Put#(AudioProcessorUnit) sampleInput;

endinterface

// Pipeline stage tag.  In this file it is only stored in the `stage`
// register of mkProc; every use of it as a rule condition is commented out.
typedef enum { PCgen, Exec, Writeback } Stage deriving(Eq,Bits);

//-----------------------------------------------------------
// Register file module
//-----------------------------------------------------------

// Register file with one write port and two read ports.
interface BRFile;
  method Action   wr( Rindx rindx, Bit#(32) data );
  method Bit#(32) rd1( Rindx rindx );
  method Bit#(32) rd2( Rindx rindx );
endinterface

// BRFile implementation on top of mkBRegFile.  Reads of index 0 always
// return 0; writes are forwarded to the underlying register file for every
// index, including 0.
module mkBRFile( BRFile );

  RegFile#(Rindx,Bit#(32)) rfile <- mkBRegFile();

  method Action wr( Rindx rindx, Bit#(32) data );
    rfile.upd( rindx, data );
  endmethod

  method Bit#(32) rd1( Rindx rindx );
    return ( rindx == 0 ) ? 0 : rfile.sub(rindx);
  endmethod

  method Bit#(32) rd2( Rindx rindx );
    return ( rindx == 0 ) ? 0 : rfile.sub(rindx);
  endmethod

endmodule

//-----------------------------------------------------------
// Helper functions
//-----------------------------------------------------------

// Signed set-less-than: 1 when val1 < val2 as signed values, otherwise 0.
function Bit#(32) slt( Bit#(32) val1, Bit#(32) val2 );
  return zeroExtend( pack( signedLT(val1,val2) ) );
endfunction

// Unsigned set-less-than: 1 when val1 < val2, otherwise 0.
function Bit#(32) sltu( Bit#(32) val1, Bit#(32) val2 );
  return zeroExtend( pack( val1 < val2 ) );
endfunction

// Shift amount taken from a register value: only the low five bits are kept.
function Bit#(32) rshft( Bit#(32) val );
  return zeroExtend(val[4:0]);
endfunction


//-----------------------------------------------------------
// Find funct for wbQ
//-----------------------------------------------------------

// Search predicate handed to mkSFIFO: True when the queued writeback entry
// `cmpVal` names register `fVal` as its destination.  Store and host entries
// never match.
function Bool findwbf(Rindx fVal, WBResult cmpVal);
  case (cmpVal) matches
    tagged WB_ALU {data:.res, dest:.rd} :
      return (fVal == rd);
    tagged WB_Load .rd  :
      return (fVal == rd);
    tagged WB_Store .st :
      return False;
    tagged WB_Host .x   :
      return False;
  endcase
endfunction


//-----------------------------------------------------------
// Stall funct for wbQ
//-----------------------------------------------------------

// Returns True when `inst` must wait because one of the registers it uses is
// found in the writeback queue `f`.  For LUI the register checked is the
// destination.  Instructions with no register operands, and anything not
// listed, never stall.
// NOTE(review): find and find2 are defined in SFIFO, outside this file;
// presumably they are two equivalent search ports -- confirm.
function Bool stall(Instr inst, SFIFO#(WBResult, Rindx) f);
  case (inst) matches
    // -- Memory Ops ------------------------------------------------
    tagged LW .it :
      return f.find(it.rbase);
    tagged SW {rsrc:.dreg, rbase:.addr, offset:.o} :
      return (f.find(addr) || f.find2(dreg));

    // -- Simple Ops ------------------------------------------------
    tagged ADDIU .it : return f.find(it.rsrc);
    tagged SLTI  .it : return f.find(it.rsrc);
    tagged SLTIU .it : return f.find(it.rsrc);
    tagged ANDI  .it : return f.find(it.rsrc);
    tagged ORI   .it : return f.find(it.rsrc);
    tagged XORI  .it : return f.find(it.rsrc);

    tagged LUI   .it : return f.find(it.rdst);  //this rds/wrs itself
    tagged SLL   .it : return f.find(it.rsrc);
    tagged SRL   .it : return f.find(it.rsrc);
    tagged SRA   .it : return f.find(it.rsrc);
    tagged SLLV  .it : return (f.find(it.rsrc) || f.find(it.rshamt));
    tagged SRLV  .it : return (f.find(it.rsrc) || f.find(it.rshamt));
    tagged SRAV  .it : return (f.find(it.rsrc) || f.find(it.rshamt));
    tagged ADDU  .it : return (f.find(it.rsrc1) || f.find2(it.rsrc2));
    tagged SUBU  .it : return (f.find(it.rsrc1) || f.find2(it.rsrc2));
    tagged AND   .it : return (f.find(it.rsrc1) || f.find2(it.rsrc2));
    tagged OR    .it : return (f.find(it.rsrc1) || f.find2(it.rsrc2));
    tagged XOR   .it : return (f.find(it.rsrc1) || f.find2(it.rsrc2));
    tagged NOR   .it : return (f.find(it.rsrc1) || f.find2(it.rsrc2));
    tagged SLT   .it : return (f.find(it.rsrc1) || f.find2(it.rsrc2));
    tagged SLTU  .it : return (f.find(it.rsrc1) || f.find2(it.rsrc2));


    // -- Branches --------------------------------------------------

    tagged BLEZ  .it : return (f.find(it.rsrc));
    tagged BGTZ  .it : return (f.find(it.rsrc));
    tagged BLTZ  .it : return (f.find(it.rsrc));
    tagged BGEZ  .it : return (f.find(it.rsrc));
    tagged BEQ   .it : return (f.find(it.rsrc1) || f.find2(it.rsrc2));
    tagged BNE   .it : return (f.find(it.rsrc1) || f.find2(it.rsrc2));

    // -- Jumps -----------------------------------------------------

    tagged J     .it : return False;
    tagged JR    .it : return f.find(it.rsrc);
    tagged JALR  .it : return f.find(it.rsrc);
    tagged JAL   .it : return False;

    // -- Cop0 ------------------------------------------------------

    tagged MTC0  .it : return f.find(it.rsrc);
    tagged MFC0  .it : return False;

    // -- Illegal ---------------------------------------------------

    default : return False;

  endcase
endfunction

//-----------------------------------------------------------
// Reference processor
//-----------------------------------------------------------


//(* doc = "synthesis attribute ram_style mkProc distributed;" *)
//(* synthesize *)

// Processor core.  Rules in this module:
//   pcgen          - issues an instruction fetch for `pc` and records the
//                    predicted next PC in pcQ
//   discard        - drops instruction responses whose tag is not the
//                    current epoch
//   exec           - decodes and executes one instruction, queues its
//                    writeback, and redirects fetch on a misprediction
//   writeback      - retires the head of wbQ into the register file
//   inc_num_cycles - counts cycles while statistics are enabled
//   flagAudioEnd   - turns an EndOfFile input token into cp0_audioEOF
//   sendAudioEnd   - emits EndOfFile on the output once the program has
//                    set cp0_progComp
module [CONNECTED_MODULE] mkProc( Proc );

  //-----------------------------------------------------------
  // State

  // Standard processor state

  Reg#(Addr)  pc    <- mkReg(32'h00001000);
  Reg#(Epoch) epoch <- mkReg(0);
  Reg#(Stage) stage <- mkReg(PCgen);  // only referenced by commented-out code
  BRFile      rf    <- mkBRFile;

  // Branch Prediction
  BranchPred    bp     <- mkBranchPred();
  FIFO#(PCStat) execpc <- mkLFIFO();

  // Pipelines
  FIFO#(PCStat)           pcQ <- mkSizedFIFO(3);
  SFIFO#(WBResult, Rindx) wbQ <- mkSFIFO(findwbf);

  // NEED TO ADD CAPABILITY FOR RESET (should be able to just say if I get
  // valid in and these are flagged, clear them.
  Reg#(Bit#(32)) cp0_tohost   <- mkReg(0);
  Reg#(Bit#(32)) cp0_fromhost <- mkReg(0);
  Reg#(Bool)     cp0_statsEn  <- mkReg(False);
  Reg#(Bool)     cp0_audioEOF <- mkReg(False); // Register to let code know that EOF is reached
  Reg#(Bool)     cp0_progComp <- mkReg(False); // Register to let processor know that the program is complete (as this terminates)

  // Memory request/response state

  FIFO#(InstReq)  instReqQ  <- mkBFIFO1();
  FIFO#(InstResp) instRespQ <- mkFIFO();

  FIFO#(DataReq)  dataReqQ  <- mkBFIFO1();
  FIFO#(DataResp) dataRespQ <- mkFIFO();

  // Audio I/O
  FIFO#(AudioProcessorUnit) inAudioFifo  <- mkFIFO;
  FIFO#(AudioProcessorUnit) outAudioFifo <- mkFIFO;


  // Statistics state (2010)
  //  Reg#(Stat) num_cycles <- mkReg(0);
  //  Reg#(Stat) num_inst <- mkReg(0);

  //Or:
  // Statistics state
  STAT num_cycles <- mkStatCounter(`STATS_PROCESSOR_CYCLE_COUNT);
  STAT num_inst   <- mkStatCounter(`STATS_PROCESSOR_INST_COUNT);

  //-----------------------------------------------------------
  // Rules

  // Fetch: request the instruction at `pc`, then advance `pc` to the
  // predictor's target when it supplies one, otherwise to pc + 4.  The
  // chosen next PC is queued in pcQ so exec can verify it.
  (* descending_urgency = "exec, pcgen" *)
  rule pcgen; //( stage == PCgen );
    let pc_plus4 = pc + 4;

    traceTiny("mkProc", "pc",pc);
    traceTiny("mkProc", "pcgen","P");
    instReqQ.enq( LoadReq{ addr:pc, tag:epoch} );

    let next_pc = bp.get(pc);
    if (next_pc matches tagged Valid .npc)
      begin
        pcQ.enq(PCStat {qpc:pc, qnxtpc:npc, qepoch:epoch});
        pc <= npc;
      end
    else
      begin
        pcQ.enq(PCStat {qpc:pc, qnxtpc:pc_plus4, qepoch:epoch});
        pc <= pc_plus4;
      end

  endrule

  // Drop fetched instructions that carry a tag other than the current epoch.
  rule discard (instRespQ.first() matches tagged LoadResp .ld
                &&& ld.tag != epoch);
    traceTiny("mkProc", "stage", "D");
    instRespQ.deq();
  endrule

  // Execute the instruction at the head of instRespQ when it belongs to the
  // current epoch and stall() reports no pending writeback to its registers.
  (* conflict_free = "exec, writeback" *)
  rule exec (instRespQ.first() matches tagged LoadResp .ld
             &&& (ld.tag == epoch)
             &&& unpack(ld.data) matches .inst
             &&& !stall(inst, wbQ));

    // Some abbreviations
    let sext = signExtend;
    let zext = zeroExtend;
    let sra  = signedShiftRight;

    // Get the instruction

    instRespQ.deq();
    Instr inst
    = case ( instRespQ.first() ) matches
        tagged LoadResp  .ld : return unpack(ld.data);
        tagged StoreResp .st : return ?;
      endcase;

    // Get the PC info
    let instrpc  = pcQ.first().qpc;
    let pc_plus4 = instrpc + 4;

    Bool branchTaken = False;
    Addr newPC       = pc_plus4;

    // Tracing
    traceTiny("mkProc", "exec","X");
    traceTiny("mkProc", "exInstTiny",inst);
    traceFull("mkProc", "exInstFull",inst);

    case ( inst ) matches

      // -- Memory Ops ------------------------------------------------

      tagged LW .it :
        begin
          Addr addr = rf.rd1(it.rbase) + sext(it.offset);
          // The destination register travels with the request as its tag;
          // writeback reads it back from the response.
          dataReqQ.enq( LoadReq{ addr:addr, tag:zeroExtend(it.rdst) } );
          wbQ.enq(tagged WB_Load it.rdst);
        end

      tagged SW .it :
        begin
          Addr addr = rf.rd1(it.rbase) + sext(it.offset);
          dataReqQ.enq( StoreReq{ tag:0, addr:addr, data:rf.rd2(it.rsrc) } );
          wbQ.enq(tagged WB_Store);
        end

      // -- Simple Ops ------------------------------------------------

      tagged ADDIU .it :
        begin
          Bit#(32) result = rf.rd1(it.rsrc) + sext(it.imm);
          wbQ.enq(tagged WB_ALU {data:result, dest:it.rdst});
        end
      tagged SLTI  .it : wbQ.enq(tagged WB_ALU {dest:it.rdst, data:slt( rf.rd1(it.rsrc), sext(it.imm) )});
      tagged SLTIU .it : wbQ.enq(tagged WB_ALU {dest:it.rdst, data:sltu( rf.rd1(it.rsrc), sext(it.imm) ) });
      tagged ANDI  .it :
        begin
          Bit#(32) zext_it_imm = zext(it.imm);
          wbQ.enq(tagged WB_ALU {dest:it.rdst, data:(rf.rd1(it.rsrc) & zext_it_imm)} );
        end
      tagged ORI   .it :
        begin
          Bit#(32) zext_it_imm = zext(it.imm);
          wbQ.enq(tagged WB_ALU {dest:it.rdst, data:(rf.rd1(it.rsrc) | zext_it_imm)} );
        end
      tagged XORI  .it :
        begin
          Bit#(32) zext_it_imm = zext(it.imm);
          wbQ.enq(tagged WB_ALU {dest: it.rdst, data:(rf.rd1(it.rsrc) ^ zext_it_imm )});
        end
      tagged LUI   .it :
        begin
          Bit#(32) zext_it_imm = zext(it.imm);
          wbQ.enq(tagged WB_ALU {dest: it.rdst, data:(zext_it_imm << 32'd16) });
        end

      tagged SLL   .it :
        begin
          Bit#(32) zext_it_shamt = zext(it.shamt);
          wbQ.enq(tagged WB_ALU {dest: it.rdst, data:(rf.rd1(it.rsrc) << zext_it_shamt )} );
        end
      tagged SRL   .it :
        begin
          Bit#(32) zext_it_shamt = zext(it.shamt);
          wbQ.enq(tagged WB_ALU {dest: it.rdst, data:(rf.rd1(it.rsrc) >> zext_it_shamt )});
        end
      tagged SRA   .it :
        begin
          Bit#(32) zext_it_shamt = zext(it.shamt);
          wbQ.enq(tagged WB_ALU {dest: it.rdst, data:sra( rf.rd1(it.rsrc), zext_it_shamt )});
        end
      tagged SLLV  .it : wbQ.enq(tagged WB_ALU {dest: it.rdst, data:(rf.rd1(it.rsrc) << rshft(rf.rd2(it.rshamt)) )});
      tagged SRLV  .it : wbQ.enq(tagged WB_ALU {dest: it.rdst, data:(rf.rd1(it.rsrc) >> rshft(rf.rd2(it.rshamt)) )} );
      tagged SRAV  .it : wbQ.enq(tagged WB_ALU {dest: it.rdst, data:sra( rf.rd1(it.rsrc), rshft(rf.rd2(it.rshamt)) ) });
      tagged ADDU  .it : wbQ.enq(tagged WB_ALU {dest: it.rdst, data:(rf.rd1(it.rsrc1) + rf.rd2(it.rsrc2) )} );
      tagged SUBU  .it : wbQ.enq(tagged WB_ALU {dest: it.rdst, data:(rf.rd1(it.rsrc1) - rf.rd2(it.rsrc2) )} );
      tagged AND   .it : wbQ.enq(tagged WB_ALU {dest: it.rdst, data:(rf.rd1(it.rsrc1) & rf.rd2(it.rsrc2) )} );
      tagged OR    .it : wbQ.enq(tagged WB_ALU {dest: it.rdst, data:(rf.rd1(it.rsrc1) | rf.rd2(it.rsrc2) )} );
      tagged XOR   .it : wbQ.enq(tagged WB_ALU {dest: it.rdst, data:(rf.rd1(it.rsrc1) ^ rf.rd2(it.rsrc2) )} );
      tagged NOR   .it : wbQ.enq(tagged WB_ALU {dest: it.rdst, data:(~(rf.rd1(it.rsrc1) | rf.rd2(it.rsrc2)) )} );
      tagged SLT   .it : wbQ.enq(tagged WB_ALU {dest: it.rdst, data:slt( rf.rd1(it.rsrc1), rf.rd2(it.rsrc2) ) });
      tagged SLTU  .it : wbQ.enq(tagged WB_ALU {dest: it.rdst, data:sltu( rf.rd1(it.rsrc1), rf.rd2(it.rsrc2) ) });

      // -- Branches --------------------------------------------------

      tagged BLEZ .it :
        if ( signedLE( rf.rd1(it.rsrc), 0 ) )
          begin
            newPC = pc_plus4 + (sext(it.offset) << 2);
            branchTaken = True;
          end

      tagged BGTZ .it :
        if ( signedGT( rf.rd1(it.rsrc), 0 ) )
          begin
            newPC = pc_plus4 + (sext(it.offset) << 2);
            branchTaken = True;
          end

      tagged BLTZ .it :
        if ( signedLT( rf.rd1(it.rsrc), 0 ) )
          begin
            newPC = pc_plus4 + (sext(it.offset) << 2);
            branchTaken = True;
          end

      tagged BGEZ .it :
        if ( signedGE( rf.rd1(it.rsrc), 0 ) )
          begin
            newPC = pc_plus4 + (sext(it.offset) << 2);
            branchTaken = True;
          end

      tagged BEQ .it :
        if ( rf.rd1(it.rsrc1) == rf.rd2(it.rsrc2) )
          begin
            newPC = pc_plus4 + (sext(it.offset) << 2);
            branchTaken = True;
          end

      tagged BNE .it :
        if ( rf.rd1(it.rsrc1) != rf.rd2(it.rsrc2) )
          begin
            newPC = pc_plus4 + (sext(it.offset) << 2);
            branchTaken = True;
          end

      // -- Jumps -----------------------------------------------------

      tagged J .it :
        begin
          newPC = { pc_plus4[31:28], it.target, 2'b0 };
          branchTaken = True;
        end

      tagged JR .it :
        begin
          newPC = rf.rd1(it.rsrc);
          branchTaken = True;
        end

      tagged JAL .it :
        begin
          wbQ.enq(tagged WB_ALU {dest:31, data:pc_plus4 });
          newPC = { pc_plus4[31:28], it.target, 2'b0 };
          branchTaken = True;
        end

      tagged JALR .it :
        begin
          wbQ.enq(tagged WB_ALU {dest:it.rdst, data:pc_plus4 });
          newPC = rf.rd1(it.rsrc);
          branchTaken = True;
        end

      // -- Cop0 ------------------------------------------------------

      tagged MTC0 .it : // Receive things from host computer
        begin
          $display( " PROCESSOR MTC0 call\n");
          case ( it.cop0dst )
            5'd10 : cp0_statsEn <= unpack(truncate(rf.rd1(it.rsrc)));
            5'd21 : cp0_tohost <= truncate(rf.rd1(it.rsrc));
            5'd26 : cp0_progComp <= unpack(truncate(rf.rd1(it.rsrc))); //states audio program completed and termination okay
            5'd27 : outAudioFifo.enq(tagged Sample unpack(truncate(rf.rd1(it.rsrc)))); //Bit size is 16 not 32
            default :
              $display( " RTL-ERROR : %m : Illegal MTC0 cop0dst register!" );
          endcase
          wbQ.enq(tagged WB_Host 0); //no idea what this actually should be.
        end

      //this is host stuff?
      tagged MFC0 .it : //Things out
        begin
          $display( " PROCESSOR MFC0 call\n");
          case ( it.cop0src )
            // not actually an ALU instruction but don't have the format otherwise
            5'd10 : wbQ.enq(tagged WB_ALU {dest:it.rdst, data:zext(pack(cp0_statsEn)) });
            5'd20 : wbQ.enq(tagged WB_ALU {dest:it.rdst, data:cp0_fromhost });
            5'd21 : wbQ.enq(tagged WB_ALU {dest:it.rdst, data:cp0_tohost });
            5'd25 : begin
                      $display( "**** EOF Requested\n ");
                      wbQ.enq(tagged WB_ALU {dest:it.rdst, data:zext(pack(cp0_audioEOF)) }); // Reading clears bit
                      cp0_audioEOF <= False;
                    end
            5'd28 : begin
                      $display( "***** Reqesting Sample \n");
                      // NOTE(review): first() is only ready when the FIFO is
                      // non-empty; depending on the compiler's condition
                      // handling this may gate the whole exec rule -- confirm.
                      let sample = inAudioFifo.first();
                      if (sample matches tagged Sample .audio)
                        begin
                          wbQ.enq(tagged WB_ALU {dest:it.rdst, data:zext(pack(audio)) }); // do I need pack?
                          // Consume the token only when it really is a sample.
                          inAudioFifo.deq();
                        end
                      else
                        // Leave the EndOfFile token at the head of the FIFO so
                        // that rule flagAudioEnd can consume it and set
                        // cp0_audioEOF.  Dequeuing it here (as was done
                        // before) dropped the end-of-stream marker without
                        // ever raising the flag.
                        $display ( "Audio File EOF Reached. Invalid sample request.");
                    end
            default :
              $display( " RTL-ERROR : %m : Illegal MFC0 cop0src register!" );
          endcase
        end

      // -- Illegal ---------------------------------------------------

      default :
        $display( " RTL-ERROR : %m : Illegal instruction !" );

    endcase

    //evaluate branch prediction
    Addr ppc = pcQ.first().qnxtpc; //predicted branch
    if (ppc != newPC) //prediction wrong
      begin
        // Start a new epoch so that already-fetched instructions are
        // recognised as stale by rule discard.
        epoch <= pcQ.first().qepoch + 1;
        bp.upd(instrpc, newPC); //update branch predictor
        pcQ.clear();
        pc <= newPC;
      end
    else
      pcQ.deq();

    if ( cp0_statsEn )
      num_inst.incr();

  endrule

  // Retire the oldest queued result.  ALU results are written directly;
  // loads and stores also consume their data-memory response.
  rule writeback; // ( stage == Writeback );
    traceTiny("mkProc", "writeback","W");


    // get what to do off the writeback queue
    wbQ.deq();
    case (wbQ.first()) matches
      tagged WB_ALU {data:.res, dest:.rdst} : rf.wr(rdst, res);
      tagged WB_Load .regWr :
        begin
          dataRespQ.deq();
          if (dataRespQ.first() matches tagged LoadResp .ld)
            rf.wr(truncate(ld.tag), ld.data); // no need to use Rindx from queue?  Duplicate?
        end
      tagged WB_Store : dataRespQ.deq();
      tagged WB_Host .dat : noAction;
    endcase

  endrule

  // Count cycles while statistics are enabled.
  rule inc_num_cycles;
    if ( cp0_statsEn )
      num_cycles.incr();
  endrule


  // for now, we don't do anything.
  //   rule connectAudioReqResp;
  //     $display("rlm: PROCESSOR copies a datum\n");
  //     outAudioFifo.enq(inAudioFifo.first());
  //     inAudioFifo.deq;
  //   endrule

  // Consume an EndOfFile token from the audio input and latch it in
  // cp0_audioEOF, which the program reads through MFC0 register 25.
  rule flagAudioEnd (inAudioFifo.first() matches tagged EndOfFile);
    $display (" PROCESSOR End Audio Flag Set ");
    cp0_audioEOF <= True;
    inAudioFifo.deq;
  endrule

  // Once the program sets cp0_progComp (MTC0 register 26), forward a single
  // EndOfFile token to the audio output.
  rule sendAudioEnd (cp0_progComp);
    $display (" PROCESSOR Says Program Complete ");
    outAudioFifo.enq(tagged EndOfFile);
    cp0_progComp <= False; //only send one.  And functions to reset
  endrule


  //-----------------------------------------------------------
  // Methods

  interface Client imem_client;
    interface Get request  = fifoToGet(instReqQ);
    interface Put response = fifoToPut(instRespQ);
  endinterface

  interface Client dmem_client;
    interface Get request  = fifoToGet(dataReqQ);
    interface Put response = fifoToPut(dataRespQ);
  endinterface

  interface Get statsEn_get = toGet(asReg(cp0_statsEn));

  /*
  interface CPUToHost tohost;
    method Bit#(32) cpuToHost(int req);
      return (case (req)
        0: cp0_tohost;
        1: pc;
        2: zeroExtend(pack(stage));
      endcase);
    endmethod
  endinterface
  */

  interface Get sampleOutput = fifoToGet(outAudioFifo);
  interface Put sampleInput  = fifoToPut(inAudioFifo);

endmodule