GPU_RfO-TCC.sm revision 14184:11ac1337c5e2
1/*
2 * Copyright (c) 2010-2015 Advanced Micro Devices, Inc.
3 * All rights reserved.
4 *
5 * For use for simulation and test purposes only
6 *
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions are met:
9 *
10 * 1. Redistributions of source code must retain the above copyright notice,
11 * this list of conditions and the following disclaimer.
12 *
13 * 2. Redistributions in binary form must reproduce the above copyright notice,
14 * this list of conditions and the following disclaimer in the documentation
15 * and/or other materials provided with the distribution.
16 *
17 * 3. Neither the name of the copyright holder nor the names of its
18 * contributors may be used to endorse or promote products derived from this
19 * software without specific prior written permission.
20 *
21 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
22 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
25 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
28 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
29 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
30 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
31 * POSSIBILITY OF SUCH DAMAGE.
32 *
33 * Authors: Lisa Hsu
34 */
35
36machine(MachineType:TCC, "TCC Cache")
37 : CacheMemory * L2cache;
38   WireBuffer * w_reqToTCCDir;
39   WireBuffer * w_respToTCCDir;
40   WireBuffer * w_TCCUnblockToTCCDir;
41   WireBuffer * w_reqToTCC;
42   WireBuffer * w_probeToTCC;
43   WireBuffer * w_respToTCC;
44   int TCC_select_num_bits;
45   Cycles l2_request_latency := 1;
46   Cycles l2_response_latency := 20;
47
48  // To the general response network
49  MessageBuffer * responseFromTCC, network="To", virtual_network="3", vnet_type="response";
50
51  // From the general response network
52  MessageBuffer * responseToTCC, network="From", virtual_network="3", vnet_type="response";
53
54{
55  // EVENTS
56  enumeration(Event, desc="TCC Events") {
57    // Requests coming from the Cores
58    RdBlk,                  desc="CPU RdBlk event";
59    RdBlkM,                 desc="CPU RdBlkM event";
60    RdBlkS,                 desc="CPU RdBlkS event";
61    CtoD,                   desc="Change to Dirty request";
62    WrVicBlk,               desc="L1 Victim (dirty)";
63    WrVicBlkShared,               desc="L1 Victim (dirty)";
64    ClVicBlk,               desc="L1 Victim (clean)";
65    ClVicBlkShared,               desc="L1 Victim (clean)";
66
67    CPUData,                      desc="WB data from CPU";
68    CPUDataShared,                desc="WB data from CPU, NBReqShared 1";
69    StaleWB,                desc="Stale WB, No data";
70
71    L2_Repl,             desc="L2 Replacement";
72
73    // Probes
74    PrbInvData,         desc="Invalidating probe, return dirty data";
75    PrbInv,             desc="Invalidating probe, no need to return data";
76    PrbShrData,         desc="Downgrading probe, return data";
77
78    // Coming from Memory Controller
79    WBAck,                     desc="ack from memory";
80
81    CancelWB,                   desc="Cancel WB from L2";
82  }
83
84  // STATES
85  state_declaration(State, desc="TCC State", default="TCC_State_I") {
86    M, AccessPermission:Read_Write, desc="Modified";  // No other cache has copy, memory stale
87    O, AccessPermission:Read_Only, desc="Owned";     // Correct most recent copy, others may exist in S
88    E, AccessPermission:Read_Write, desc="Exclusive"; // Correct, most recent, and only copy (and == Memory)
89    S, AccessPermission:Read_Only, desc="Shared";    // Correct, most recent. If no one in O, then == Memory
90    I, AccessPermission:Invalid, desc="Invalid";
91
92    I_M, AccessPermission:Busy, desc="Invalid, received WrVicBlk, sent Ack, waiting for Data";
93    I_O, AccessPermission:Busy, desc="Invalid, received WrVicBlk, sent Ack, waiting for Data";
94    I_E, AccessPermission:Busy, desc="Invalid, receive ClVicBlk, sent Ack, waiting for Data";
95    I_S, AccessPermission:Busy, desc="Invalid, receive ClVicBlk, sent Ack, waiting for Data";
96    S_M, AccessPermission:Busy, desc="received WrVicBlk, sent Ack, waiting for Data, then go to M";
97    S_O, AccessPermission:Busy, desc="received WrVicBlkShared, sent Ack, waiting for Data, then go to O";
98    S_E, AccessPermission:Busy, desc="Shared, received ClVicBlk, sent Ack, waiting for Data, then go to E";
99    S_S, AccessPermission:Busy, desc="Shared, received ClVicBlk, sent Ack, waiting for Data, then go to S";
100    E_M, AccessPermission:Busy, desc="received WrVicBlk, sent Ack, waiting for Data, then go to O";
101    E_O, AccessPermission:Busy, desc="received WrVicBlkShared, sent Ack, waiting for Data, then go to O";
102    E_E, AccessPermission:Busy, desc="received WrVicBlk, sent Ack, waiting for Data, then go to O";
103    E_S, AccessPermission:Busy, desc="Shared, received WrVicBlk, sent Ack, waiting for Data";
104    O_M, AccessPermission:Busy, desc="...";
105    O_O, AccessPermission:Busy, desc="...";
106    O_E, AccessPermission:Busy, desc="...";
107    M_M, AccessPermission:Busy, desc="...";
108    M_O, AccessPermission:Busy, desc="...";
109    M_E, AccessPermission:Busy, desc="...";
110    M_S, AccessPermission:Busy, desc="...";
111    D_I, AccessPermission:Invalid,  desc="drop WB data on the floor when receive";
112    MOD_I, AccessPermission:Busy, desc="drop WB data on the floor, waiting for WBAck from Mem";
113    MO_I, AccessPermission:Busy, desc="M or O, received L2_Repl, waiting for WBAck from Mem";
114    ES_I, AccessPermission:Busy, desc="E or S, received L2_Repl, waiting for WBAck from Mem";
115    I_C, AccessPermission:Invalid, desc="sent cancel, just waiting to receive mem wb ack so nothing gets confused";
116  }
117
118  enumeration(RequestType, desc="To communicate stats from transitions to recordStats") {
119    DataArrayRead,    desc="Read the data array";
120    DataArrayWrite,   desc="Write the data array";
121    TagArrayRead,     desc="Read the data array";
122    TagArrayWrite,    desc="Write the data array";
123  }
124
125
126  // STRUCTURES
127
128  structure(Entry, desc="...", interface="AbstractCacheEntry") {
129    State CacheState,           desc="cache state";
130    bool Dirty,                 desc="Is the data dirty (diff from memory?)";
131    DataBlock DataBlk,          desc="Data for the block";
132  }
133
134  structure(TBE, desc="...") {
135    State TBEState,     desc="Transient state";
136    DataBlock DataBlk,  desc="data for the block";
137    bool Dirty,         desc="Is the data dirty?";
138    bool Shared,        desc="Victim hit by shared probe";
139    MachineID From,     desc="Waiting for writeback from...";
140  }
141
142  structure(TBETable, external="yes") {
143    TBE lookup(Addr);
144    void allocate(Addr);
145    void deallocate(Addr);
146    bool isPresent(Addr);
147  }
148
149  TBETable TBEs, template="<TCC_TBE>", constructor="m_number_of_TBEs";
150  int TCC_select_low_bit, default="RubySystem::getBlockSizeBits()";
151
152  void set_cache_entry(AbstractCacheEntry b);
153  void unset_cache_entry();
154  void set_tbe(TBE b);
155  void unset_tbe();
156  void wakeUpAllBuffers();
157  void wakeUpBuffers(Addr a);
158
159
160  // FUNCTION DEFINITIONS
161  Tick clockEdge();
162  Tick cyclesToTicks(Cycles c);
163
164  Entry getCacheEntry(Addr addr), return_by_pointer="yes" {
165    return static_cast(Entry, "pointer", L2cache.lookup(addr));
166  }
167
168  DataBlock getDataBlock(Addr addr), return_by_ref="yes" {
169    return getCacheEntry(addr).DataBlk;
170  }
171
172  bool presentOrAvail(Addr addr) {
173    return L2cache.isTagPresent(addr) || L2cache.cacheAvail(addr);
174  }
175
176  State getState(TBE tbe, Entry cache_entry, Addr addr) {
177    if (is_valid(tbe)) {
178      return tbe.TBEState;
179    } else if (is_valid(cache_entry)) {
180      return cache_entry.CacheState;
181    }
182    return State:I;
183  }
184
185  void setState(TBE tbe, Entry cache_entry, Addr addr, State state) {
186    if (is_valid(tbe)) {
187        tbe.TBEState := state;
188    }
189
190    if (is_valid(cache_entry)) {
191        cache_entry.CacheState := state;
192    }
193  }
194
195  AccessPermission getAccessPermission(Addr addr) {
196    TBE tbe := TBEs.lookup(addr);
197    if(is_valid(tbe)) {
198      return TCC_State_to_permission(tbe.TBEState);
199    }
200
201    Entry cache_entry := getCacheEntry(addr);
202    if(is_valid(cache_entry)) {
203      return TCC_State_to_permission(cache_entry.CacheState);
204    }
205
206    return AccessPermission:NotPresent;
207  }
208
209  void setAccessPermission(Entry cache_entry, Addr addr, State state) {
210    if (is_valid(cache_entry)) {
211      cache_entry.changePermission(TCC_State_to_permission(state));
212    }
213  }
214
215  void functionalRead(Addr addr, Packet *pkt) {
216    TBE tbe := TBEs.lookup(addr);
217    if(is_valid(tbe)) {
218      testAndRead(addr, tbe.DataBlk, pkt);
219    } else {
220      functionalMemoryRead(pkt);
221    }
222  }
223
224  int functionalWrite(Addr addr, Packet *pkt) {
225    int num_functional_writes := 0;
226
227    TBE tbe := TBEs.lookup(addr);
228    if(is_valid(tbe)) {
229      num_functional_writes := num_functional_writes +
230            testAndWrite(addr, tbe.DataBlk, pkt);
231    }
232
233    num_functional_writes := num_functional_writes + functionalMemoryWrite(pkt);
234    return num_functional_writes;
235  }
236
237  void recordRequestType(RequestType request_type, Addr addr) {
238    if (request_type == RequestType:DataArrayRead) {
239        L2cache.recordRequestType(CacheRequestType:DataArrayRead, addr);
240    } else if (request_type == RequestType:DataArrayWrite) {
241        L2cache.recordRequestType(CacheRequestType:DataArrayWrite, addr);
242    } else if (request_type == RequestType:TagArrayRead) {
243        L2cache.recordRequestType(CacheRequestType:TagArrayRead, addr);
244    } else if (request_type == RequestType:TagArrayWrite) {
245        L2cache.recordRequestType(CacheRequestType:TagArrayWrite, addr);
246    }
247  }
248
249  bool checkResourceAvailable(RequestType request_type, Addr addr) {
250    if (request_type == RequestType:DataArrayRead) {
251      return L2cache.checkResourceAvailable(CacheResourceType:DataArray, addr);
252    } else if (request_type == RequestType:DataArrayWrite) {
253      return L2cache.checkResourceAvailable(CacheResourceType:DataArray, addr);
254    } else if (request_type == RequestType:TagArrayRead) {
255      return L2cache.checkResourceAvailable(CacheResourceType:TagArray, addr);
256    } else if (request_type == RequestType:TagArrayWrite) {
257      return L2cache.checkResourceAvailable(CacheResourceType:TagArray, addr);
258    } else {
259      error("Invalid RequestType type in checkResourceAvailable");
260      return true;
261    }
262  }
263
264
265
266  // OUT PORTS
267  out_port(w_requestNetwork_out, CPURequestMsg, w_reqToTCCDir);
268  out_port(w_TCCResp_out, ResponseMsg, w_respToTCCDir);
269  out_port(responseNetwork_out, ResponseMsg, responseFromTCC);
270  out_port(w_unblockNetwork_out, UnblockMsg, w_TCCUnblockToTCCDir);
271
272  // IN PORTS
273  in_port(TDResponse_in, ResponseMsg, w_respToTCC) {
274    if (TDResponse_in.isReady(clockEdge())) {
275      peek(TDResponse_in, ResponseMsg) {
276        Entry cache_entry := getCacheEntry(in_msg.addr);
277        TBE tbe := TBEs.lookup(in_msg.addr);
278        if (in_msg.Type == CoherenceResponseType:TDSysWBAck) {
279          trigger(Event:WBAck, in_msg.addr, cache_entry, tbe);
280        }
281        else {
282          DPRINTF(RubySlicc, "%s\n", in_msg);
283          error("Error on TDResponse Type");
284        }
285      }
286    }
287  }
288
289  // Response Network
290  in_port(responseNetwork_in, ResponseMsg, responseToTCC) {
291    if (responseNetwork_in.isReady(clockEdge())) {
292      peek(responseNetwork_in, ResponseMsg) {
293        Entry cache_entry := getCacheEntry(in_msg.addr);
294        TBE tbe := TBEs.lookup(in_msg.addr);
295        if (in_msg.Type == CoherenceResponseType:CPUData) {
296          if (in_msg.NbReqShared) {
297            trigger(Event:CPUDataShared, in_msg.addr, cache_entry, tbe);
298          } else {
299            trigger(Event:CPUData, in_msg.addr, cache_entry, tbe);
300          }
301        } else if (in_msg.Type == CoherenceResponseType:StaleNotif) {
302            trigger(Event:StaleWB, in_msg.addr, cache_entry, tbe);
303        } else {
304          DPRINTF(RubySlicc, "%s\n", in_msg);
305          error("Error on TDResponse Type");
306        }
307      }
308    }
309  }
310
311  // probe network
312  in_port(probeNetwork_in, TDProbeRequestMsg, w_probeToTCC) {
313    if (probeNetwork_in.isReady(clockEdge())) {
314      peek(probeNetwork_in, TDProbeRequestMsg) {
315        Entry cache_entry := getCacheEntry(in_msg.addr);
316        TBE tbe := TBEs.lookup(in_msg.addr);
317        if (in_msg.Type == ProbeRequestType:PrbInv) {
318          if (in_msg.ReturnData) {
319            trigger(Event:PrbInvData, in_msg.addr, cache_entry, tbe);
320          } else {
321            trigger(Event:PrbInv, in_msg.addr, cache_entry, tbe);
322          }
323        } else if (in_msg.Type == ProbeRequestType:PrbDowngrade) {
324          if (in_msg.ReturnData) {
325            trigger(Event:PrbShrData, in_msg.addr, cache_entry, tbe);
326          } else {
327            error("Don't think I should get any of these");
328          }
329        }
330      }
331    }
332  }
333
334  // Request Network
335  in_port(requestNetwork_in, CPURequestMsg, w_reqToTCC) {
336    if (requestNetwork_in.isReady(clockEdge())) {
337      peek(requestNetwork_in, CPURequestMsg) {
338        assert(in_msg.Destination.isElement(machineID));
339        Entry cache_entry := getCacheEntry(in_msg.addr);
340        TBE tbe := TBEs.lookup(in_msg.addr);
341        if (in_msg.Type == CoherenceRequestType:RdBlk) {
342          trigger(Event:RdBlk, in_msg.addr, cache_entry, tbe);
343        } else if (in_msg.Type == CoherenceRequestType:RdBlkS) {
344          trigger(Event:RdBlkS, in_msg.addr, cache_entry, tbe);
345        } else if (in_msg.Type == CoherenceRequestType:RdBlkM) {
346          trigger(Event:RdBlkM, in_msg.addr, cache_entry, tbe);
347        } else if (in_msg.Type == CoherenceRequestType:VicClean) {
348          if (presentOrAvail(in_msg.addr)) {
349            if (in_msg.Shared) {
350              trigger(Event:ClVicBlkShared, in_msg.addr, cache_entry, tbe);
351            } else {
352              trigger(Event:ClVicBlk, in_msg.addr, cache_entry, tbe);
353            }
354          } else {
355            Addr victim :=  L2cache.cacheProbe(in_msg.addr);
356            trigger(Event:L2_Repl, victim, getCacheEntry(victim), TBEs.lookup(victim));
357          }
358        } else if (in_msg.Type == CoherenceRequestType:VicDirty) {
359          if (presentOrAvail(in_msg.addr)) {
360            if (in_msg.Shared) {
361              trigger(Event:WrVicBlkShared, in_msg.addr, cache_entry, tbe);
362            } else {
363              trigger(Event:WrVicBlk, in_msg.addr, cache_entry, tbe);
364            }
365          } else {
366            Addr victim := L2cache.cacheProbe(in_msg.addr);
367            trigger(Event:L2_Repl, victim, getCacheEntry(victim), TBEs.lookup(victim));
368          }
369        } else {
370            requestNetwork_in.recycle(clockEdge(), cyclesToTicks(recycle_latency));
371        }
372      }
373    }
374  }
375
376  // BEGIN ACTIONS
377
378  action(i_invL2, "i", desc="invalidate TCC cache block") {
379    if (is_valid(cache_entry)) {
380        L2cache.deallocate(address);
381    }
382    unset_cache_entry();
383  }
384
385  action(rm_sendResponseM, "rm", desc="send Modified response") {
386    peek(requestNetwork_in, CPURequestMsg) {
387      enqueue(responseNetwork_out, ResponseMsg, l2_response_latency) {
388        out_msg.addr := address;
389        out_msg.Type := CoherenceResponseType:TDSysResp;
390        out_msg.Sender := machineID;
391        out_msg.Destination.add(in_msg.Requestor);
392        out_msg.DataBlk := cache_entry.DataBlk;
393        out_msg.MessageSize := MessageSizeType:Response_Data;
394        out_msg.Dirty := cache_entry.Dirty;
395        out_msg.State := CoherenceState:Modified;
396        DPRINTF(RubySlicc, "%s\n", out_msg);
397      }
398    }
399  }
400
401  action(rs_sendResponseS, "rs", desc="send Shared response") {
402    peek(requestNetwork_in, CPURequestMsg) {
403      enqueue(responseNetwork_out, ResponseMsg, l2_response_latency) {
404        out_msg.addr := address;
405        out_msg.Type := CoherenceResponseType:TDSysResp;
406        out_msg.Sender := machineID;
407        out_msg.Destination.add(in_msg.Requestor);
408        out_msg.DataBlk := cache_entry.DataBlk;
409        out_msg.MessageSize := MessageSizeType:Response_Data;
410        out_msg.Dirty := cache_entry.Dirty;
411        out_msg.State := CoherenceState:Shared;
412        DPRINTF(RubySlicc, "%s\n", out_msg);
413      }
414    }
415  }
416
417
418  action(r_requestToTD, "r", desc="Miss in L2, pass on") {
419    peek(requestNetwork_in, CPURequestMsg) {
420      enqueue(w_requestNetwork_out, CPURequestMsg, l2_request_latency) {
421        out_msg.addr := address;
422        out_msg.Type := in_msg.Type;
423        out_msg.Requestor := in_msg.Requestor;
424        out_msg.Destination.add(mapAddressToRange(address,MachineType:TCCdir,
425                                TCC_select_low_bit, TCC_select_num_bits));
426        out_msg.Shared := false; // unneeded for this request
427        out_msg.MessageSize := in_msg.MessageSize;
428        DPRINTF(RubySlicc, "%s\n", out_msg);
429      }
430    }
431  }
432
433  action(t_allocateTBE, "t", desc="allocate TBE Entry") {
434    TBEs.allocate(address);
435    set_tbe(TBEs.lookup(address));
436    if (is_valid(cache_entry)) {
437      tbe.DataBlk := cache_entry.DataBlk; // Data only for WBs
438      tbe.Dirty := cache_entry.Dirty;
439    }
440    tbe.From := machineID;
441  }
442
443  action(dt_deallocateTBE, "dt", desc="deallocate TBE Entry") {
444    TBEs.deallocate(address);
445    unset_tbe();
446  }
447
448  action(vc_vicClean, "vc", desc="Victimize Clean L2 data") {
449    enqueue(w_requestNetwork_out, CPURequestMsg, l2_request_latency) {
450      out_msg.addr := address;
451      out_msg.Type := CoherenceRequestType:VicClean;
452      out_msg.Requestor := machineID;
453      out_msg.DataBlk := cache_entry.DataBlk;
454      out_msg.Destination.add(mapAddressToRange(address,MachineType:TCCdir,
455                              TCC_select_low_bit, TCC_select_num_bits));
456      out_msg.MessageSize := MessageSizeType:Response_Data;
457    }
458  }
459
460  action(vd_vicDirty, "vd", desc="Victimize dirty L2 data") {
461    enqueue(w_requestNetwork_out, CPURequestMsg, l2_request_latency) {
462      out_msg.addr := address;
463      out_msg.Type := CoherenceRequestType:VicDirty;
464      out_msg.Requestor := machineID;
465      out_msg.DataBlk := cache_entry.DataBlk;
466      out_msg.Destination.add(mapAddressToRange(address,MachineType:TCCdir,
467                              TCC_select_low_bit, TCC_select_num_bits));
468      out_msg.MessageSize := MessageSizeType:Response_Data;
469    }
470  }
471
472  action(w_sendResponseWBAck, "w", desc="send WB Ack") {
473    peek(requestNetwork_in, CPURequestMsg) {
474      enqueue(responseNetwork_out, ResponseMsg, l2_response_latency) {
475        out_msg.addr := address;
476        out_msg.Type := CoherenceResponseType:TDSysWBAck;
477        out_msg.Destination.add(in_msg.Requestor);
478        out_msg.Sender := machineID;
479        out_msg.MessageSize := MessageSizeType:Writeback_Control;
480      }
481    }
482  }
483
484  action(pi_sendProbeResponseInv, "pi", desc="send probe ack inv, no data") {
485    enqueue(w_TCCResp_out, ResponseMsg, l2_request_latency) {
486      out_msg.addr := address;
487      out_msg.Type := CoherenceResponseType:CPUPrbResp;  // TCC and CPUs respond in same way to probes
488      out_msg.Sender := machineID;
489      // will this always be ok? probably not for multisocket
490      out_msg.Destination.add(mapAddressToRange(address,MachineType:TCCdir,
491                              TCC_select_low_bit, TCC_select_num_bits));
492      out_msg.Dirty := false;
493      out_msg.Hit := false;
494      out_msg.Ntsl := true;
495      out_msg.State := CoherenceState:NA;
496      out_msg.MessageSize := MessageSizeType:Response_Control;
497    }
498  }
499
500  action(ph_sendProbeResponseHit, "ph", desc="send probe ack, no data") {
501    enqueue(w_TCCResp_out, ResponseMsg, l2_request_latency) {
502      out_msg.addr := address;
503      out_msg.Type := CoherenceResponseType:CPUPrbResp;  // TCC and CPUs respond in same way to probes
504      out_msg.Sender := machineID;
505      // will this always be ok? probably not for multisocket
506      out_msg.Destination.add(mapAddressToRange(address,MachineType:TCCdir,
507                              TCC_select_low_bit, TCC_select_num_bits));
508      out_msg.Dirty := false;
509      out_msg.Hit := true;
510      out_msg.Ntsl := false;
511      out_msg.State := CoherenceState:NA;
512      out_msg.MessageSize := MessageSizeType:Response_Control;
513    }
514  }
515
516  action(pm_sendProbeResponseMiss, "pm", desc="send probe ack, no data") {
517    enqueue(w_TCCResp_out, ResponseMsg, l2_request_latency) {
518      out_msg.addr := address;
519      out_msg.Type := CoherenceResponseType:CPUPrbResp;  // TCC and CPUs respond in same way to probes
520      out_msg.Sender := machineID;
521      // will this always be ok? probably not for multisocket
522      out_msg.Destination.add(mapAddressToRange(address,MachineType:TCCdir,
523                              TCC_select_low_bit, TCC_select_num_bits));
524      out_msg.Dirty := false;
525      out_msg.Hit := false;
526      out_msg.Ntsl := false;
527      out_msg.State := CoherenceState:NA;
528      out_msg.MessageSize := MessageSizeType:Response_Control;
529    }
530  }
531
532  action(pd_sendProbeResponseData, "pd", desc="send probe ack, with data") {
533    enqueue(w_TCCResp_out, ResponseMsg, l2_request_latency) {
534      out_msg.addr := address;
535      out_msg.Type := CoherenceResponseType:CPUPrbResp;  // TCC and CPUs respond in same way to probes
536      out_msg.Sender := machineID;
537      // will this always be ok? probably not for multisocket
538      out_msg.Destination.add(mapAddressToRange(address,MachineType:TCCdir,
539                              TCC_select_low_bit, TCC_select_num_bits));
540      out_msg.DataBlk := cache_entry.DataBlk;
541      //assert(cache_entry.Dirty); Not needed in TCC where TCC can supply clean data
542      out_msg.Dirty := cache_entry.Dirty;
543      out_msg.Hit := true;
544      out_msg.State := CoherenceState:NA;
545      out_msg.MessageSize := MessageSizeType:Response_Data;
546    }
547  }
548
549  action(pdt_sendProbeResponseDataFromTBE, "pdt", desc="send probe ack with data") {
550    enqueue(w_TCCResp_out, ResponseMsg, l2_request_latency) {
551      out_msg.addr := address;
552      out_msg.Type := CoherenceResponseType:CPUPrbResp;
553      out_msg.Sender := machineID;
554      out_msg.Destination.add(mapAddressToRange(address,MachineType:TCCdir,
555                              TCC_select_low_bit, TCC_select_num_bits));
556      out_msg.DataBlk := tbe.DataBlk;
557      //assert(tbe.Dirty);
558      out_msg.Dirty := tbe.Dirty;
559      out_msg.Hit := true;
560      out_msg.MessageSize := MessageSizeType:Response_Data;
561      out_msg.State := CoherenceState:NA;
562      DPRINTF(RubySlicc, "%s\n", out_msg);
563    }
564  }
565
566  action(mc_cancelMemWriteback, "mc", desc="send writeback cancel to memory") {
567    enqueue(w_requestNetwork_out, CPURequestMsg, l2_request_latency) {
568      out_msg.addr := address;
569      out_msg.Type := CoherenceRequestType:WrCancel;
570      out_msg.Requestor := machineID;
571      out_msg.Destination.add(mapAddressToRange(address,MachineType:TCCdir,
572                              TCC_select_low_bit, TCC_select_num_bits));
573      out_msg.MessageSize := MessageSizeType:Request_Control;
574    }
575  }
576
577  action(a_allocateBlock, "a", desc="allocate TCC block") {
578    if (is_invalid(cache_entry)) {
579      set_cache_entry(L2cache.allocate(address, new Entry));
580    }
581  }
582
583  action(d_writeData, "d", desc="write data to TCC") {
584    peek(responseNetwork_in, ResponseMsg) {
585      if (in_msg.Dirty) {
586        cache_entry.Dirty := in_msg.Dirty;
587      }
588      cache_entry.DataBlk := in_msg.DataBlk;
589      DPRINTF(RubySlicc, "Writing to TCC: %s\n", in_msg);
590    }
591  }
592
593  action(rd_copyDataFromRequest, "rd", desc="write data to TCC") {
594    peek(requestNetwork_in, CPURequestMsg) {
595      cache_entry.DataBlk := in_msg.DataBlk;
596      cache_entry.Dirty := true;
597    }
598  }
599
600  action(f_setFrom, "f", desc="set who WB is expected to come from") {
601    peek(requestNetwork_in, CPURequestMsg) {
602      tbe.From := in_msg.Requestor;
603    }
604  }
605
606  action(rf_resetFrom, "rf", desc="reset From") {
607    tbe.From := machineID;
608  }
609
610  action(wb_data, "wb", desc="write back data") {
611    enqueue(w_TCCResp_out, ResponseMsg, l2_request_latency) {
612      out_msg.addr := address;
613      out_msg.Type := CoherenceResponseType:CPUData;
614      out_msg.Sender := machineID;
615      out_msg.Destination.add(mapAddressToRange(address,MachineType:TCCdir,
616                              TCC_select_low_bit, TCC_select_num_bits));
617      out_msg.DataBlk := tbe.DataBlk;
618      out_msg.Dirty := tbe.Dirty;
619      if (tbe.Shared) {
620        out_msg.NbReqShared := true;
621      } else {
622        out_msg.NbReqShared := false;
623      }
624      out_msg.State := CoherenceState:Shared; // faux info
625      out_msg.MessageSize := MessageSizeType:Writeback_Data;
626      DPRINTF(RubySlicc, "%s\n", out_msg);
627    }
628  }
629
630  action(wt_writeDataToTBE, "wt", desc="write WB data to TBE") {
631    peek(responseNetwork_in, ResponseMsg) {
632      tbe.DataBlk := in_msg.DataBlk;
633      tbe.Dirty := in_msg.Dirty;
634    }
635  }
636
637  action(uo_sendUnblockOwner, "uo", desc="state changed to E, M, or O, unblock") {
638    enqueue(w_unblockNetwork_out, UnblockMsg, l2_request_latency) {
639      out_msg.addr := address;
640      out_msg.Sender := machineID;
641      out_msg.Destination.add(mapAddressToRange(address,MachineType:TCCdir,
642                              TCC_select_low_bit, TCC_select_num_bits));
643      out_msg.MessageSize := MessageSizeType:Unblock_Control;
644      out_msg.currentOwner := true;
645      out_msg.valid := true;
646      DPRINTF(RubySlicc, "%s\n", out_msg);
647    }
648  }
649
650  action(us_sendUnblockSharer, "us", desc="state changed to S , unblock") {
651    enqueue(w_unblockNetwork_out, UnblockMsg, l2_request_latency) {
652      out_msg.addr := address;
653      out_msg.Sender := machineID;
654      out_msg.Destination.add(mapAddressToRange(address,MachineType:TCCdir,
655                              TCC_select_low_bit, TCC_select_num_bits));
656      out_msg.MessageSize := MessageSizeType:Unblock_Control;
657      out_msg.currentOwner := false;
658      out_msg.valid := true;
659      DPRINTF(RubySlicc, "%s\n", out_msg);
660    }
661  }
662
663  action(un_sendUnblockNotValid, "un", desc="state changed toI, unblock") {
664    enqueue(w_unblockNetwork_out, UnblockMsg, l2_request_latency) {
665      out_msg.addr := address;
666      out_msg.Sender := machineID;
667      out_msg.Destination.add(mapAddressToRange(address,MachineType:TCCdir,
668                              TCC_select_low_bit, TCC_select_num_bits));
669      out_msg.MessageSize := MessageSizeType:Unblock_Control;
670      out_msg.currentOwner := false;
671      out_msg.valid := false;
672      DPRINTF(RubySlicc, "%s\n", out_msg);
673    }
674  }
675
676  action(ut_updateTag, "ut", desc="update Tag (i.e. set MRU)") {
677    L2cache.setMRU(address);
678  }
679
680  action(p_popRequestQueue, "p", desc="pop request queue") {
681    requestNetwork_in.dequeue(clockEdge());
682  }
683
684  action(pr_popResponseQueue, "pr", desc="pop response queue") {
685    responseNetwork_in.dequeue(clockEdge());
686  }
687
688  action(pn_popTDResponseQueue, "pn", desc="pop TD response queue") {
689    TDResponse_in.dequeue(clockEdge());
690  }
691
692  action(pp_popProbeQueue, "pp", desc="pop probe queue") {
693    probeNetwork_in.dequeue(clockEdge());
694  }
695
696  action(zz_recycleRequestQueue, "\z", desc="recycle request queue") {
697    requestNetwork_in.recycle(clockEdge(), cyclesToTicks(recycle_latency));
698  }
699
700
701  // END ACTIONS
702
703  // BEGIN TRANSITIONS
704
705  // transitions from base
706
707  transition({I, I_C}, {RdBlk, RdBlkS, RdBlkM, CtoD}){TagArrayRead} {
708    // TCCdir already knows that the block is not here. This is to allocate and get the block.
709    r_requestToTD;
710    p_popRequestQueue;
711  }
712
713// check
714  transition({M, O}, RdBlk, O){TagArrayRead, TagArrayWrite} {
715    rs_sendResponseS;
716    ut_updateTag;
717    // detect 2nd chancing
718    p_popRequestQueue;
719  }
720
721//check
722  transition({E, S}, RdBlk, S){TagArrayRead, TagArrayWrite} {
723    rs_sendResponseS;
724    ut_updateTag;
725    // detect 2nd chancing
726    p_popRequestQueue;
727  }
728
729// check
730  transition({M, O}, RdBlkS, O){TagArrayRead, TagArrayWrite} {
731    rs_sendResponseS;
732    ut_updateTag;
733    // detect 2nd chance sharing
734    p_popRequestQueue;
735  }
736
737//check
738  transition({E, S}, RdBlkS, S){TagArrayRead, TagArrayWrite} {
739    rs_sendResponseS;
740    ut_updateTag;
741    // detect 2nd chance sharing
742    p_popRequestQueue;
743  }
744
745// check
746  transition(M, RdBlkM, I){TagArrayRead, TagArrayWrite} {
747    rm_sendResponseM;
748    i_invL2;
749    p_popRequestQueue;
750  }
751
752  //check
753  transition(E, RdBlkM, I){TagArrayRead, TagArrayWrite} {
754    rm_sendResponseM;
755    i_invL2;
756    p_popRequestQueue;
757  }
758
759// check
760  transition({I}, WrVicBlk, I_M){TagArrayRead} {
761    a_allocateBlock;
762    t_allocateTBE;
763    f_setFrom;
764    w_sendResponseWBAck;
765    p_popRequestQueue;
766  }
767
768  transition(I_C, {WrVicBlk, WrVicBlkShared, ClVicBlk, ClVicBlkShared}) {
769    zz_recycleRequestQueue;
770  }
771
772//check
773  transition({I}, WrVicBlkShared, I_O) {TagArrayRead}{
774    a_allocateBlock;
775    t_allocateTBE;
776    f_setFrom;
777//    rd_copyDataFromRequest;
778    w_sendResponseWBAck;
779    p_popRequestQueue;
780  }
781
782//check
783  transition(S, WrVicBlkShared, S_O){TagArrayRead} {
784    t_allocateTBE;
785    f_setFrom;
786    w_sendResponseWBAck;
787    p_popRequestQueue;
788  }
789
790// a stale writeback
791 transition(S, WrVicBlk, S_S){TagArrayRead} {
792   t_allocateTBE;
793   f_setFrom;
794   w_sendResponseWBAck;
795   p_popRequestQueue;
796 }
797
798// a stale writeback
799  transition(E, WrVicBlk, E_E){TagArrayRead} {
800    t_allocateTBE;
801    f_setFrom;
802    w_sendResponseWBAck;
803    p_popRequestQueue;
804  }
805
806// a stale writeback
807  transition(E, WrVicBlkShared, E_E){TagArrayRead} {
808    t_allocateTBE;
809    f_setFrom;
810    w_sendResponseWBAck;
811    p_popRequestQueue;
812  }
813
814// a stale writeback
815  transition(O, WrVicBlk, O_O){TagArrayRead} {
816    t_allocateTBE;
817    f_setFrom;
818    w_sendResponseWBAck;
819    p_popRequestQueue;
820  }
821
822// a stale writeback
823 transition(O, WrVicBlkShared, O_O){TagArrayRead} {
824   t_allocateTBE;
825   f_setFrom;
826   w_sendResponseWBAck;
827   p_popRequestQueue;
828 }
829
830// a stale writeback
831  transition(M, WrVicBlk, M_M){TagArrayRead} {
832    t_allocateTBE;
833    f_setFrom;
834    w_sendResponseWBAck;
835    p_popRequestQueue;
836  }
837
838// a stale writeback
839  transition(M, WrVicBlkShared, M_O){TagArrayRead} {
840    t_allocateTBE;
841    f_setFrom;
842    w_sendResponseWBAck;
843    p_popRequestQueue;
844  }
845
846//check
847  transition({I}, ClVicBlk, I_E){TagArrayRead} {
848    t_allocateTBE;
849    f_setFrom;
850    a_allocateBlock;
851    w_sendResponseWBAck;
852    p_popRequestQueue;
853  }
854
855  transition({I}, ClVicBlkShared, I_S){TagArrayRead} {
856    t_allocateTBE;
857    f_setFrom;
858    a_allocateBlock;
859    w_sendResponseWBAck;
860    p_popRequestQueue;
861  }
862
863//check
864  transition(S, ClVicBlkShared, S_S){TagArrayRead} {
865    t_allocateTBE;
866    f_setFrom;
867    w_sendResponseWBAck;
868    p_popRequestQueue;
869  }
870
871// a stale writeback
872  transition(E, ClVicBlk, E_E){TagArrayRead} {
873    t_allocateTBE;
874    f_setFrom;
875    w_sendResponseWBAck;
876    p_popRequestQueue;
877  }
878
879// a stale writeback
880  transition(E, ClVicBlkShared, E_S){TagArrayRead} {
881    t_allocateTBE;
882    f_setFrom;
883    w_sendResponseWBAck;
884    p_popRequestQueue;
885  }
886
887// a stale writeback
888 transition(O, ClVicBlk, O_O){TagArrayRead} {
889   t_allocateTBE;
890   f_setFrom;
891   w_sendResponseWBAck;
892   p_popRequestQueue;
893 }
894
895// check. Original L3 ahd it going from O to O_S. Something can go from O to S only on writeback.
896  transition(O, ClVicBlkShared, O_O){TagArrayRead} {
897    t_allocateTBE;
898    f_setFrom;
899    w_sendResponseWBAck;
900    p_popRequestQueue;
901  }
902
903// a stale writeback
904 transition(M, ClVicBlk, M_E){TagArrayRead} {
905   t_allocateTBE;
906   f_setFrom;
907   w_sendResponseWBAck;
908   p_popRequestQueue;
909 }
910
911// a stale writeback
912 transition(M, ClVicBlkShared, M_S){TagArrayRead} {
913   t_allocateTBE;
914   f_setFrom;
915   w_sendResponseWBAck;
916   p_popRequestQueue;
917 }
918
919
920  transition({MO_I}, {RdBlk, RdBlkS, RdBlkM, CtoD}) {
921    a_allocateBlock;
922    t_allocateTBE;
923    f_setFrom;
924    r_requestToTD;
925    p_popRequestQueue;
926  }
927
928  transition(MO_I, {WrVicBlkShared, WrVicBlk, ClVicBlk, ClVicBlkShared}, MOD_I) {
929    f_setFrom;
930    w_sendResponseWBAck;
931    p_popRequestQueue;
932  }
933
934  transition(I_M, CPUData, M){TagArrayWrite} {
935    uo_sendUnblockOwner;
936    dt_deallocateTBE;
937    d_writeData;
938    pr_popResponseQueue;
939  }
940
941  transition(I_M, CPUDataShared, O){TagArrayWrite, DataArrayWrite} {
942    uo_sendUnblockOwner;
943    dt_deallocateTBE;
944    d_writeData;
945    pr_popResponseQueue;
946  }
947
948  transition(I_O, {CPUData, CPUDataShared}, O){TagArrayWrite, DataArrayWrite}  {
949    uo_sendUnblockOwner;
950    dt_deallocateTBE;
951    d_writeData;
952    pr_popResponseQueue;
953  }
954
955  transition(I_E, CPUData, E){TagArrayWrite, DataArrayWrite}  {
956    uo_sendUnblockOwner;
957    dt_deallocateTBE;
958    d_writeData;
959    pr_popResponseQueue;
960  }
961
962  transition(I_E, CPUDataShared, S){TagArrayWrite, DataArrayWrite}  {
963    us_sendUnblockSharer;
964    dt_deallocateTBE;
965    d_writeData;
966    pr_popResponseQueue;
967  }
968
969  transition(I_S, {CPUData, CPUDataShared}, S){TagArrayWrite, DataArrayWrite}  {
970    us_sendUnblockSharer;
971    dt_deallocateTBE;
972    d_writeData;
973    pr_popResponseQueue;
974  }
975
976  transition(S_M, CPUDataShared, O){TagArrayWrite, DataArrayWrite}  {
977    uo_sendUnblockOwner;
978    dt_deallocateTBE;
979    d_writeData;
980    ut_updateTag;  // update tag on writeback hits.
981    pr_popResponseQueue;
982  }
983
984  transition(S_O, {CPUData, CPUDataShared}, O){TagArrayWrite, DataArrayWrite}  {
985    uo_sendUnblockOwner;
986    dt_deallocateTBE;
987    d_writeData;
988    ut_updateTag;  // update tag on writeback hits.
989    pr_popResponseQueue;
990  }
991
992  transition(S_E, CPUDataShared, S){TagArrayWrite, DataArrayWrite}  {
993    us_sendUnblockSharer;
994    dt_deallocateTBE;
995    d_writeData;
996    ut_updateTag;  // update tag on writeback hits.
997    pr_popResponseQueue;
998  }
999
1000  transition(S_S, {CPUData, CPUDataShared}, S){TagArrayWrite, DataArrayWrite}  {
1001    us_sendUnblockSharer;
1002    dt_deallocateTBE;
1003    d_writeData;
1004    ut_updateTag;  // update tag on writeback hits.
1005    pr_popResponseQueue;
1006  }
1007
1008  transition(O_E, CPUDataShared, O){TagArrayWrite, DataArrayWrite}  {
1009    uo_sendUnblockOwner;
1010    dt_deallocateTBE;
1011    d_writeData;
1012    ut_updateTag;  // update tag on writeback hits.
1013    pr_popResponseQueue;
1014  }
1015
1016  transition(O_O, {CPUData, CPUDataShared}, O){TagArrayWrite, DataArrayWrite}  {
1017    uo_sendUnblockOwner;
1018    dt_deallocateTBE;
1019    d_writeData;
1020    ut_updateTag;  // update tag on writeback hits.
1021    pr_popResponseQueue;
1022  }
1023
1024  transition({D_I}, {CPUData, CPUDataShared}, I){TagArrayWrite}  {
1025    un_sendUnblockNotValid;
1026    dt_deallocateTBE;
1027    pr_popResponseQueue;
1028  }
1029
1030  transition(MOD_I, {CPUData, CPUDataShared}, MO_I) {
1031    un_sendUnblockNotValid;
1032    rf_resetFrom;
1033    pr_popResponseQueue;
1034  }
1035
1036  transition({O,S,I}, CPUData) {
1037    pr_popResponseQueue;
1038  }
1039
1040  transition({M, O}, L2_Repl, MO_I){TagArrayRead, DataArrayRead} {
1041    t_allocateTBE;
1042    vd_vicDirty;
1043    i_invL2;
1044  }
1045
1046  transition({E, S,}, L2_Repl, ES_I){TagArrayRead, DataArrayRead} {
1047    t_allocateTBE;
1048    vc_vicClean;
1049    i_invL2;
1050  }
1051
1052  transition({I_M, I_O, S_M, S_O, E_M, E_O}, L2_Repl) {
1053    zz_recycleRequestQueue;
1054  }
1055
1056  transition({O_M, O_O, O_E, M_M, M_O, M_E, M_S}, L2_Repl) {
1057    zz_recycleRequestQueue;
1058  }
1059
1060  transition({I_E, I_S, S_E, S_S, E_E, E_S}, L2_Repl) {
1061    zz_recycleRequestQueue;
1062  }
1063
1064  transition({M, O}, PrbInvData, I){TagArrayRead, TagArrayWrite} {
1065    pd_sendProbeResponseData;
1066    i_invL2;
1067    pp_popProbeQueue;
1068  }
1069
1070  transition(I, PrbInvData){TagArrayRead, TagArrayWrite}  {
1071    pi_sendProbeResponseInv;
1072    pp_popProbeQueue;
1073  }
1074
1075  transition({E, S}, PrbInvData, I){TagArrayRead, TagArrayWrite}  {
1076    pd_sendProbeResponseData;
1077    i_invL2;
1078    pp_popProbeQueue;
1079  }
1080
1081  transition({M, O, E, S, I}, PrbInv, I){TagArrayRead, TagArrayWrite}  {
1082    pi_sendProbeResponseInv;
1083    i_invL2; // nothing will happen in I
1084    pp_popProbeQueue;
1085  }
1086
1087  transition({M, O}, PrbShrData, O){TagArrayRead, TagArrayWrite}  {
1088    pd_sendProbeResponseData;
1089    pp_popProbeQueue;
1090  }
1091
1092  transition({E, S}, PrbShrData, S){TagArrayRead, TagArrayWrite}  {
1093    pd_sendProbeResponseData;
1094    pp_popProbeQueue;
1095  }
1096
1097  transition(I, PrbShrData){TagArrayRead}  {
1098    pm_sendProbeResponseMiss;
1099    pp_popProbeQueue;
1100  }
1101
1102  transition(MO_I, PrbInvData, I_C) {
1103    pdt_sendProbeResponseDataFromTBE;
1104    pp_popProbeQueue;
1105  }
1106
1107  transition(ES_I, PrbInvData, I_C) {
1108    pi_sendProbeResponseInv;
1109    pp_popProbeQueue;
1110  }
1111
1112  transition({ES_I,MO_I}, PrbInv, I_C) {
1113    pi_sendProbeResponseInv;
1114    pp_popProbeQueue;
1115  }
1116
1117  transition({ES_I, MO_I}, PrbShrData) {
1118    pdt_sendProbeResponseDataFromTBE;
1119    pp_popProbeQueue;
1120  }
1121
1122  transition(I_C, {PrbInvData, PrbInv}) {
1123    pi_sendProbeResponseInv;
1124    pp_popProbeQueue;
1125  }
1126
1127  transition(I_C, PrbShrData) {
1128    pm_sendProbeResponseMiss;
1129    pp_popProbeQueue;
1130  }
1131
1132  transition(MOD_I, WBAck, D_I) {
1133    pn_popTDResponseQueue;
1134  }
1135
1136  transition(MO_I, WBAck, I){TagArrayWrite} {
1137    dt_deallocateTBE;
1138    pn_popTDResponseQueue;
1139  }
1140
1141  // this can only be a spurious CPUData from a shared block.
1142  transition(MO_I, CPUData) {
1143    pr_popResponseQueue;
1144  }
1145
1146  transition(ES_I, WBAck, I){TagArrayWrite} {
1147    dt_deallocateTBE;
1148    pn_popTDResponseQueue;
1149  }
1150
1151  transition(I_C, {WBAck}, I){TagArrayWrite} {
1152    dt_deallocateTBE;
1153    pn_popTDResponseQueue;
1154  }
1155
1156  transition({I_M, I_O, I_E, I_S}, StaleWB, I){TagArrayWrite} {
1157    un_sendUnblockNotValid;
1158    dt_deallocateTBE;
1159    i_invL2;
1160    pr_popResponseQueue;
1161  }
1162
1163  transition({S_S, S_O, S_M, S_E}, StaleWB, S){TagArrayWrite} {
1164    us_sendUnblockSharer;
1165    dt_deallocateTBE;
1166    pr_popResponseQueue;
1167  }
1168
1169  transition({E_M, E_O, E_E, E_S}, StaleWB, E){TagArrayWrite} {
1170    uo_sendUnblockOwner;
1171    dt_deallocateTBE;
1172    pr_popResponseQueue;
1173  }
1174
1175  transition({O_M, O_O, O_E}, StaleWB, O){TagArrayWrite} {
1176    uo_sendUnblockOwner;
1177    dt_deallocateTBE;
1178    pr_popResponseQueue;
1179  }
1180
1181  transition({M_M, M_O, M_E, M_S}, StaleWB, M){TagArrayWrite} {
1182    uo_sendUnblockOwner;
1183    dt_deallocateTBE;
1184    pr_popResponseQueue;
1185  }
1186
1187  transition(D_I, StaleWB, I) {TagArrayWrite}{
1188    un_sendUnblockNotValid;
1189    dt_deallocateTBE;
1190    pr_popResponseQueue;
1191  }
1192
1193  transition(MOD_I, StaleWB, MO_I) {
1194    un_sendUnblockNotValid;
1195    rf_resetFrom;
1196    pr_popResponseQueue;
1197  }
1198
1199}
1200