lsq.cc revision 11429:cf5af0cc3be4
1/*
2 * Copyright (c) 2013-2014 ARM Limited
3 * All rights reserved
4 *
5 * The license below extends only to copyright in the software and shall
6 * not be construed as granting a license to any other intellectual
7 * property including but not limited to intellectual property relating
8 * to a hardware implementation of the functionality of the software
9 * licensed hereunder.  You may use the software subject to the license
10 * terms below provided that you ensure that this notice is replicated
11 * unmodified and in its entirety in all distributions of the software,
12 * modified or unmodified, in source code or in binary form.
13 *
14 * Redistribution and use in source and binary forms, with or without
15 * modification, are permitted provided that the following conditions are
16 * met: redistributions of source code must retain the above copyright
17 * notice, this list of conditions and the following disclaimer;
18 * redistributions in binary form must reproduce the above copyright
19 * notice, this list of conditions and the following disclaimer in the
20 * documentation and/or other materials provided with the distribution;
21 * neither the name of the copyright holders nor the names of its
22 * contributors may be used to endorse or promote products derived from
23 * this software without specific prior written permission.
24 *
25 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
26 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
27 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
28 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
29 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
30 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
31 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
32 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
33 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
34 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
35 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36 *
37 * Authors: Andrew Bardsley
38 */
39
40#include <iomanip>
41#include <sstream>
42
43#include "arch/locked_mem.hh"
44#include "arch/mmapped_ipr.hh"
45#include "cpu/minor/cpu.hh"
46#include "cpu/minor/exec_context.hh"
47#include "cpu/minor/execute.hh"
48#include "cpu/minor/lsq.hh"
49#include "cpu/minor/pipeline.hh"
50#include "debug/Activity.hh"
51#include "debug/MinorMem.hh"
52
53namespace Minor
54{
55
56/** Returns the offset of addr into an aligned a block of size block_size */
57static Addr
58addrBlockOffset(Addr addr, unsigned int block_size)
59{
60    return addr & (block_size - 1);
61}
62
63/** Returns true if the given [addr .. addr+size-1] transfer needs to be
64 *  fragmented across a block size of block_size */
65static bool
66transferNeedsBurst(Addr addr, unsigned int size, unsigned int block_size)
67{
68    return (addrBlockOffset(addr, block_size) + size) > block_size;
69}
70
71LSQ::LSQRequest::LSQRequest(LSQ &port_, MinorDynInstPtr inst_, bool isLoad_,
72    PacketDataPtr data_, uint64_t *res_) :
73    SenderState(),
74    port(port_),
75    inst(inst_),
76    isLoad(isLoad_),
77    data(data_),
78    packet(NULL),
79    request(),
80    fault(NoFault),
81    res(res_),
82    skipped(false),
83    issuedToMemory(false),
84    state(NotIssued)
85{ }
86
87LSQ::AddrRangeCoverage
88LSQ::LSQRequest::containsAddrRangeOf(
89    Addr req1_addr, unsigned int req1_size,
90    Addr req2_addr, unsigned int req2_size)
91{
92    /* 'end' here means the address of the byte just past the request
93     *  blocks */
94    Addr req2_end_addr = req2_addr + req2_size;
95    Addr req1_end_addr = req1_addr + req1_size;
96
97    AddrRangeCoverage ret;
98
99    if (req1_addr > req2_end_addr || req1_end_addr < req2_addr)
100        ret = NoAddrRangeCoverage;
101    else if (req1_addr <= req2_addr && req1_end_addr >= req2_end_addr)
102        ret = FullAddrRangeCoverage;
103    else
104        ret = PartialAddrRangeCoverage;
105
106    return ret;
107}
108
109LSQ::AddrRangeCoverage
110LSQ::LSQRequest::containsAddrRangeOf(LSQRequestPtr other_request)
111{
112    return containsAddrRangeOf(request.getPaddr(), request.getSize(),
113        other_request->request.getPaddr(), other_request->request.getSize());
114}
115
116bool
117LSQ::LSQRequest::isBarrier()
118{
119    return inst->isInst() && inst->staticInst->isMemBarrier();
120}
121
122bool
123LSQ::LSQRequest::needsToBeSentToStoreBuffer()
124{
125    return state == StoreToStoreBuffer;
126}
127
128void
129LSQ::LSQRequest::setState(LSQRequestState new_state)
130{
131    DPRINTFS(MinorMem, (&port), "Setting state from %d to %d for request:"
132        " %s\n", state, new_state, *inst);
133    state = new_state;
134}
135
136bool
137LSQ::LSQRequest::isComplete() const
138{
139    /* @todo, There is currently only one 'completed' state.  This
140     *  may not be a good choice */
141    return state == Complete;
142}
143
144void
145LSQ::LSQRequest::reportData(std::ostream &os) const
146{
147    os << (isLoad ? 'R' : 'W') << ';';
148    inst->reportData(os);
149    os << ';' << state;
150}
151
152std::ostream &
153operator <<(std::ostream &os, LSQ::AddrRangeCoverage coverage)
154{
155    switch (coverage) {
156      case LSQ::PartialAddrRangeCoverage:
157        os << "PartialAddrRangeCoverage";
158        break;
159      case LSQ::FullAddrRangeCoverage:
160        os << "FullAddrRangeCoverage";
161        break;
162      case LSQ::NoAddrRangeCoverage:
163        os << "NoAddrRangeCoverage";
164        break;
165      default:
166        os << "AddrRangeCoverage-" << static_cast<int>(coverage);
167        break;
168    }
169    return os;
170}
171
172std::ostream &
173operator <<(std::ostream &os, LSQ::LSQRequest::LSQRequestState state)
174{
175    switch (state) {
176      case LSQ::LSQRequest::NotIssued:
177        os << "NotIssued";
178        break;
179      case LSQ::LSQRequest::InTranslation:
180        os << "InTranslation";
181        break;
182      case LSQ::LSQRequest::Translated:
183        os << "Translated";
184        break;
185      case LSQ::LSQRequest::Failed:
186        os << "Failed";
187        break;
188      case LSQ::LSQRequest::RequestIssuing:
189        os << "RequestIssuing";
190        break;
191      case LSQ::LSQRequest::StoreToStoreBuffer:
192        os << "StoreToStoreBuffer";
193        break;
194      case LSQ::LSQRequest::StoreInStoreBuffer:
195        os << "StoreInStoreBuffer";
196        break;
197      case LSQ::LSQRequest::StoreBufferIssuing:
198        os << "StoreBufferIssuing";
199        break;
200      case LSQ::LSQRequest::RequestNeedsRetry:
201        os << "RequestNeedsRetry";
202        break;
203      case LSQ::LSQRequest::StoreBufferNeedsRetry:
204        os << "StoreBufferNeedsRetry";
205        break;
206      case LSQ::LSQRequest::Complete:
207        os << "Complete";
208        break;
209      default:
210        os << "LSQRequestState-" << static_cast<int>(state);
211        break;
212    }
213    return os;
214}
215
216void
217LSQ::clearMemBarrier(MinorDynInstPtr inst)
218{
219    bool is_last_barrier = inst->id.execSeqNum >= lastMemBarrier;
220
221    DPRINTF(MinorMem, "Moving %s barrier out of store buffer inst: %s\n",
222        (is_last_barrier ? "last" : "a"), *inst);
223
224    if (is_last_barrier)
225        lastMemBarrier = 0;
226}
227
228void
229LSQ::SingleDataRequest::finish(const Fault &fault_, RequestPtr request_,
230                               ThreadContext *tc, BaseTLB::Mode mode)
231{
232    fault = fault_;
233
234    port.numAccessesInDTLB--;
235
236    DPRINTFS(MinorMem, (&port), "Received translation response for"
237        " request: %s\n", *inst);
238
239    makePacket();
240
241    setState(Translated);
242    port.tryToSendToTransfers(this);
243
244    /* Let's try and wake up the processor for the next cycle */
245    port.cpu.wakeupOnEvent(Pipeline::ExecuteStageId);
246}
247
248void
249LSQ::SingleDataRequest::startAddrTranslation()
250{
251    ThreadContext *thread = port.cpu.getContext(
252        inst->id.threadId);
253
254    port.numAccessesInDTLB++;
255
256    setState(LSQ::LSQRequest::InTranslation);
257
258    DPRINTFS(MinorMem, (&port), "Submitting DTLB request\n");
259    /* Submit the translation request.  The response will come through
260     *  finish/markDelayed on the LSQRequest as it bears the Translation
261     *  interface */
262    thread->getDTBPtr()->translateTiming(
263        &request, thread, this, (isLoad ? BaseTLB::Read : BaseTLB::Write));
264}
265
266void
267LSQ::SingleDataRequest::retireResponse(PacketPtr packet_)
268{
269    DPRINTFS(MinorMem, (&port), "Retiring packet\n");
270    packet = packet_;
271    packetInFlight = false;
272    setState(Complete);
273}
274
275void
276LSQ::SplitDataRequest::finish(const Fault &fault_, RequestPtr request_,
277                              ThreadContext *tc, BaseTLB::Mode mode)
278{
279    fault = fault_;
280
281    port.numAccessesInDTLB--;
282
283    unsigned int M5_VAR_USED expected_fragment_index =
284        numTranslatedFragments;
285
286    numInTranslationFragments--;
287    numTranslatedFragments++;
288
289    DPRINTFS(MinorMem, (&port), "Received translation response for fragment"
290        " %d of request: %s\n", expected_fragment_index, *inst);
291
292    assert(request_ == fragmentRequests[expected_fragment_index]);
293
294    /* Wake up next cycle to get things going again in case the
295     *  tryToSendToTransfers does take */
296    port.cpu.wakeupOnEvent(Pipeline::ExecuteStageId);
297
298    if (fault != NoFault) {
299        /* tryToSendToTransfers will handle the fault */
300
301        DPRINTFS(MinorMem, (&port), "Faulting translation for fragment:"
302            " %d of request: %s\n",
303            expected_fragment_index, *inst);
304
305        setState(Translated);
306        port.tryToSendToTransfers(this);
307    } else if (numTranslatedFragments == numFragments) {
308        makeFragmentPackets();
309
310        setState(Translated);
311        port.tryToSendToTransfers(this);
312    } else {
313        /* Avoid calling translateTiming from within ::finish */
314        assert(!translationEvent.scheduled());
315        port.cpu.schedule(translationEvent, curTick());
316    }
317}
318
319LSQ::SplitDataRequest::SplitDataRequest(LSQ &port_, MinorDynInstPtr inst_,
320    bool isLoad_, PacketDataPtr data_, uint64_t *res_) :
321    LSQRequest(port_, inst_, isLoad_, data_, res_),
322    translationEvent(*this),
323    numFragments(0),
324    numInTranslationFragments(0),
325    numTranslatedFragments(0),
326    numIssuedFragments(0),
327    numRetiredFragments(0),
328    fragmentRequests(),
329    fragmentPackets()
330{
331    /* Don't know how many elements are needed until the request is
332     *  populated by the caller. */
333}
334
335LSQ::SplitDataRequest::~SplitDataRequest()
336{
337    for (auto i = fragmentRequests.begin();
338        i != fragmentRequests.end(); i++)
339    {
340        delete *i;
341    }
342
343    for (auto i = fragmentPackets.begin();
344         i != fragmentPackets.end(); i++)
345    {
346        delete *i;
347    }
348}
349
350void
351LSQ::SplitDataRequest::makeFragmentRequests()
352{
353    Addr base_addr = request.getVaddr();
354    unsigned int whole_size = request.getSize();
355    unsigned int line_width = port.lineWidth;
356
357    unsigned int fragment_size;
358    Addr fragment_addr;
359
360    /* Assume that this transfer is across potentially many block snap
361     * boundaries:
362     *
363     * |      _|________|________|________|___     |
364     * |     |0| 1      | 2      | 3      | 4 |    |
365     * |     |_|________|________|________|___|    |
366     * |       |        |        |        |        |
367     *
368     *  The first transfer (0) can be up to lineWidth in size.
369     *  All the middle transfers (1-3) are lineWidth in size
370     *  The last transfer (4) can be from zero to lineWidth - 1 in size
371     */
372    unsigned int first_fragment_offset =
373        addrBlockOffset(base_addr, line_width);
374    unsigned int last_fragment_size =
375        addrBlockOffset(base_addr + whole_size, line_width);
376    unsigned int first_fragment_size =
377        line_width - first_fragment_offset;
378
379    unsigned int middle_fragments_total_size =
380        whole_size - (first_fragment_size + last_fragment_size);
381
382    assert(addrBlockOffset(middle_fragments_total_size, line_width) == 0);
383
384    unsigned int middle_fragment_count =
385        middle_fragments_total_size / line_width;
386
387    numFragments = 1 /* first */ + middle_fragment_count +
388        (last_fragment_size == 0 ? 0 : 1);
389
390    DPRINTFS(MinorMem, (&port), "Dividing transfer into %d fragmentRequests."
391        " First fragment size: %d Last fragment size: %d\n",
392        numFragments, first_fragment_size,
393        (last_fragment_size == 0 ? line_width : last_fragment_size));
394
395    assert(((middle_fragment_count * line_width) +
396        first_fragment_size + last_fragment_size) == whole_size);
397
398    fragment_addr = base_addr;
399    fragment_size = first_fragment_size;
400
401    /* Just past the last address in the request */
402    Addr end_addr = base_addr + whole_size;
403
404    for (unsigned int fragment_index = 0; fragment_index < numFragments;
405         fragment_index++)
406    {
407        bool M5_VAR_USED is_last_fragment = false;
408
409        if (fragment_addr == base_addr) {
410            /* First fragment */
411            fragment_size = first_fragment_size;
412        } else {
413            if ((fragment_addr + line_width) > end_addr) {
414                /* Adjust size of last fragment */
415                fragment_size = end_addr - fragment_addr;
416                is_last_fragment = true;
417            } else {
418                /* Middle fragments */
419                fragment_size = line_width;
420            }
421        }
422
423        Request *fragment = new Request();
424
425        fragment->setThreadContext(request.contextId(), /* thread id */ 0);
426        fragment->setVirt(0 /* asid */,
427            fragment_addr, fragment_size, request.getFlags(),
428            request.masterId(),
429            request.getPC());
430
431        DPRINTFS(MinorMem, (&port), "Generating fragment addr: 0x%x size: %d"
432            " (whole request addr: 0x%x size: %d) %s\n",
433            fragment_addr, fragment_size, base_addr, whole_size,
434            (is_last_fragment ? "last fragment" : ""));
435
436        fragment_addr += fragment_size;
437
438        fragmentRequests.push_back(fragment);
439    }
440}
441
442void
443LSQ::SplitDataRequest::makeFragmentPackets()
444{
445    Addr base_addr = request.getVaddr();
446
447    DPRINTFS(MinorMem, (&port), "Making packets for request: %s\n", *inst);
448
449    for (unsigned int fragment_index = 0; fragment_index < numFragments;
450         fragment_index++)
451    {
452        Request *fragment = fragmentRequests[fragment_index];
453
454        DPRINTFS(MinorMem, (&port), "Making packet %d for request: %s"
455            " (%d, 0x%x)\n",
456            fragment_index, *inst,
457            (fragment->hasPaddr() ? "has paddr" : "no paddr"),
458            (fragment->hasPaddr() ? fragment->getPaddr() : 0));
459
460        Addr fragment_addr = fragment->getVaddr();
461        unsigned int fragment_size = fragment->getSize();
462
463        uint8_t *request_data = NULL;
464
465        if (!isLoad) {
466            /* Split data for Packets.  Will become the property of the
467             *  outgoing Packets */
468            request_data = new uint8_t[fragment_size];
469            std::memcpy(request_data, data + (fragment_addr - base_addr),
470                fragment_size);
471        }
472
473        assert(fragment->hasPaddr());
474
475        PacketPtr fragment_packet =
476            makePacketForRequest(*fragment, isLoad, this, request_data);
477
478        fragmentPackets.push_back(fragment_packet);
479        /* Accumulate flags in parent request */
480        request.setFlags(fragment->getFlags());
481    }
482
483    /* Might as well make the overall/response packet here */
484    /* Get the physical address for the whole request/packet from the first
485     *  fragment */
486    request.setPaddr(fragmentRequests[0]->getPaddr());
487    makePacket();
488}
489
490void
491LSQ::SplitDataRequest::startAddrTranslation()
492{
493    setState(LSQ::LSQRequest::InTranslation);
494
495    makeFragmentRequests();
496
497    numInTranslationFragments = 0;
498    numTranslatedFragments = 0;
499
500    /* @todo, just do these in sequence for now with
501     * a loop of:
502     * do {
503     *  sendNextFragmentToTranslation ; translateTiming ; finish
504     * } while (numTranslatedFragments != numFragments);
505     */
506
507    /* Do first translation */
508    sendNextFragmentToTranslation();
509}
510
511PacketPtr
512LSQ::SplitDataRequest::getHeadPacket()
513{
514    assert(numIssuedFragments < numFragments);
515
516    return fragmentPackets[numIssuedFragments];
517}
518
519void
520LSQ::SplitDataRequest::stepToNextPacket()
521{
522    assert(numIssuedFragments < numFragments);
523
524    numIssuedFragments++;
525}
526
527void
528LSQ::SplitDataRequest::retireResponse(PacketPtr response)
529{
530    assert(numRetiredFragments < numFragments);
531
532    DPRINTFS(MinorMem, (&port), "Retiring fragment addr: 0x%x size: %d"
533        " offset: 0x%x (retired fragment num: %d) %s\n",
534        response->req->getVaddr(), response->req->getSize(),
535        request.getVaddr() - response->req->getVaddr(),
536        numRetiredFragments,
537        (fault == NoFault ? "" : fault->name()));
538
539    numRetiredFragments++;
540
541    if (skipped) {
542        /* Skip because we already knew the request had faulted or been
543         *  skipped */
544        DPRINTFS(MinorMem, (&port), "Skipping this fragment\n");
545    } else if (response->isError()) {
546        /* Mark up the error and leave to execute to handle it */
547        DPRINTFS(MinorMem, (&port), "Fragment has an error, skipping\n");
548        setSkipped();
549        packet->copyError(response);
550    } else {
551        if (isLoad) {
552            if (!data) {
553                /* For a split transfer, a Packet must be constructed
554                 *  to contain all returning data.  This is that packet's
555                 *  data */
556                data = new uint8_t[request.getSize()];
557            }
558
559            /* Populate the portion of the overall response data represented
560             *  by the response fragment */
561            std::memcpy(
562                data + (response->req->getVaddr() - request.getVaddr()),
563                response->getConstPtr<uint8_t>(),
564                response->req->getSize());
565        }
566    }
567
568    /* Complete early if we're skipping are no more in-flight accesses */
569    if (skipped && !hasPacketsInMemSystem()) {
570        DPRINTFS(MinorMem, (&port), "Completed skipped burst\n");
571        setState(Complete);
572        if (packet->needsResponse())
573            packet->makeResponse();
574    }
575
576    if (numRetiredFragments == numFragments)
577        setState(Complete);
578
579    if (!skipped && isComplete()) {
580        DPRINTFS(MinorMem, (&port), "Completed burst %d\n", packet != NULL);
581
582        DPRINTFS(MinorMem, (&port), "Retired packet isRead: %d isWrite: %d"
583             " needsResponse: %d packetSize: %s requestSize: %s responseSize:"
584             " %s\n", packet->isRead(), packet->isWrite(),
585             packet->needsResponse(), packet->getSize(), request.getSize(),
586             response->getSize());
587
588        /* A request can become complete by several paths, this is a sanity
589         *  check to make sure the packet's data is created */
590        if (!data) {
591            data = new uint8_t[request.getSize()];
592        }
593
594        if (isLoad) {
595            DPRINTFS(MinorMem, (&port), "Copying read data\n");
596            std::memcpy(packet->getPtr<uint8_t>(), data, request.getSize());
597        }
598        packet->makeResponse();
599    }
600
601    /* Packets are all deallocated together in ~SplitLSQRequest */
602}
603
604void
605LSQ::SplitDataRequest::sendNextFragmentToTranslation()
606{
607    unsigned int fragment_index = numTranslatedFragments;
608
609    ThreadContext *thread = port.cpu.getContext(
610        inst->id.threadId);
611
612    DPRINTFS(MinorMem, (&port), "Submitting DTLB request for fragment: %d\n",
613        fragment_index);
614
615    port.numAccessesInDTLB++;
616    numInTranslationFragments++;
617
618    thread->getDTBPtr()->translateTiming(
619        fragmentRequests[fragment_index], thread, this, (isLoad ?
620        BaseTLB::Read : BaseTLB::Write));
621}
622
623bool
624LSQ::StoreBuffer::canInsert() const
625{
626    /* @todo, support store amalgamation */
627    return slots.size() < numSlots;
628}
629
630void
631LSQ::StoreBuffer::deleteRequest(LSQRequestPtr request)
632{
633    auto found = std::find(slots.begin(), slots.end(), request);
634
635    if (found != slots.end()) {
636        DPRINTF(MinorMem, "Deleting request: %s %s %s from StoreBuffer\n",
637            request, *found, *(request->inst));
638        slots.erase(found);
639
640        delete request;
641    }
642}
643
644void
645LSQ::StoreBuffer::insert(LSQRequestPtr request)
646{
647    if (!canInsert()) {
648        warn("%s: store buffer insertion without space to insert from"
649            " inst: %s\n", name(), *(request->inst));
650    }
651
652    DPRINTF(MinorMem, "Pushing store: %s into store buffer\n", request);
653
654    numUnissuedAccesses++;
655
656    if (request->state != LSQRequest::Complete)
657        request->setState(LSQRequest::StoreInStoreBuffer);
658
659    slots.push_back(request);
660
661    /* Let's try and wake up the processor for the next cycle to step
662     *  the store buffer */
663    lsq.cpu.wakeupOnEvent(Pipeline::ExecuteStageId);
664}
665
666LSQ::AddrRangeCoverage
667LSQ::StoreBuffer::canForwardDataToLoad(LSQRequestPtr request,
668    unsigned int &found_slot)
669{
670    unsigned int slot_index = slots.size() - 1;
671    auto i = slots.rbegin();
672    AddrRangeCoverage ret = NoAddrRangeCoverage;
673
674    /* Traverse the store buffer in reverse order (most to least recent)
675     *  and try to find a slot whose address range overlaps this request */
676    while (ret == NoAddrRangeCoverage && i != slots.rend()) {
677        LSQRequestPtr slot = *i;
678
679        if (slot->packet) {
680            AddrRangeCoverage coverage = slot->containsAddrRangeOf(request);
681
682            if (coverage != NoAddrRangeCoverage) {
683                DPRINTF(MinorMem, "Forwarding: slot: %d result: %s thisAddr:"
684                    " 0x%x thisSize: %d slotAddr: 0x%x slotSize: %d\n",
685                    slot_index, coverage,
686                    request->request.getPaddr(), request->request.getSize(),
687                    slot->request.getPaddr(), slot->request.getSize());
688
689                found_slot = slot_index;
690                ret = coverage;
691            }
692        }
693
694        i++;
695        slot_index--;
696    }
697
698    return ret;
699}
700
701/** Fill the given packet with appropriate date from slot slot_number */
702void
703LSQ::StoreBuffer::forwardStoreData(LSQRequestPtr load,
704    unsigned int slot_number)
705{
706    assert(slot_number < slots.size());
707    assert(load->packet);
708    assert(load->isLoad);
709
710    LSQRequestPtr store = slots[slot_number];
711
712    assert(store->packet);
713    assert(store->containsAddrRangeOf(load) == FullAddrRangeCoverage);
714
715    Addr load_addr = load->request.getPaddr();
716    Addr store_addr = store->request.getPaddr();
717    Addr addr_offset = load_addr - store_addr;
718
719    unsigned int load_size = load->request.getSize();
720
721    DPRINTF(MinorMem, "Forwarding %d bytes for addr: 0x%x from store buffer"
722        " slot: %d addr: 0x%x addressOffset: 0x%x\n",
723        load_size, load_addr, slot_number,
724        store_addr, addr_offset);
725
726    void *load_packet_data = load->packet->getPtr<void>();
727    void *store_packet_data = store->packet->getPtr<uint8_t>() + addr_offset;
728
729    std::memcpy(load_packet_data, store_packet_data, load_size);
730}
731
732void
733LSQ::StoreBuffer::countIssuedStore(LSQRequestPtr request)
734{
735    /* Barriers are accounted for as they are cleared from
736     *  the queue, not after their transfers are complete */
737    if (!request->isBarrier())
738        numUnissuedAccesses--;
739}
740
741void
742LSQ::StoreBuffer::step()
743{
744    DPRINTF(MinorMem, "StoreBuffer step numUnissuedAccesses: %d\n",
745        numUnissuedAccesses);
746
747    if (numUnissuedAccesses != 0 && lsq.state == LSQ::MemoryRunning) {
748        /* Clear all the leading barriers */
749        while (!slots.empty() &&
750            slots.front()->isComplete() && slots.front()->isBarrier())
751        {
752            LSQRequestPtr barrier = slots.front();
753
754            DPRINTF(MinorMem, "Clearing barrier for inst: %s\n",
755                *(barrier->inst));
756
757            numUnissuedAccesses--;
758            lsq.clearMemBarrier(barrier->inst);
759            slots.pop_front();
760
761            delete barrier;
762        }
763
764        auto i = slots.begin();
765        bool issued = true;
766        unsigned int issue_count = 0;
767
768        /* Skip trying if the memory system is busy */
769        if (lsq.state == LSQ::MemoryNeedsRetry)
770            issued = false;
771
772        /* Try to issue all stores in order starting from the head
773         *  of the queue.  Responses are allowed to be retired
774         *  out of order */
775        while (issued &&
776            issue_count < storeLimitPerCycle &&
777            lsq.canSendToMemorySystem() &&
778            i != slots.end())
779        {
780            LSQRequestPtr request = *i;
781
782            DPRINTF(MinorMem, "Considering request: %s, sentAllPackets: %d"
783                " state: %s\n",
784                *(request->inst), request->sentAllPackets(),
785                request->state);
786
787            if (request->isBarrier() && request->isComplete()) {
788                /* Give up at barriers */
789                issued = false;
790            } else if (!(request->state == LSQRequest::StoreBufferIssuing &&
791                request->sentAllPackets()))
792            {
793                DPRINTF(MinorMem, "Trying to send request: %s to memory"
794                    " system\n", *(request->inst));
795
796                if (lsq.tryToSend(request)) {
797                    countIssuedStore(request);
798                    issue_count++;
799                } else {
800                    /* Don't step on to the next store buffer entry if this
801                     *  one hasn't issued all its packets as the store
802                     *  buffer must still enforce ordering */
803                    issued = false;
804                }
805            }
806            i++;
807        }
808    }
809}
810
811void
812LSQ::completeMemBarrierInst(MinorDynInstPtr inst,
813    bool committed)
814{
815    if (committed) {
816        /* Not already sent to the store buffer as a store request? */
817        if (!inst->inStoreBuffer) {
818            /* Insert an entry into the store buffer to tick off barriers
819             *  until there are none in flight */
820            storeBuffer.insert(new BarrierDataRequest(*this, inst));
821        }
822    } else {
823        /* Clear the barrier anyway if it wasn't actually committed */
824        clearMemBarrier(inst);
825    }
826}
827
828void
829LSQ::StoreBuffer::minorTrace() const
830{
831    unsigned int size = slots.size();
832    unsigned int i = 0;
833    std::ostringstream os;
834
835    while (i < size) {
836        LSQRequestPtr request = slots[i];
837
838        request->reportData(os);
839
840        i++;
841        if (i < numSlots)
842            os << ',';
843    }
844
845    while (i < numSlots) {
846        os << '-';
847
848        i++;
849        if (i < numSlots)
850            os << ',';
851    }
852
853    MINORTRACE("addr=%s num_unissued_stores=%d\n", os.str(),
854        numUnissuedAccesses);
855}
856
857void
858LSQ::tryToSendToTransfers(LSQRequestPtr request)
859{
860    if (state == MemoryNeedsRetry) {
861        DPRINTF(MinorMem, "Request needs retry, not issuing to"
862            " memory until retry arrives\n");
863        return;
864    }
865
866    if (request->state == LSQRequest::InTranslation) {
867        DPRINTF(MinorMem, "Request still in translation, not issuing to"
868            " memory\n");
869        return;
870    }
871
872    assert(request->state == LSQRequest::Translated ||
873        request->state == LSQRequest::RequestIssuing ||
874        request->state == LSQRequest::Failed ||
875        request->state == LSQRequest::Complete);
876
877    if (requests.empty() || requests.front() != request) {
878        DPRINTF(MinorMem, "Request not at front of requests queue, can't"
879            " issue to memory\n");
880        return;
881    }
882
883    if (transfers.unreservedRemainingSpace() == 0) {
884        DPRINTF(MinorMem, "No space to insert request into transfers"
885            " queue\n");
886        return;
887    }
888
889    if (request->isComplete() || request->state == LSQRequest::Failed) {
890        DPRINTF(MinorMem, "Passing a %s transfer on to transfers"
891            " queue\n", (request->isComplete() ? "completed" : "failed"));
892        request->setState(LSQRequest::Complete);
893        request->setSkipped();
894        moveFromRequestsToTransfers(request);
895        return;
896    }
897
898    if (!execute.instIsRightStream(request->inst)) {
899        /* Wrong stream, try to abort the transfer but only do so if
900         *  there are no packets in flight */
901        if (request->hasPacketsInMemSystem()) {
902            DPRINTF(MinorMem, "Request's inst. is from the wrong stream,"
903                " waiting for responses before aborting request\n");
904        } else {
905            DPRINTF(MinorMem, "Request's inst. is from the wrong stream,"
906                " aborting request\n");
907            request->setState(LSQRequest::Complete);
908            request->setSkipped();
909            moveFromRequestsToTransfers(request);
910        }
911        return;
912    }
913
914    if (request->fault != NoFault) {
915        if (request->inst->staticInst->isPrefetch()) {
916            DPRINTF(MinorMem, "Not signalling fault for faulting prefetch\n");
917        }
918        DPRINTF(MinorMem, "Moving faulting request into the transfers"
919            " queue\n");
920        request->setState(LSQRequest::Complete);
921        request->setSkipped();
922        moveFromRequestsToTransfers(request);
923        return;
924    }
925
926    bool is_load = request->isLoad;
927    bool is_llsc = request->request.isLLSC();
928    bool is_swap = request->request.isSwap();
929    bool bufferable = !(request->request.isStrictlyOrdered() ||
930        is_llsc || is_swap);
931
932    if (is_load) {
933        if (numStoresInTransfers != 0) {
934            DPRINTF(MinorMem, "Load request with stores still in transfers"
935                " queue, stalling\n");
936            return;
937        }
938    } else {
939        /* Store.  Can it be sent to the store buffer? */
940        if (bufferable && !request->request.isMmappedIpr()) {
941            request->setState(LSQRequest::StoreToStoreBuffer);
942            moveFromRequestsToTransfers(request);
943            DPRINTF(MinorMem, "Moving store into transfers queue\n");
944            return;
945        }
946    }
947
948    /* Check if this is the head instruction (and so must be executable as
949     *  its stream sequence number was checked above) for loads which must
950     *  not be speculatively issued and stores which must be issued here */
951    if (!bufferable) {
952        if (!execute.instIsHeadInst(request->inst)) {
953            DPRINTF(MinorMem, "Memory access not the head inst., can't be"
954                " sure it can be performed, not issuing\n");
955            return;
956        }
957
958        unsigned int forwarding_slot = 0;
959
960        if (storeBuffer.canForwardDataToLoad(request, forwarding_slot) !=
961            NoAddrRangeCoverage)
962        {
963            DPRINTF(MinorMem, "Memory access can receive forwarded data"
964                " from the store buffer, need to wait for store buffer to"
965                " drain\n");
966            return;
967        }
968    }
969
970    /* True: submit this packet to the transfers queue to be sent to the
971     * memory system.
972     * False: skip the memory and push a packet for this request onto
973     * requests */
974    bool do_access = true;
975
976    if (!is_llsc) {
977        /* Check for match in the store buffer */
978        if (is_load) {
979            unsigned int forwarding_slot = 0;
980            AddrRangeCoverage forwarding_result =
981                storeBuffer.canForwardDataToLoad(request,
982                forwarding_slot);
983
984            switch (forwarding_result) {
985              case FullAddrRangeCoverage:
986                /* Forward data from the store buffer into this request and
987                 *  repurpose this request's packet into a response packet */
988                storeBuffer.forwardStoreData(request, forwarding_slot);
989                request->packet->makeResponse();
990
991                /* Just move between queues, no access */
992                do_access = false;
993                break;
994              case PartialAddrRangeCoverage:
995                DPRINTF(MinorMem, "Load partly satisfied by store buffer"
996                    " data. Must wait for the store to complete\n");
997                return;
998                break;
999              case NoAddrRangeCoverage:
1000                DPRINTF(MinorMem, "No forwardable data from store buffer\n");
1001                /* Fall through to try access */
1002                break;
1003            }
1004        }
1005    } else {
1006        if (!canSendToMemorySystem()) {
1007            DPRINTF(MinorMem, "Can't send request to memory system yet\n");
1008            return;
1009        }
1010
1011        SimpleThread &thread = *cpu.threads[request->inst->id.threadId];
1012
1013        TheISA::PCState old_pc = thread.pcState();
1014        ExecContext context(cpu, thread, execute, request->inst);
1015
1016        /* Handle LLSC requests and tests */
1017        if (is_load) {
1018            TheISA::handleLockedRead(&context, &request->request);
1019        } else {
1020            do_access = TheISA::handleLockedWrite(&context,
1021                &request->request, cacheBlockMask);
1022
1023            if (!do_access) {
1024                DPRINTF(MinorMem, "Not perfoming a memory "
1025                    "access for store conditional\n");
1026            }
1027        }
1028        thread.pcState(old_pc);
1029    }
1030
1031    /* See the do_access comment above */
1032    if (do_access) {
1033        if (!canSendToMemorySystem()) {
1034            DPRINTF(MinorMem, "Can't send request to memory system yet\n");
1035            return;
1036        }
1037
1038        /* Remember if this is an access which can't be idly
1039         *  discarded by an interrupt */
1040        if (!bufferable && !request->issuedToMemory) {
1041            numAccessesIssuedToMemory++;
1042            request->issuedToMemory = true;
1043        }
1044
1045        if (tryToSend(request))
1046            moveFromRequestsToTransfers(request);
1047    } else {
1048        request->setState(LSQRequest::Complete);
1049        moveFromRequestsToTransfers(request);
1050    }
1051}
1052
1053bool
1054LSQ::tryToSend(LSQRequestPtr request)
1055{
1056    bool ret = false;
1057
1058    if (!canSendToMemorySystem()) {
1059        DPRINTF(MinorMem, "Can't send request: %s yet, no space in memory\n",
1060            *(request->inst));
1061    } else {
1062        PacketPtr packet = request->getHeadPacket();
1063
1064        DPRINTF(MinorMem, "Trying to send request: %s addr: 0x%x\n",
1065            *(request->inst), packet->req->getVaddr());
1066
1067        /* The sender state of the packet *must* be an LSQRequest
1068         *  so the response can be correctly handled */
1069        assert(packet->findNextSenderState<LSQRequest>());
1070
1071        if (request->request.isMmappedIpr()) {
1072            ThreadContext *thread =
1073                cpu.getContext(request->request.threadId());
1074
1075            if (request->isLoad) {
1076                DPRINTF(MinorMem, "IPR read inst: %s\n", *(request->inst));
1077                TheISA::handleIprRead(thread, packet);
1078            } else {
1079                DPRINTF(MinorMem, "IPR write inst: %s\n", *(request->inst));
1080                TheISA::handleIprWrite(thread, packet);
1081            }
1082
1083            request->stepToNextPacket();
1084            ret = request->sentAllPackets();
1085
1086            if (!ret) {
1087                DPRINTF(MinorMem, "IPR access has another packet: %s\n",
1088                    *(request->inst));
1089            }
1090
1091            if (ret)
1092                request->setState(LSQRequest::Complete);
1093            else
1094                request->setState(LSQRequest::RequestIssuing);
1095        } else if (dcachePort.sendTimingReq(packet)) {
1096            DPRINTF(MinorMem, "Sent data memory request\n");
1097
1098            numAccessesInMemorySystem++;
1099
1100            request->stepToNextPacket();
1101
1102            ret = request->sentAllPackets();
1103
1104            switch (request->state) {
1105              case LSQRequest::Translated:
1106              case LSQRequest::RequestIssuing:
1107                /* Fully or partially issued a request in the transfers
1108                 *  queue */
1109                request->setState(LSQRequest::RequestIssuing);
1110                break;
1111              case LSQRequest::StoreInStoreBuffer:
1112              case LSQRequest::StoreBufferIssuing:
1113                /* Fully or partially issued a request in the store
1114                 *  buffer */
1115                request->setState(LSQRequest::StoreBufferIssuing);
1116                break;
1117              default:
1118                assert(false);
1119                break;
1120            }
1121
1122            state = MemoryRunning;
1123        } else {
1124            DPRINTF(MinorMem,
1125                "Sending data memory request - needs retry\n");
1126
1127            /* Needs to be resent, wait for that */
1128            state = MemoryNeedsRetry;
1129            retryRequest = request;
1130
1131            switch (request->state) {
1132              case LSQRequest::Translated:
1133              case LSQRequest::RequestIssuing:
1134                request->setState(LSQRequest::RequestNeedsRetry);
1135                break;
1136              case LSQRequest::StoreInStoreBuffer:
1137              case LSQRequest::StoreBufferIssuing:
1138                request->setState(LSQRequest::StoreBufferNeedsRetry);
1139                break;
1140              default:
1141                assert(false);
1142                break;
1143            }
1144        }
1145    }
1146
1147    return ret;
1148}
1149
1150void
1151LSQ::moveFromRequestsToTransfers(LSQRequestPtr request)
1152{
1153    assert(!requests.empty() && requests.front() == request);
1154    assert(transfers.unreservedRemainingSpace() != 0);
1155
1156    /* Need to count the number of stores in the transfers
1157     *  queue so that loads know when their store buffer forwarding
1158     *  results will be correct (only when all those stores
1159     *  have reached the store buffer) */
1160    if (!request->isLoad)
1161        numStoresInTransfers++;
1162
1163    requests.pop();
1164    transfers.push(request);
1165}
1166
1167bool
1168LSQ::canSendToMemorySystem()
1169{
1170    return state == MemoryRunning &&
1171        numAccessesInMemorySystem < inMemorySystemLimit;
1172}
1173
1174bool
1175LSQ::recvTimingResp(PacketPtr response)
1176{
1177    LSQRequestPtr request =
1178        safe_cast<LSQRequestPtr>(response->popSenderState());
1179
1180    DPRINTF(MinorMem, "Received response packet inst: %s"
1181        " addr: 0x%x cmd: %s\n",
1182        *(request->inst), response->getAddr(),
1183        response->cmd.toString());
1184
1185    numAccessesInMemorySystem--;
1186
1187    if (response->isError()) {
1188        DPRINTF(MinorMem, "Received error response packet: %s\n",
1189            *request->inst);
1190    }
1191
1192    switch (request->state) {
1193      case LSQRequest::RequestIssuing:
1194      case LSQRequest::RequestNeedsRetry:
1195        /* Response to a request from the transfers queue */
1196        request->retireResponse(response);
1197
1198        DPRINTF(MinorMem, "Has outstanding packets?: %d %d\n",
1199            request->hasPacketsInMemSystem(), request->isComplete());
1200
1201        break;
1202      case LSQRequest::StoreBufferIssuing:
1203      case LSQRequest::StoreBufferNeedsRetry:
1204        /* Response to a request from the store buffer */
1205        request->retireResponse(response);
1206
1207        /* Remove completed requests unless they are barriers (which will
1208         *  need to be removed in order */
1209        if (request->isComplete()) {
1210            if (!request->isBarrier()) {
1211                storeBuffer.deleteRequest(request);
1212            } else {
1213                DPRINTF(MinorMem, "Completed transfer for barrier: %s"
1214                    " leaving the request as it is also a barrier\n",
1215                    *(request->inst));
1216            }
1217        }
1218        break;
1219      default:
1220        /* Shouldn't be allowed to receive a response from another
1221         *  state */
1222        assert(false);
1223        break;
1224    }
1225
1226    /* We go to idle even if there are more things in the requests queue
1227     * as it's the job of step to actually step us on to the next
1228     * transaction */
1229
1230    /* Let's try and wake up the processor for the next cycle */
1231    cpu.wakeupOnEvent(Pipeline::ExecuteStageId);
1232
1233    /* Never busy */
1234    return true;
1235}
1236
1237void
1238LSQ::recvReqRetry()
1239{
1240    DPRINTF(MinorMem, "Received retry request\n");
1241
1242    assert(state == MemoryNeedsRetry);
1243
1244    switch (retryRequest->state) {
1245      case LSQRequest::RequestNeedsRetry:
1246        /* Retry in the requests queue */
1247        retryRequest->setState(LSQRequest::Translated);
1248        break;
1249      case LSQRequest::StoreBufferNeedsRetry:
1250        /* Retry in the store buffer */
1251        retryRequest->setState(LSQRequest::StoreInStoreBuffer);
1252        break;
1253      default:
1254        assert(false);
1255    }
1256
1257    /* Set state back to MemoryRunning so that the following
1258     *  tryToSend can actually send.  Note that this won't
1259     *  allow another transfer in as tryToSend should
1260     *  issue a memory request and either succeed for this
1261     *  request or return the LSQ back to MemoryNeedsRetry */
1262    state = MemoryRunning;
1263
1264    /* Try to resend the request */
1265    if (tryToSend(retryRequest)) {
1266        /* Successfully sent, need to move the request */
1267        switch (retryRequest->state) {
1268          case LSQRequest::RequestIssuing:
1269            /* In the requests queue */
1270            moveFromRequestsToTransfers(retryRequest);
1271            break;
1272          case LSQRequest::StoreBufferIssuing:
1273            /* In the store buffer */
1274            storeBuffer.countIssuedStore(retryRequest);
1275            break;
1276          default:
1277            assert(false);
1278            break;
1279        }
1280
1281        retryRequest = NULL;
1282    }
1283}
1284
1285LSQ::LSQ(std::string name_, std::string dcache_port_name_,
1286    MinorCPU &cpu_, Execute &execute_,
1287    unsigned int in_memory_system_limit, unsigned int line_width,
1288    unsigned int requests_queue_size, unsigned int transfers_queue_size,
1289    unsigned int store_buffer_size,
1290    unsigned int store_buffer_cycle_store_limit) :
1291    Named(name_),
1292    cpu(cpu_),
1293    execute(execute_),
1294    dcachePort(dcache_port_name_, *this, cpu_),
1295    lastMemBarrier(0),
1296    state(MemoryRunning),
1297    inMemorySystemLimit(in_memory_system_limit),
1298    lineWidth((line_width == 0 ? cpu.cacheLineSize() : line_width)),
1299    requests(name_ + ".requests", "addr", requests_queue_size),
1300    transfers(name_ + ".transfers", "addr", transfers_queue_size),
1301    storeBuffer(name_ + ".storeBuffer",
1302        *this, store_buffer_size, store_buffer_cycle_store_limit),
1303    numAccessesInMemorySystem(0),
1304    numAccessesInDTLB(0),
1305    numStoresInTransfers(0),
1306    numAccessesIssuedToMemory(0),
1307    retryRequest(NULL),
1308    cacheBlockMask(~(cpu_.cacheLineSize() - 1))
1309{
1310    if (in_memory_system_limit < 1) {
1311        fatal("%s: executeMaxAccessesInMemory must be >= 1 (%d)\n", name_,
1312            in_memory_system_limit);
1313    }
1314
1315    if (store_buffer_cycle_store_limit < 1) {
1316        fatal("%s: executeLSQMaxStoreBufferStoresPerCycle must be"
1317            " >= 1 (%d)\n", name_, store_buffer_cycle_store_limit);
1318    }
1319
1320    if (requests_queue_size < 1) {
1321        fatal("%s: executeLSQRequestsQueueSize must be"
1322            " >= 1 (%d)\n", name_, requests_queue_size);
1323    }
1324
1325    if (transfers_queue_size < 1) {
1326        fatal("%s: executeLSQTransfersQueueSize must be"
1327            " >= 1 (%d)\n", name_, transfers_queue_size);
1328    }
1329
1330    if (store_buffer_size < 1) {
1331        fatal("%s: executeLSQStoreBufferSize must be"
1332            " >= 1 (%d)\n", name_, store_buffer_size);
1333    }
1334
1335    if ((lineWidth & (lineWidth - 1)) != 0) {
1336        fatal("%s: lineWidth: %d must be a power of 2\n", name(), lineWidth);
1337    }
1338}
1339
1340LSQ::~LSQ()
1341{ }
1342
1343LSQ::LSQRequest::~LSQRequest()
1344{
1345    if (packet)
1346        delete packet;
1347    if (data)
1348        delete [] data;
1349}
1350
1351/**
1352 *  Step the memory access mechanism on to its next state.  In reality, most
1353 *  of the stepping is done by the callbacks on the LSQ but this
1354 *  function is responsible for issuing memory requests lodged in the
1355 *  requests queue.
1356 */
1357void
1358LSQ::step()
1359{
1360    /* Try to move address-translated requests between queues and issue
1361     *  them */
1362    if (!requests.empty())
1363        tryToSendToTransfers(requests.front());
1364
1365    storeBuffer.step();
1366}
1367
1368LSQ::LSQRequestPtr
1369LSQ::findResponse(MinorDynInstPtr inst)
1370{
1371    LSQ::LSQRequestPtr ret = NULL;
1372
1373    if (!transfers.empty()) {
1374        LSQRequestPtr request = transfers.front();
1375
1376        /* Same instruction and complete access or a store that's
1377         *  capable of being moved to the store buffer */
1378        if (request->inst->id == inst->id) {
1379            bool complete = request->isComplete();
1380            bool can_store = storeBuffer.canInsert();
1381            bool to_store_buffer = request->state ==
1382                LSQRequest::StoreToStoreBuffer;
1383
1384            if ((complete && !(request->isBarrier() && !can_store)) ||
1385                (to_store_buffer && can_store))
1386            {
1387                ret = request;
1388            }
1389        }
1390    }
1391
1392    if (ret) {
1393        DPRINTF(MinorMem, "Found matching memory response for inst: %s\n",
1394            *inst);
1395    } else {
1396        DPRINTF(MinorMem, "No matching memory response for inst: %s\n",
1397            *inst);
1398    }
1399
1400    return ret;
1401}
1402
1403void
1404LSQ::popResponse(LSQ::LSQRequestPtr response)
1405{
1406    assert(!transfers.empty() && transfers.front() == response);
1407
1408    transfers.pop();
1409
1410    if (!response->isLoad)
1411        numStoresInTransfers--;
1412
1413    if (response->issuedToMemory)
1414        numAccessesIssuedToMemory--;
1415
1416    if (response->state != LSQRequest::StoreInStoreBuffer) {
1417        DPRINTF(MinorMem, "Deleting %s request: %s\n",
1418            (response->isLoad ? "load" : "store"),
1419            *(response->inst));
1420
1421        delete response;
1422    }
1423}
1424
1425void
1426LSQ::sendStoreToStoreBuffer(LSQRequestPtr request)
1427{
1428    assert(request->state == LSQRequest::StoreToStoreBuffer);
1429
1430    DPRINTF(MinorMem, "Sending store: %s to store buffer\n",
1431        *(request->inst));
1432
1433    request->inst->inStoreBuffer = true;
1434
1435    storeBuffer.insert(request);
1436}
1437
1438bool
1439LSQ::isDrained()
1440{
1441    return requests.empty() && transfers.empty() &&
1442        storeBuffer.isDrained();
1443}
1444
1445bool
1446LSQ::needsToTick()
1447{
1448    bool ret = false;
1449
1450    if (canSendToMemorySystem()) {
1451        bool have_translated_requests = !requests.empty() &&
1452            requests.front()->state != LSQRequest::InTranslation &&
1453            transfers.unreservedRemainingSpace() != 0;
1454
1455        ret = have_translated_requests ||
1456            storeBuffer.numUnissuedStores() != 0;
1457    }
1458
1459    if (ret)
1460        DPRINTF(Activity, "Need to tick\n");
1461
1462    return ret;
1463}
1464
1465void
1466LSQ::pushRequest(MinorDynInstPtr inst, bool isLoad, uint8_t *data,
1467    unsigned int size, Addr addr, unsigned int flags, uint64_t *res)
1468{
1469    bool needs_burst = transferNeedsBurst(addr, size, lineWidth);
1470    LSQRequestPtr request;
1471
1472    /* Copy given data into the request.  The request will pass this to the
1473     *  packet and then it will own the data */
1474    uint8_t *request_data = NULL;
1475
1476    DPRINTF(MinorMem, "Pushing request (%s) addr: 0x%x size: %d flags:"
1477        " 0x%x%s lineWidth : 0x%x\n",
1478        (isLoad ? "load" : "store"), addr, size, flags,
1479            (needs_burst ? " (needs burst)" : ""), lineWidth);
1480
1481    if (!isLoad) {
1482        /* request_data becomes the property of a ...DataRequest (see below)
1483         *  and destroyed by its destructor */
1484        request_data = new uint8_t[size];
1485        if (flags & Request::CACHE_BLOCK_ZERO) {
1486            /* For cache zeroing, just use zeroed data */
1487            std::memset(request_data, 0, size);
1488        } else {
1489            std::memcpy(request_data, data, size);
1490        }
1491    }
1492
1493    if (needs_burst) {
1494        request = new SplitDataRequest(
1495            *this, inst, isLoad, request_data, res);
1496    } else {
1497        request = new SingleDataRequest(
1498            *this, inst, isLoad, request_data, res);
1499    }
1500
1501    if (inst->traceData)
1502        inst->traceData->setMem(addr, size, flags);
1503
1504    int cid = cpu.threads[inst->id.threadId]->getTC()->contextId();
1505    request->request.setThreadContext(cid, /* thread id */ 0);
1506    request->request.setVirt(0 /* asid */,
1507        addr, size, flags, cpu.dataMasterId(),
1508        /* I've no idea why we need the PC, but give it */
1509        inst->pc.instAddr());
1510
1511    requests.push(request);
1512    request->startAddrTranslation();
1513}
1514
1515void
1516LSQ::pushFailedRequest(MinorDynInstPtr inst)
1517{
1518    LSQRequestPtr request = new FailedDataRequest(*this, inst);
1519    requests.push(request);
1520}
1521
1522void
1523LSQ::minorTrace() const
1524{
1525    MINORTRACE("state=%s in_tlb_mem=%d/%d stores_in_transfers=%d"
1526        " lastMemBarrier=%d\n",
1527        state, numAccessesInDTLB, numAccessesInMemorySystem,
1528        numStoresInTransfers, lastMemBarrier);
1529    requests.minorTrace();
1530    transfers.minorTrace();
1531    storeBuffer.minorTrace();
1532}
1533
1534LSQ::StoreBuffer::StoreBuffer(std::string name_, LSQ &lsq_,
1535    unsigned int store_buffer_size,
1536    unsigned int store_limit_per_cycle) :
1537    Named(name_), lsq(lsq_),
1538    numSlots(store_buffer_size),
1539    storeLimitPerCycle(store_limit_per_cycle),
1540    slots(),
1541    numUnissuedAccesses(0)
1542{
1543}
1544
1545PacketPtr
1546makePacketForRequest(Request &request, bool isLoad,
1547    Packet::SenderState *sender_state, PacketDataPtr data)
1548{
1549    PacketPtr ret = isLoad ? Packet::createRead(&request)
1550                           : Packet::createWrite(&request);
1551
1552    if (sender_state)
1553        ret->pushSenderState(sender_state);
1554
1555    if (isLoad)
1556        ret->allocate();
1557    else
1558        ret->dataDynamic(data);
1559
1560    return ret;
1561}
1562
1563void
1564LSQ::issuedMemBarrierInst(MinorDynInstPtr inst)
1565{
1566    assert(inst->isInst() && inst->staticInst->isMemBarrier());
1567    assert(inst->id.execSeqNum > lastMemBarrier);
1568
1569    /* Remember the barrier.  We only have a notion of one
1570     *  barrier so this may result in some mem refs being
1571     *  delayed if they are between barriers */
1572    lastMemBarrier = inst->id.execSeqNum;
1573}
1574
1575void
1576LSQ::LSQRequest::makePacket()
1577{
1578    /* Make the function idempotent */
1579    if (packet)
1580        return;
1581
1582    // if the translation faulted, do not create a packet
1583    if (fault != NoFault) {
1584        assert(packet == NULL);
1585        return;
1586    }
1587
1588    packet = makePacketForRequest(request, isLoad, this, data);
1589    /* Null the ret data so we know not to deallocate it when the
1590     * ret is destroyed.  The data now belongs to the ret and
1591     * the ret is responsible for its destruction */
1592    data = NULL;
1593}
1594
1595std::ostream &
1596operator <<(std::ostream &os, LSQ::MemoryState state)
1597{
1598    switch (state) {
1599      case LSQ::MemoryRunning:
1600        os << "MemoryRunning";
1601        break;
1602      case LSQ::MemoryNeedsRetry:
1603        os << "MemoryNeedsRetry";
1604        break;
1605      default:
1606        os << "MemoryState-" << static_cast<int>(state);
1607        break;
1608    }
1609    return os;
1610}
1611
1612void
1613LSQ::recvTimingSnoopReq(PacketPtr pkt)
1614{
1615    /* LLSC operations in Minor can't be speculative and are executed from
1616     * the head of the requests queue.  We shouldn't need to do more than
1617     * this action on snoops. */
1618
1619    /* THREAD */
1620    if (pkt->isInvalidate() || pkt->isWrite()) {
1621        TheISA::handleLockedSnoop(cpu.getContext(0), pkt, cacheBlockMask);
1622    }
1623}
1624
1625}
1626