schedule_stage.cc (11308:7d8836fd043d) schedule_stage.cc (12696:15d4edfbb01b)
1/*
2 * Copyright (c) 2014-2015 Advanced Micro Devices, Inc.
3 * All rights reserved.
4 *
5 * For use for simulation and test purposes only
6 *
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions are met:
9 *
10 * 1. Redistributions of source code must retain the above copyright notice,
11 * this list of conditions and the following disclaimer.
12 *
13 * 2. Redistributions in binary form must reproduce the above copyright notice,
14 * this list of conditions and the following disclaimer in the documentation
15 * and/or other materials provided with the distribution.
16 *
17 * 3. Neither the name of the copyright holder nor the names of its contributors
18 * may be used to endorse or promote products derived from this software
19 * without specific prior written permission.
20 *
21 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
22 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
25 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
28 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
29 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
30 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
31 * POSSIBILITY OF SUCH DAMAGE.
32 *
33 * Author: Sooraj Puthoor
34 */
35
36#include "gpu-compute/schedule_stage.hh"
37
38#include "gpu-compute/compute_unit.hh"
39#include "gpu-compute/gpu_static_inst.hh"
40#include "gpu-compute/vector_register_file.hh"
41#include "gpu-compute/wavefront.hh"
42
43ScheduleStage::ScheduleStage(const ComputeUnitParams *p)
44 : numSIMDs(p->num_SIMDs),
45 numMemUnits(p->num_global_mem_pipes + p->num_shared_mem_pipes)
46{
47 for (int j = 0; j < numSIMDs + numMemUnits; ++j) {
1/*
2 * Copyright (c) 2014-2015 Advanced Micro Devices, Inc.
3 * All rights reserved.
4 *
5 * For use for simulation and test purposes only
6 *
7 * Redistribution and use in source and binary forms, with or without
8 * modification, are permitted provided that the following conditions are met:
9 *
10 * 1. Redistributions of source code must retain the above copyright notice,
11 * this list of conditions and the following disclaimer.
12 *
13 * 2. Redistributions in binary form must reproduce the above copyright notice,
14 * this list of conditions and the following disclaimer in the documentation
15 * and/or other materials provided with the distribution.
16 *
17 * 3. Neither the name of the copyright holder nor the names of its contributors
18 * may be used to endorse or promote products derived from this software
19 * without specific prior written permission.
20 *
21 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
22 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
23 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
24 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
25 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
26 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
27 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
28 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
29 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
30 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
31 * POSSIBILITY OF SUCH DAMAGE.
32 *
33 * Author: Sooraj Puthoor
34 */
35
36#include "gpu-compute/schedule_stage.hh"
37
38#include "gpu-compute/compute_unit.hh"
39#include "gpu-compute/gpu_static_inst.hh"
40#include "gpu-compute/vector_register_file.hh"
41#include "gpu-compute/wavefront.hh"
42
43ScheduleStage::ScheduleStage(const ComputeUnitParams *p)
44 : numSIMDs(p->num_SIMDs),
45 numMemUnits(p->num_global_mem_pipes + p->num_shared_mem_pipes)
46{
47 for (int j = 0; j < numSIMDs + numMemUnits; ++j) {
48 Scheduler newScheduler(p);
49 scheduler.push_back(newScheduler);
48 scheduler.emplace_back(p);
50 }
51}
52
53ScheduleStage::~ScheduleStage()
54{
55 scheduler.clear();
56 waveStatusList.clear();
57}
58
59void
60ScheduleStage::init(ComputeUnit *cu)
61{
62 computeUnit = cu;
63 _name = computeUnit->name() + ".ScheduleStage";
64
65 for (int j = 0; j < numSIMDs + numMemUnits; ++j) {
66 scheduler[j].bindList(&computeUnit->readyList[j]);
67 }
68
69 for (int j = 0; j < numSIMDs; ++j) {
70 waveStatusList.push_back(&computeUnit->waveStatusList[j]);
71 }
72
73 dispatchList = &computeUnit->dispatchList;
74}
75
76void
77ScheduleStage::arbitrate()
78{
79 // iterate over all Memory pipelines
80 for (int j = numSIMDs; j < numSIMDs + numMemUnits; ++j) {
81 if (dispatchList->at(j).first) {
82 Wavefront *waveToMemPipe = dispatchList->at(j).first;
83 // iterate over all execution pipelines
84 for (int i = 0; i < numSIMDs + numMemUnits; ++i) {
85 if ((i != j) && (dispatchList->at(i).first)) {
86 Wavefront *waveToExePipe = dispatchList->at(i).first;
87 // if the two selected wavefronts are mapped to the same
88 // SIMD unit then they share the VRF
89 if (waveToMemPipe->simdId == waveToExePipe->simdId) {
90 int simdId = waveToMemPipe->simdId;
91 // Read VRF port arbitration:
92 // If there are read VRF port conflicts between the
93 // a memory and another instruction we drop the other
94 // instruction. We don't need to check for write VRF
95 // port conflicts because the memory instruction either
96 // does not need to write to the VRF (store) or will
97 // write to the VRF when the data comes back (load) in
98 // which case the arbiter of the memory pipes will
99 // resolve any conflicts
100 if (computeUnit->vrf[simdId]->
101 isReadConflict(waveToMemPipe->wfSlotId,
102 waveToExePipe->wfSlotId)) {
103 // FIXME: The "second" member variable is never
104 // used in the model. I am setting it to READY
105 // simply to follow the protocol of setting it
106 // when the WF has an instruction ready to issue
107 waveStatusList[simdId]->at(waveToExePipe->wfSlotId)
108 .second = READY;
109
110 dispatchList->at(i).first = nullptr;
111 dispatchList->at(i).second = EMPTY;
112 break;
113 }
114 }
115 }
116 }
117 }
118 }
119}
120
121void
122ScheduleStage::exec()
123{
124 for (int j = 0; j < numSIMDs + numMemUnits; ++j) {
125 uint32_t readyListSize = computeUnit->readyList[j].size();
126
127 // If no wave is ready to be scheduled on the execution resource
128 // then skip scheduling for this execution resource
129 if (!readyListSize) {
130 continue;
131 }
132
133 Wavefront *waveToBeDispatched = scheduler[j].chooseWave();
134 dispatchList->at(j).first = waveToBeDispatched;
135 waveToBeDispatched->updateResources();
136 dispatchList->at(j).second = FILLED;
137
138 waveStatusList[waveToBeDispatched->simdId]->at(
139 waveToBeDispatched->wfSlotId).second = BLOCKED;
140
141 assert(computeUnit->readyList[j].size() == readyListSize - 1);
142 }
143 // arbitrate over all shared resources among instructions being issued
144 // simultaneously
145 arbitrate();
146}
147
148void
149ScheduleStage::regStats()
150{
151}
49 }
50}
51
52ScheduleStage::~ScheduleStage()
53{
54 scheduler.clear();
55 waveStatusList.clear();
56}
57
58void
59ScheduleStage::init(ComputeUnit *cu)
60{
61 computeUnit = cu;
62 _name = computeUnit->name() + ".ScheduleStage";
63
64 for (int j = 0; j < numSIMDs + numMemUnits; ++j) {
65 scheduler[j].bindList(&computeUnit->readyList[j]);
66 }
67
68 for (int j = 0; j < numSIMDs; ++j) {
69 waveStatusList.push_back(&computeUnit->waveStatusList[j]);
70 }
71
72 dispatchList = &computeUnit->dispatchList;
73}
74
75void
76ScheduleStage::arbitrate()
77{
78 // iterate over all Memory pipelines
79 for (int j = numSIMDs; j < numSIMDs + numMemUnits; ++j) {
80 if (dispatchList->at(j).first) {
81 Wavefront *waveToMemPipe = dispatchList->at(j).first;
82 // iterate over all execution pipelines
83 for (int i = 0; i < numSIMDs + numMemUnits; ++i) {
84 if ((i != j) && (dispatchList->at(i).first)) {
85 Wavefront *waveToExePipe = dispatchList->at(i).first;
86 // if the two selected wavefronts are mapped to the same
87 // SIMD unit then they share the VRF
88 if (waveToMemPipe->simdId == waveToExePipe->simdId) {
89 int simdId = waveToMemPipe->simdId;
90 // Read VRF port arbitration:
91 // If there are read VRF port conflicts between the
92 // a memory and another instruction we drop the other
93 // instruction. We don't need to check for write VRF
94 // port conflicts because the memory instruction either
95 // does not need to write to the VRF (store) or will
96 // write to the VRF when the data comes back (load) in
97 // which case the arbiter of the memory pipes will
98 // resolve any conflicts
99 if (computeUnit->vrf[simdId]->
100 isReadConflict(waveToMemPipe->wfSlotId,
101 waveToExePipe->wfSlotId)) {
102 // FIXME: The "second" member variable is never
103 // used in the model. I am setting it to READY
104 // simply to follow the protocol of setting it
105 // when the WF has an instruction ready to issue
106 waveStatusList[simdId]->at(waveToExePipe->wfSlotId)
107 .second = READY;
108
109 dispatchList->at(i).first = nullptr;
110 dispatchList->at(i).second = EMPTY;
111 break;
112 }
113 }
114 }
115 }
116 }
117 }
118}
119
120void
121ScheduleStage::exec()
122{
123 for (int j = 0; j < numSIMDs + numMemUnits; ++j) {
124 uint32_t readyListSize = computeUnit->readyList[j].size();
125
126 // If no wave is ready to be scheduled on the execution resource
127 // then skip scheduling for this execution resource
128 if (!readyListSize) {
129 continue;
130 }
131
132 Wavefront *waveToBeDispatched = scheduler[j].chooseWave();
133 dispatchList->at(j).first = waveToBeDispatched;
134 waveToBeDispatched->updateResources();
135 dispatchList->at(j).second = FILLED;
136
137 waveStatusList[waveToBeDispatched->simdId]->at(
138 waveToBeDispatched->wfSlotId).second = BLOCKED;
139
140 assert(computeUnit->readyList[j].size() == readyListSize - 1);
141 }
142 // arbitrate over all shared resources among instructions being issued
143 // simultaneously
144 arbitrate();
145}
146
147void
148ScheduleStage::regStats()
149{
150}