/*
 * Copyright (c) 2014-2015 Advanced Micro Devices, Inc.
 * All rights reserved.
 *
 * For use for simulation and test purposes only
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 * 1. Redistributions of source code must retain the above copyright notice,
 * this list of conditions and the following disclaimer.
 *
 * 2. Redistributions in binary form must reproduce the above copyright notice,
 * this list of conditions and the following disclaimer in the documentation
 * and/or other materials provided with the distribution.
 *
 * 3. Neither the name of the copyright holder nor the names of its
 * contributors may be used to endorse or promote products derived from this
 * software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
 * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
 * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
 * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
 * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
 * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
 * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
 * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
 * POSSIBILITY OF SUCH DAMAGE.
 *
 * Authors: John Kalamatianos,
 *          Sooraj Puthoor,
 *          Mark Wyse
 */
3711308Santhony.gutierrez@amd.com
3811308Santhony.gutierrez@amd.com#include "gpu-compute/scoreboard_check_stage.hh"
3911308Santhony.gutierrez@amd.com
4011308Santhony.gutierrez@amd.com#include "gpu-compute/compute_unit.hh"
4111308Santhony.gutierrez@amd.com#include "gpu-compute/gpu_static_inst.hh"
4211308Santhony.gutierrez@amd.com#include "gpu-compute/shader.hh"
4311308Santhony.gutierrez@amd.com#include "gpu-compute/wavefront.hh"
4411308Santhony.gutierrez@amd.com#include "params/ComputeUnit.hh"
4511308Santhony.gutierrez@amd.com
4611308Santhony.gutierrez@amd.comScoreboardCheckStage::ScoreboardCheckStage(const ComputeUnitParams *p)
4711308Santhony.gutierrez@amd.com    : numSIMDs(p->num_SIMDs),
4811308Santhony.gutierrez@amd.com      numMemUnits(p->num_global_mem_pipes + p->num_shared_mem_pipes),
4911308Santhony.gutierrez@amd.com      numShrMemPipes(p->num_shared_mem_pipes),
5011308Santhony.gutierrez@amd.com      vectorAluInstAvail(nullptr),
5111308Santhony.gutierrez@amd.com      lastGlbMemSimd(-1),
5211308Santhony.gutierrez@amd.com      lastShrMemSimd(-1), glbMemInstAvail(nullptr),
5311308Santhony.gutierrez@amd.com      shrMemInstAvail(nullptr)
5411308Santhony.gutierrez@amd.com{
5511308Santhony.gutierrez@amd.com}
5611308Santhony.gutierrez@amd.com
5711308Santhony.gutierrez@amd.comScoreboardCheckStage::~ScoreboardCheckStage()
5811308Santhony.gutierrez@amd.com{
5911308Santhony.gutierrez@amd.com    readyList.clear();
6011308Santhony.gutierrez@amd.com    waveStatusList.clear();
6111308Santhony.gutierrez@amd.com    shrMemInstAvail = nullptr;
6211308Santhony.gutierrez@amd.com    glbMemInstAvail = nullptr;
6311308Santhony.gutierrez@amd.com}
6411308Santhony.gutierrez@amd.com
6511308Santhony.gutierrez@amd.comvoid
6611308Santhony.gutierrez@amd.comScoreboardCheckStage::init(ComputeUnit *cu)
6711308Santhony.gutierrez@amd.com{
6811308Santhony.gutierrez@amd.com    computeUnit = cu;
6911308Santhony.gutierrez@amd.com    _name = computeUnit->name() + ".ScoreboardCheckStage";
7011308Santhony.gutierrez@amd.com
7111308Santhony.gutierrez@amd.com    for (int unitId = 0; unitId < numSIMDs + numMemUnits; ++unitId) {
7211308Santhony.gutierrez@amd.com        readyList.push_back(&computeUnit->readyList[unitId]);
7311308Santhony.gutierrez@amd.com    }
7411308Santhony.gutierrez@amd.com
7511308Santhony.gutierrez@amd.com    for (int unitId = 0; unitId < numSIMDs; ++unitId) {
7611308Santhony.gutierrez@amd.com        waveStatusList.push_back(&computeUnit->waveStatusList[unitId]);
7711308Santhony.gutierrez@amd.com    }
7811308Santhony.gutierrez@amd.com
7911308Santhony.gutierrez@amd.com    vectorAluInstAvail = &computeUnit->vectorAluInstAvail;
8011308Santhony.gutierrez@amd.com    glbMemInstAvail= &computeUnit->glbMemInstAvail;
8111308Santhony.gutierrez@amd.com    shrMemInstAvail= &computeUnit->shrMemInstAvail;
8211308Santhony.gutierrez@amd.com}
8311308Santhony.gutierrez@amd.com
8411308Santhony.gutierrez@amd.comvoid
8511308Santhony.gutierrez@amd.comScoreboardCheckStage::initStatistics()
8611308Santhony.gutierrez@amd.com{
8711308Santhony.gutierrez@amd.com    lastGlbMemSimd = -1;
8811308Santhony.gutierrez@amd.com    lastShrMemSimd = -1;
8911308Santhony.gutierrez@amd.com    *glbMemInstAvail = 0;
9011308Santhony.gutierrez@amd.com    *shrMemInstAvail = 0;
9111308Santhony.gutierrez@amd.com
9211308Santhony.gutierrez@amd.com    for (int unitId = 0; unitId < numSIMDs; ++unitId)
9311308Santhony.gutierrez@amd.com        vectorAluInstAvail->at(unitId) = false;
9411308Santhony.gutierrez@amd.com}
9511308Santhony.gutierrez@amd.com
9611308Santhony.gutierrez@amd.comvoid
9711308Santhony.gutierrez@amd.comScoreboardCheckStage::collectStatistics(Wavefront *curWave, int unitId)
9811308Santhony.gutierrez@amd.com{
9911308Santhony.gutierrez@amd.com    if (curWave->instructionBuffer.empty())
10011308Santhony.gutierrez@amd.com        return;
10111308Santhony.gutierrez@amd.com
10211308Santhony.gutierrez@amd.com    // track which vector SIMD unit has at least one WV with a vector
10311308Santhony.gutierrez@amd.com    // ALU as the oldest instruction in its Instruction buffer
10411308Santhony.gutierrez@amd.com    vectorAluInstAvail->at(unitId) = vectorAluInstAvail->at(unitId) ||
10511308Santhony.gutierrez@amd.com                                     curWave->isOldestInstALU();
10611308Santhony.gutierrez@amd.com
10711308Santhony.gutierrez@amd.com    // track how many vector SIMD units have at least one WV with a
10811308Santhony.gutierrez@amd.com    // vector Global memory instruction as the oldest instruction
10911308Santhony.gutierrez@amd.com    // in its Instruction buffer
11011308Santhony.gutierrez@amd.com    if ((curWave->isOldestInstGMem() || curWave->isOldestInstPrivMem() ||
11111308Santhony.gutierrez@amd.com         curWave->isOldestInstFlatMem()) && lastGlbMemSimd != unitId &&
11211308Santhony.gutierrez@amd.com        *glbMemInstAvail <= 1) {
11311308Santhony.gutierrez@amd.com        (*glbMemInstAvail)++;
11411308Santhony.gutierrez@amd.com        lastGlbMemSimd = unitId;
11511308Santhony.gutierrez@amd.com    }
11611308Santhony.gutierrez@amd.com
11711308Santhony.gutierrez@amd.com    // track how many vector SIMD units have at least one WV with a
11811308Santhony.gutierrez@amd.com    // vector shared memory (LDS) instruction as the oldest instruction
11911308Santhony.gutierrez@amd.com    // in its Instruction buffer
12011308Santhony.gutierrez@amd.com    // TODO: parametrize the limit of the LDS units
12111308Santhony.gutierrez@amd.com    if (curWave->isOldestInstLMem() && (*shrMemInstAvail <= numShrMemPipes) &&
12211308Santhony.gutierrez@amd.com        lastShrMemSimd != unitId) {
12311308Santhony.gutierrez@amd.com        (*shrMemInstAvail)++;
12411308Santhony.gutierrez@amd.com        lastShrMemSimd = unitId;
12511308Santhony.gutierrez@amd.com    }
12611308Santhony.gutierrez@amd.com}
12711308Santhony.gutierrez@amd.com
12811308Santhony.gutierrez@amd.comvoid
12911308Santhony.gutierrez@amd.comScoreboardCheckStage::exec()
13011308Santhony.gutierrez@amd.com{
13111308Santhony.gutierrez@amd.com    initStatistics();
13211308Santhony.gutierrez@amd.com
13311308Santhony.gutierrez@amd.com    // reset the ready list for all execution units; it will be
13411308Santhony.gutierrez@amd.com    // constructed every cycle since resource availability may change
13511308Santhony.gutierrez@amd.com    for (int unitId = 0; unitId < numSIMDs + numMemUnits; ++unitId) {
13611308Santhony.gutierrez@amd.com        readyList[unitId]->clear();
13711308Santhony.gutierrez@amd.com    }
13811308Santhony.gutierrez@amd.com
13911308Santhony.gutierrez@amd.com    // iterate over the Wavefronts of all SIMD units
14011308Santhony.gutierrez@amd.com    for (int unitId = 0; unitId < numSIMDs; ++unitId) {
14111308Santhony.gutierrez@amd.com        for (int wvId = 0; wvId < computeUnit->shader->n_wf; ++wvId) {
14211308Santhony.gutierrez@amd.com            // reset the ready status of each wavefront
14311308Santhony.gutierrez@amd.com            waveStatusList[unitId]->at(wvId).second = BLOCKED;
14411308Santhony.gutierrez@amd.com            Wavefront *curWave = waveStatusList[unitId]->at(wvId).first;
14511308Santhony.gutierrez@amd.com            collectStatistics(curWave, unitId);
14611308Santhony.gutierrez@amd.com
14711308Santhony.gutierrez@amd.com            if (curWave->ready(Wavefront::I_ALU)) {
14811308Santhony.gutierrez@amd.com                readyList[unitId]->push_back(curWave);
14911308Santhony.gutierrez@amd.com                waveStatusList[unitId]->at(wvId).second = READY;
15011308Santhony.gutierrez@amd.com            } else if (curWave->ready(Wavefront::I_GLOBAL)) {
15111308Santhony.gutierrez@amd.com                if (computeUnit->cedeSIMD(unitId, wvId)) {
15211308Santhony.gutierrez@amd.com                    continue;
15311308Santhony.gutierrez@amd.com                }
15411308Santhony.gutierrez@amd.com
15511308Santhony.gutierrez@amd.com                readyList[computeUnit->GlbMemUnitId()]->push_back(curWave);
15611308Santhony.gutierrez@amd.com                waveStatusList[unitId]->at(wvId).second = READY;
15711308Santhony.gutierrez@amd.com            } else if (curWave->ready(Wavefront::I_SHARED)) {
15811308Santhony.gutierrez@amd.com                readyList[computeUnit->ShrMemUnitId()]->push_back(curWave);
15911308Santhony.gutierrez@amd.com                waveStatusList[unitId]->at(wvId).second = READY;
16011308Santhony.gutierrez@amd.com            } else if (curWave->ready(Wavefront::I_FLAT)) {
16111308Santhony.gutierrez@amd.com                readyList[computeUnit->GlbMemUnitId()]->push_back(curWave);
16211308Santhony.gutierrez@amd.com                waveStatusList[unitId]->at(wvId).second = READY;
16311308Santhony.gutierrez@amd.com            } else if (curWave->ready(Wavefront::I_PRIVATE)) {
16411308Santhony.gutierrez@amd.com                readyList[computeUnit->GlbMemUnitId()]->push_back(curWave);
16511308Santhony.gutierrez@amd.com                waveStatusList[unitId]->at(wvId).second = READY;
16611308Santhony.gutierrez@amd.com            }
16711308Santhony.gutierrez@amd.com        }
16811308Santhony.gutierrez@amd.com    }
16911308Santhony.gutierrez@amd.com}
17011308Santhony.gutierrez@amd.com
17111308Santhony.gutierrez@amd.comvoid
17211308Santhony.gutierrez@amd.comScoreboardCheckStage::regStats()
17311308Santhony.gutierrez@amd.com{
17411308Santhony.gutierrez@amd.com}
175