111308Santhony.gutierrez@amd.com/* 211308Santhony.gutierrez@amd.com * Copyright (c) 2014-2015 Advanced Micro Devices, Inc. 311308Santhony.gutierrez@amd.com * All rights reserved. 411308Santhony.gutierrez@amd.com * 511308Santhony.gutierrez@amd.com * For use for simulation and test purposes only 611308Santhony.gutierrez@amd.com * 711308Santhony.gutierrez@amd.com * Redistribution and use in source and binary forms, with or without 811308Santhony.gutierrez@amd.com * modification, are permitted provided that the following conditions are met: 911308Santhony.gutierrez@amd.com * 1011308Santhony.gutierrez@amd.com * 1. Redistributions of source code must retain the above copyright notice, 1111308Santhony.gutierrez@amd.com * this list of conditions and the following disclaimer. 1211308Santhony.gutierrez@amd.com * 1311308Santhony.gutierrez@amd.com * 2. Redistributions in binary form must reproduce the above copyright notice, 1411308Santhony.gutierrez@amd.com * this list of conditions and the following disclaimer in the documentation 1511308Santhony.gutierrez@amd.com * and/or other materials provided with the distribution. 1611308Santhony.gutierrez@amd.com * 1712697Santhony.gutierrez@amd.com * 3. Neither the name of the copyright holder nor the names of its 1812697Santhony.gutierrez@amd.com * contributors may be used to endorse or promote products derived from this 1912697Santhony.gutierrez@amd.com * software without specific prior written permission. 2011308Santhony.gutierrez@amd.com * 2111308Santhony.gutierrez@amd.com * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" 2211308Santhony.gutierrez@amd.com * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 2311308Santhony.gutierrez@amd.com * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 2411308Santhony.gutierrez@amd.com * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE 2511308Santhony.gutierrez@amd.com * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR 2611308Santhony.gutierrez@amd.com * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF 2711308Santhony.gutierrez@amd.com * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS 2811308Santhony.gutierrez@amd.com * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN 2911308Santhony.gutierrez@amd.com * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) 3011308Santhony.gutierrez@amd.com * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE 3111308Santhony.gutierrez@amd.com * POSSIBILITY OF SUCH DAMAGE. 3211308Santhony.gutierrez@amd.com * 3312697Santhony.gutierrez@amd.com * Authors: John Kalamatianos, 3412697Santhony.gutierrez@amd.com * Sooraj Puthoor, 3512697Santhony.gutierrez@amd.com * Mark Wyse 3611308Santhony.gutierrez@amd.com */ 3711308Santhony.gutierrez@amd.com 3811308Santhony.gutierrez@amd.com#include "gpu-compute/scoreboard_check_stage.hh" 3911308Santhony.gutierrez@amd.com 4011308Santhony.gutierrez@amd.com#include "gpu-compute/compute_unit.hh" 4111308Santhony.gutierrez@amd.com#include "gpu-compute/gpu_static_inst.hh" 4211308Santhony.gutierrez@amd.com#include "gpu-compute/shader.hh" 4311308Santhony.gutierrez@amd.com#include "gpu-compute/wavefront.hh" 4411308Santhony.gutierrez@amd.com#include "params/ComputeUnit.hh" 4511308Santhony.gutierrez@amd.com 4611308Santhony.gutierrez@amd.comScoreboardCheckStage::ScoreboardCheckStage(const ComputeUnitParams *p) 4711308Santhony.gutierrez@amd.com : numSIMDs(p->num_SIMDs), 4811308Santhony.gutierrez@amd.com numMemUnits(p->num_global_mem_pipes + p->num_shared_mem_pipes), 4911308Santhony.gutierrez@amd.com numShrMemPipes(p->num_shared_mem_pipes), 5011308Santhony.gutierrez@amd.com vectorAluInstAvail(nullptr), 5111308Santhony.gutierrez@amd.com lastGlbMemSimd(-1), 5211308Santhony.gutierrez@amd.com lastShrMemSimd(-1), glbMemInstAvail(nullptr), 5311308Santhony.gutierrez@amd.com shrMemInstAvail(nullptr) 5411308Santhony.gutierrez@amd.com{ 5511308Santhony.gutierrez@amd.com} 5611308Santhony.gutierrez@amd.com 5711308Santhony.gutierrez@amd.comScoreboardCheckStage::~ScoreboardCheckStage() 5811308Santhony.gutierrez@amd.com{ 5911308Santhony.gutierrez@amd.com readyList.clear(); 6011308Santhony.gutierrez@amd.com waveStatusList.clear(); 6111308Santhony.gutierrez@amd.com shrMemInstAvail = nullptr; 6211308Santhony.gutierrez@amd.com glbMemInstAvail = nullptr; 6311308Santhony.gutierrez@amd.com} 6411308Santhony.gutierrez@amd.com 6511308Santhony.gutierrez@amd.comvoid 6611308Santhony.gutierrez@amd.comScoreboardCheckStage::init(ComputeUnit *cu) 6711308Santhony.gutierrez@amd.com{ 6811308Santhony.gutierrez@amd.com computeUnit = cu; 6911308Santhony.gutierrez@amd.com _name = computeUnit->name() + ".ScoreboardCheckStage"; 7011308Santhony.gutierrez@amd.com 7111308Santhony.gutierrez@amd.com for (int unitId = 0; unitId < numSIMDs + numMemUnits; ++unitId) { 7211308Santhony.gutierrez@amd.com readyList.push_back(&computeUnit->readyList[unitId]); 7311308Santhony.gutierrez@amd.com } 7411308Santhony.gutierrez@amd.com 7511308Santhony.gutierrez@amd.com for (int unitId = 0; unitId < numSIMDs; ++unitId) { 7611308Santhony.gutierrez@amd.com waveStatusList.push_back(&computeUnit->waveStatusList[unitId]); 7711308Santhony.gutierrez@amd.com } 7811308Santhony.gutierrez@amd.com 7911308Santhony.gutierrez@amd.com vectorAluInstAvail = &computeUnit->vectorAluInstAvail; 8011308Santhony.gutierrez@amd.com glbMemInstAvail= &computeUnit->glbMemInstAvail; 8111308Santhony.gutierrez@amd.com shrMemInstAvail= &computeUnit->shrMemInstAvail; 8211308Santhony.gutierrez@amd.com} 8311308Santhony.gutierrez@amd.com 8411308Santhony.gutierrez@amd.comvoid 8511308Santhony.gutierrez@amd.comScoreboardCheckStage::initStatistics() 8611308Santhony.gutierrez@amd.com{ 8711308Santhony.gutierrez@amd.com lastGlbMemSimd = -1; 8811308Santhony.gutierrez@amd.com lastShrMemSimd = -1; 8911308Santhony.gutierrez@amd.com *glbMemInstAvail = 0; 9011308Santhony.gutierrez@amd.com *shrMemInstAvail = 0; 9111308Santhony.gutierrez@amd.com 9211308Santhony.gutierrez@amd.com for (int unitId = 0; unitId < numSIMDs; ++unitId) 9311308Santhony.gutierrez@amd.com vectorAluInstAvail->at(unitId) = false; 9411308Santhony.gutierrez@amd.com} 9511308Santhony.gutierrez@amd.com 9611308Santhony.gutierrez@amd.comvoid 9711308Santhony.gutierrez@amd.comScoreboardCheckStage::collectStatistics(Wavefront *curWave, int unitId) 9811308Santhony.gutierrez@amd.com{ 9911308Santhony.gutierrez@amd.com if (curWave->instructionBuffer.empty()) 10011308Santhony.gutierrez@amd.com return; 10111308Santhony.gutierrez@amd.com 10211308Santhony.gutierrez@amd.com // track which vector SIMD unit has at least one WV with a vector 10311308Santhony.gutierrez@amd.com // ALU as the oldest instruction in its Instruction buffer 10411308Santhony.gutierrez@amd.com vectorAluInstAvail->at(unitId) = vectorAluInstAvail->at(unitId) || 10511308Santhony.gutierrez@amd.com curWave->isOldestInstALU(); 10611308Santhony.gutierrez@amd.com 10711308Santhony.gutierrez@amd.com // track how many vector SIMD units have at least one WV with a 10811308Santhony.gutierrez@amd.com // vector Global memory instruction as the oldest instruction 10911308Santhony.gutierrez@amd.com // in its Instruction buffer 11011308Santhony.gutierrez@amd.com if ((curWave->isOldestInstGMem() || curWave->isOldestInstPrivMem() || 11111308Santhony.gutierrez@amd.com curWave->isOldestInstFlatMem()) && lastGlbMemSimd != unitId && 11211308Santhony.gutierrez@amd.com *glbMemInstAvail <= 1) { 11311308Santhony.gutierrez@amd.com (*glbMemInstAvail)++; 11411308Santhony.gutierrez@amd.com lastGlbMemSimd = unitId; 11511308Santhony.gutierrez@amd.com } 11611308Santhony.gutierrez@amd.com 11711308Santhony.gutierrez@amd.com // track how many vector SIMD units have at least one WV with a 11811308Santhony.gutierrez@amd.com // vector shared memory (LDS) instruction as the oldest instruction 11911308Santhony.gutierrez@amd.com // in its Instruction buffer 12011308Santhony.gutierrez@amd.com // TODO: parametrize the limit of the LDS units 12111308Santhony.gutierrez@amd.com if (curWave->isOldestInstLMem() && (*shrMemInstAvail <= numShrMemPipes) && 12211308Santhony.gutierrez@amd.com lastShrMemSimd != unitId) { 12311308Santhony.gutierrez@amd.com (*shrMemInstAvail)++; 12411308Santhony.gutierrez@amd.com lastShrMemSimd = unitId; 12511308Santhony.gutierrez@amd.com } 12611308Santhony.gutierrez@amd.com} 12711308Santhony.gutierrez@amd.com 12811308Santhony.gutierrez@amd.comvoid 12911308Santhony.gutierrez@amd.comScoreboardCheckStage::exec() 13011308Santhony.gutierrez@amd.com{ 13111308Santhony.gutierrez@amd.com initStatistics(); 13211308Santhony.gutierrez@amd.com 13311308Santhony.gutierrez@amd.com // reset the ready list for all execution units; it will be 13411308Santhony.gutierrez@amd.com // constructed every cycle since resource availability may change 13511308Santhony.gutierrez@amd.com for (int unitId = 0; unitId < numSIMDs + numMemUnits; ++unitId) { 13611308Santhony.gutierrez@amd.com readyList[unitId]->clear(); 13711308Santhony.gutierrez@amd.com } 13811308Santhony.gutierrez@amd.com 13911308Santhony.gutierrez@amd.com // iterate over the Wavefronts of all SIMD units 14011308Santhony.gutierrez@amd.com for (int unitId = 0; unitId < numSIMDs; ++unitId) { 14111308Santhony.gutierrez@amd.com for (int wvId = 0; wvId < computeUnit->shader->n_wf; ++wvId) { 14211308Santhony.gutierrez@amd.com // reset the ready status of each wavefront 14311308Santhony.gutierrez@amd.com waveStatusList[unitId]->at(wvId).second = BLOCKED; 14411308Santhony.gutierrez@amd.com Wavefront *curWave = waveStatusList[unitId]->at(wvId).first; 14511308Santhony.gutierrez@amd.com collectStatistics(curWave, unitId); 14611308Santhony.gutierrez@amd.com 14711308Santhony.gutierrez@amd.com if (curWave->ready(Wavefront::I_ALU)) { 14811308Santhony.gutierrez@amd.com readyList[unitId]->push_back(curWave); 14911308Santhony.gutierrez@amd.com waveStatusList[unitId]->at(wvId).second = READY; 15011308Santhony.gutierrez@amd.com } else if (curWave->ready(Wavefront::I_GLOBAL)) { 15111308Santhony.gutierrez@amd.com if (computeUnit->cedeSIMD(unitId, wvId)) { 15211308Santhony.gutierrez@amd.com continue; 15311308Santhony.gutierrez@amd.com } 15411308Santhony.gutierrez@amd.com 15511308Santhony.gutierrez@amd.com readyList[computeUnit->GlbMemUnitId()]->push_back(curWave); 15611308Santhony.gutierrez@amd.com waveStatusList[unitId]->at(wvId).second = READY; 15711308Santhony.gutierrez@amd.com } else if (curWave->ready(Wavefront::I_SHARED)) { 15811308Santhony.gutierrez@amd.com readyList[computeUnit->ShrMemUnitId()]->push_back(curWave); 15911308Santhony.gutierrez@amd.com waveStatusList[unitId]->at(wvId).second = READY; 16011308Santhony.gutierrez@amd.com } else if (curWave->ready(Wavefront::I_FLAT)) { 16111308Santhony.gutierrez@amd.com readyList[computeUnit->GlbMemUnitId()]->push_back(curWave); 16211308Santhony.gutierrez@amd.com waveStatusList[unitId]->at(wvId).second = READY; 16311308Santhony.gutierrez@amd.com } else if (curWave->ready(Wavefront::I_PRIVATE)) { 16411308Santhony.gutierrez@amd.com readyList[computeUnit->GlbMemUnitId()]->push_back(curWave); 16511308Santhony.gutierrez@amd.com waveStatusList[unitId]->at(wvId).second = READY; 16611308Santhony.gutierrez@amd.com } 16711308Santhony.gutierrez@amd.com } 16811308Santhony.gutierrez@amd.com } 16911308Santhony.gutierrez@amd.com} 17011308Santhony.gutierrez@amd.com 17111308Santhony.gutierrez@amd.comvoid 17211308Santhony.gutierrez@amd.comScoreboardCheckStage::regStats() 17311308Santhony.gutierrez@amd.com{ 17411308Santhony.gutierrez@amd.com} 175