1/*
2 * Copyright (c) 2014 The University of Wisconsin
3 *
4 * Copyright (c) 2006 INRIA (Institut National de Recherche en
5 * Informatique et en Automatique / French National Research Institute
6 * for Computer Science and Applied Mathematics)
7 *
8 * All rights reserved.
9 *
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions are
12 * met: redistributions of source code must retain the above copyright
13 * notice, this list of conditions and the following disclaimer;
14 * redistributions in binary form must reproduce the above copyright
15 * notice, this list of conditions and the following disclaimer in the
16 * documentation and/or other materials provided with the distribution;
17 * neither the name of the copyright holders nor the names of its
18 * contributors may be used to endorse or promote products derived from
19 * this software without specific prior written permission.
20 *
21 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
22 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
23 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
24 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
25 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
26 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
27 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
28 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
29 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
30 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
31 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
32 *
33 * Authors: Vignyan Reddy, Dibakar Gope and Arthur Perais,
34 * from André Seznec's code.
35 */
36
37/* @file
38 * Implementation of a L-TAGE branch predictor
39 */
40
41#include "cpu/pred/ltage.hh"
42
43#include "base/intmath.hh"
44#include "base/logging.hh"
45#include "base/random.hh"
46#include "base/trace.hh"
47#include "debug/Fetch.hh"
48#include "debug/LTage.hh"
49
50LTAGE::LTAGE(const LTAGEParams *params)
51 : TAGE(params),
52 logSizeLoopPred(params->logSizeLoopPred),
53 loopTableAgeBits(params->loopTableAgeBits),
54 loopTableConfidenceBits(params->loopTableConfidenceBits),
55 loopTableTagBits(params->loopTableTagBits),
56 loopTableIterBits(params->loopTableIterBits),
57 logLoopTableAssoc(params->logLoopTableAssoc),
58 confidenceThreshold((1 << loopTableConfidenceBits) - 1),
59 loopTagMask((1 << loopTableTagBits) - 1),
60 loopNumIterMask((1 << loopTableIterBits) - 1),
61 loopUseCounter(0),
62 withLoopBits(params->withLoopBits)
63{
64 // we use uint16_t type for these vales, so they cannot be more than
65 // 16 bits
66 assert(loopTableTagBits <= 16);
67 assert(loopTableIterBits <= 16);
68
69 assert(logSizeLoopPred >= logLoopTableAssoc);
70
71 ltable = new LoopEntry[ULL(1) << logSizeLoopPred];
72}
73
74int
75LTAGE::lindex(Addr pc_in) const
76{
77 // The loop table is implemented as a linear table
78 // If associativity is N (N being 1 << logLoopTableAssoc),
79 // the first N entries are for set 0, the next N entries are for set 1,
80 // and so on.
81 // Thus, this function calculates the set and then it gets left shifted
82 // by logLoopTableAssoc in order to return the index of the first of the
83 // N entries of the set
84 Addr mask = (ULL(1) << (logSizeLoopPred - logLoopTableAssoc)) - 1;
85 return (((pc_in >> instShiftAmt) & mask) << logLoopTableAssoc);
86}
87
88//loop prediction: only used if high confidence
89bool
90LTAGE::getLoop(Addr pc, LTageBranchInfo* bi) const
91{
92 bi->loopHit = -1;
93 bi->loopPredValid = false;
94 bi->loopIndex = lindex(pc);
95 unsigned pcShift = instShiftAmt + logSizeLoopPred - logLoopTableAssoc;
96 bi->loopTag = ((pc) >> pcShift) & loopTagMask;
97
98 for (int i = 0; i < (1 << logLoopTableAssoc); i++) {
99 if (ltable[bi->loopIndex + i].tag == bi->loopTag) {
100 bi->loopHit = i;
101 bi->loopPredValid =
102 ltable[bi->loopIndex + i].confidence == confidenceThreshold;
103 bi->currentIter = ltable[bi->loopIndex + i].currentIterSpec;
104 if (ltable[bi->loopIndex + i].currentIterSpec + 1 ==
105 ltable[bi->loopIndex + i].numIter) {
106 return !(ltable[bi->loopIndex + i].dir);
107 }else {
108 return (ltable[bi->loopIndex + i].dir);
109 }
110 }
111 }
112 return false;
113}
114
115void
116LTAGE::specLoopUpdate(Addr pc, bool taken, LTageBranchInfo* bi)
117{
118 if (bi->loopHit>=0) {
119 int index = lindex(pc);
120 if (taken != ltable[index].dir) {
121 ltable[index].currentIterSpec = 0;
122 } else {
123 ltable[index].currentIterSpec =
124 (ltable[index].currentIterSpec + 1) & loopNumIterMask;
125 }
126 }
127}
128
129void
130LTAGE::loopUpdate(Addr pc, bool taken, LTageBranchInfo* bi)
131{
132 int idx = bi->loopIndex + bi->loopHit;
133 if (bi->loopHit >= 0) {
134 //already a hit
135 if (bi->loopPredValid) {
136 if (taken != bi->loopPred) {
137 // free the entry
138 ltable[idx].numIter = 0;
139 ltable[idx].age = 0;
140 ltable[idx].confidence = 0;
141 ltable[idx].currentIter = 0;
142 return;
143 } else if (bi->loopPred != bi->tagePred) {
144 DPRINTF(LTage, "Loop Prediction success:%lx\n",pc);
145 unsignedCtrUpdate(ltable[idx].age, true, loopTableAgeBits);
146 }
147 }
148
149 ltable[idx].currentIter =
150 (ltable[idx].currentIter + 1) & loopNumIterMask;
151 if (ltable[idx].currentIter > ltable[idx].numIter) {
152 ltable[idx].confidence = 0;
153 if (ltable[idx].numIter != 0) {
154 // free the entry
155 ltable[idx].numIter = 0;
156 ltable[idx].age = 0;
157 ltable[idx].confidence = 0;
158 }
159 }
160
161 if (taken != ltable[idx].dir) {
162 if (ltable[idx].currentIter == ltable[idx].numIter) {
163 DPRINTF(LTage, "Loop End predicted successfully:%lx\n", pc);
164
165 unsignedCtrUpdate(ltable[idx].confidence, true,
166 loopTableConfidenceBits);
167 //just do not predict when the loop count is 1 or 2
168 if (ltable[idx].numIter < 3) {
169 // free the entry
170 ltable[idx].dir = taken;
171 ltable[idx].numIter = 0;
172 ltable[idx].age = 0;
173 ltable[idx].confidence = 0;
174 }
175 } else {
176 DPRINTF(LTage, "Loop End predicted incorrectly:%lx\n", pc);
177 if (ltable[idx].numIter == 0) {
178 // first complete nest;
179 ltable[idx].confidence = 0;
180 ltable[idx].numIter = ltable[idx].currentIter;
181 } else {
182 //not the same number of iterations as last time: free the
183 //entry
184 ltable[idx].numIter = 0;
185 ltable[idx].age = 0;
186 ltable[idx].confidence = 0;
187 }
188 }
189 ltable[idx].currentIter = 0;
190 }
191
192 } else if (taken) {
193 //try to allocate an entry on taken branch
194 int nrand = random_mt.random<int>();
195 for (int i = 0; i < (1 << logLoopTableAssoc); i++) {
196 int loop_hit = (nrand + i) & ((1 << logLoopTableAssoc) - 1);
197 idx = bi->loopIndex + loop_hit;
198 if (ltable[idx].age == 0) {
199 DPRINTF(LTage, "Allocating loop pred entry for branch %lx\n",
200 pc);
201 ltable[idx].dir = !taken;
202 ltable[idx].tag = bi->loopTag;
203 ltable[idx].numIter = 0;
204 ltable[idx].age = (1 << loopTableAgeBits) - 1;
205 ltable[idx].confidence = 0;
206 ltable[idx].currentIter = 1;
207 break;
208
209 }
210 else
211 ltable[idx].age--;
212 }
213 }
214
215}
216
217//prediction
218bool
219LTAGE::predict(ThreadID tid, Addr branch_pc, bool cond_branch, void* &b)
220{
221 LTageBranchInfo *bi = new LTageBranchInfo(nHistoryTables+1);
222 b = (void*)(bi);
223
224 bool pred_taken = tagePredict(tid, branch_pc, cond_branch, bi);
225
226 if (cond_branch) {
227 bi->loopPred = getLoop(branch_pc, bi); // loop prediction
228
229 if ((loopUseCounter >= 0) && bi->loopPredValid) {
230 pred_taken = bi->loopPred;
231 bi->provider = LOOP;
232 }
233 DPRINTF(LTage, "Predict for %lx: taken?:%d, loopTaken?:%d, "
234 "loopValid?:%d, loopUseCounter:%d, tagePred:%d, altPred:%d\n",
235 branch_pc, pred_taken, bi->loopPred, bi->loopPredValid,
236 loopUseCounter, bi->tagePred, bi->altTaken);
237 }
238
239 specLoopUpdate(branch_pc, pred_taken, bi);
240 return pred_taken;
241}
242
243void
244LTAGE::condBranchUpdate(Addr branch_pc, bool taken,
245 TageBranchInfo* tage_bi, int nrand)
246{
247 LTageBranchInfo* bi = static_cast<LTageBranchInfo*>(tage_bi);
248
249 // first update the loop predictor
250 loopUpdate(branch_pc, taken, bi);
251
252 if (bi->loopPredValid) {
253 if (bi->tagePred != bi->loopPred) {
254 ctrUpdate(loopUseCounter,
255 (bi->loopPred == taken),
256 withLoopBits);
257 }
258 }
259
260 TAGE::condBranchUpdate(branch_pc, taken, bi, nrand);
261}
262
263void
264LTAGE::squash(ThreadID tid, bool taken, void *bp_history)
265{
266 TAGE::squash(tid, taken, bp_history);
267
268 LTageBranchInfo* bi = (LTageBranchInfo*)(bp_history);
269
270 if (bi->condBranch) {
271 if (bi->loopHit >= 0) {
272 int idx = bi->loopIndex + bi->loopHit;
273 ltable[idx].currentIterSpec = bi->currentIter;
274 }
275 }
276}
277
278void
279LTAGE::squash(ThreadID tid, void *bp_history)
280{
281 LTageBranchInfo* bi = (LTageBranchInfo*)(bp_history);
282 if (bi->condBranch) {
283 if (bi->loopHit >= 0) {
284 int idx = bi->loopIndex + bi->loopHit;
285 ltable[idx].currentIterSpec = bi->currentIter;
286 }
287 }
288
289 TAGE::squash(tid, bp_history);
290}
291
292
293void
294LTAGE::updateStats(bool taken, TageBranchInfo* bi)
295{
296 TAGE::updateStats(taken, bi);
297
298 LTageBranchInfo * ltage_bi = static_cast<LTageBranchInfo *>(bi);
299
300 if (ltage_bi->provider == LOOP) {
301 if (taken == ltage_bi->loopPred) {
302 loopPredictorCorrect++;
303 } else {
304 loopPredictorWrong++;
305 }
306 }
307}
308
309
310
311void
312LTAGE::regStats()
313{
314 TAGE::regStats();
315
316 loopPredictorCorrect
317 .name(name() + ".loopPredictorCorrect")
318 .desc("Number of times the loop predictor is the provider and "
319 "the prediction is correct");
320
321 loopPredictorWrong
322 .name(name() + ".loopPredictorWrong")
323 .desc("Number of times the loop predictor is the provier and "
324 "the prediction is wrong");
325}
326
327
328
329LTAGE*
330LTAGEParams::create()
331{
332 return new LTAGE(this);
333}