Throttle.cc revision 6891:77451885bb00
1
2/*
3 * Copyright (c) 1999-2008 Mark D. Hill and David A. Wood
4 * All rights reserved.
5 *
6 * Redistribution and use in source and binary forms, with or without
7 * modification, are permitted provided that the following conditions are
8 * met: redistributions of source code must retain the above copyright
9 * notice, this list of conditions and the following disclaimer;
10 * redistributions in binary form must reproduce the above copyright
11 * notice, this list of conditions and the following disclaimer in the
12 * documentation and/or other materials provided with the distribution;
13 * neither the name of the copyright holders nor the names of its
14 * contributors may be used to endorse or promote products derived from
15 * this software without specific prior written permission.
16 *
17 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
18 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
19 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
20 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
21 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
22 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
23 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
24 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
25 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
27 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28 */
29
30/*
31 * $Id$
32 *
33 * Description: see Throttle.hh
34 *
35 */
36
37#include "mem/ruby/network/simple/Throttle.hh"
38#include "mem/ruby/buffers/MessageBuffer.hh"
39#include "mem/ruby/network/Network.hh"
40#include "mem/ruby/system/System.hh"
41#include "mem/ruby/slicc_interface/NetworkMessage.hh"
42#include "mem/protocol/Protocol.hh"
43
// --- Bandwidth predictor ("bash") tuning -----------------------------------

// Initial value of m_bash_counter and the upper clamp applied to it in
// wakeup(); also the scale used by broadcastBandwidthAvailable().
const int HIGH_RANGE = 256;

// Length of one bandwidth sampling window, in event-queue time units.
const int ADJUST_INTERVAL = 50000;

// --- Message size accounting -----------------------------------------------

// Factor applied to every message size when it is converted to bandwidth
// units in network_message_to_size().
const int MESSAGE_SIZE_MULTIPLIER = 1000;

// Additional factor applied to broadcast messages; it only takes effect
// when it is greater than 1.
// Alternative setting: 4, to have a 16p system act like a 64p system.
const int BROADCAST_SCALING = 1;

// --- Virtual network arbitration -------------------------------------------

// Number of wakeups served in the normal priority order before one wakeup
// is served in the inverted order.
const int PRIORITY_SWITCH_LIMIT = 128;
50
51static int network_message_to_size(NetworkMessage* net_msg_ptr);
52
53extern std::ostream * debug_cout_ptr;
54
55Throttle::Throttle(int sID, NodeID node, int link_latency, int link_bandwidth_multiplier)
56{
57  init(node, link_latency, link_bandwidth_multiplier);
58  m_sID = sID;
59}
60
61Throttle::Throttle(NodeID node, int link_latency, int link_bandwidth_multiplier)
62{
63  init(node, link_latency, link_bandwidth_multiplier);
64  m_sID = 0;
65}
66
67void Throttle::init(NodeID node, int link_latency, int link_bandwidth_multiplier)
68{
69  m_node = node;
70  m_vnets = 0;
71
72  ASSERT(link_bandwidth_multiplier > 0);
73  m_link_bandwidth_multiplier = link_bandwidth_multiplier;
74  m_link_latency = link_latency;
75
76  m_bash_counter = HIGH_RANGE;
77  m_bandwidth_since_sample = 0;
78  m_last_bandwidth_sample = 0;
79  m_wakeups_wo_switch = 0;
80  clearStats();
81}
82
83void Throttle::clear()
84{
85  for (int counter = 0; counter < m_vnets; counter++) {
86    m_in[counter]->clear();
87    m_out[counter]->clear();
88  }
89}
90
91void Throttle::addLinks(const Vector<MessageBuffer*>& in_vec, const Vector<MessageBuffer*>& out_vec)
92{
93  assert(in_vec.size() == out_vec.size());
94  for (int i=0; i<in_vec.size(); i++) {
95    addVirtualNetwork(in_vec[i], out_vec[i]);
96  }
97
98  m_message_counters.setSize(MessageSizeType_NUM);
99  for (int i=0; i<MessageSizeType_NUM; i++) {
100    m_message_counters[i].setSize(in_vec.size());
101    for (int j=0; j<m_message_counters[i].size(); j++) {
102      m_message_counters[i][j] = 0;
103    }
104  }
105}
106
107void Throttle::addVirtualNetwork(MessageBuffer* in_ptr, MessageBuffer* out_ptr)
108{
109  m_units_remaining.insertAtBottom(0);
110  m_in.insertAtBottom(in_ptr);
111  m_out.insertAtBottom(out_ptr);
112
113  // Set consumer and description
114  m_in[m_vnets]->setConsumer(this);
115  string desc = "[Queue to Throttle " + NodeIDToString(m_sID) + " " + NodeIDToString(m_node) + "]";
116  m_in[m_vnets]->setDescription(desc);
117  m_vnets++;
118}
119
120void Throttle::wakeup()
121{
122  // Limits the number of message sent to a limited number of bytes/cycle.
123  assert(getLinkBandwidth() > 0);
124  int bw_remaining = getLinkBandwidth();
125
126  // Give the highest numbered link priority most of the time
127  m_wakeups_wo_switch++;
128  int highest_prio_vnet = m_vnets-1;
129  int lowest_prio_vnet = 0;
130  int counter = 1;
131  bool schedule_wakeup = false;
132
133  // invert priorities to avoid starvation seen in the component network
134  if (m_wakeups_wo_switch > PRIORITY_SWITCH_LIMIT) {
135    m_wakeups_wo_switch = 0;
136    highest_prio_vnet = 0;
137    lowest_prio_vnet = m_vnets-1;
138    counter = -1;
139  }
140
141  for (int vnet = highest_prio_vnet; (vnet*counter) >= (counter*lowest_prio_vnet); vnet -= counter) {
142
143    assert(m_out[vnet] != NULL);
144    assert(m_in[vnet] != NULL);
145    assert(m_units_remaining[vnet] >= 0);
146
147    while ((bw_remaining > 0) && ((m_in[vnet]->isReady()) || (m_units_remaining[vnet] > 0)) && m_out[vnet]->areNSlotsAvailable(1)) {
148
149      // See if we are done transferring the previous message on this virtual network
150      if (m_units_remaining[vnet] == 0 && m_in[vnet]->isReady()) {
151
152        // Find the size of the message we are moving
153        MsgPtr msg_ptr = m_in[vnet]->peekMsgPtr();
154        NetworkMessage* net_msg_ptr = dynamic_cast<NetworkMessage*>(msg_ptr.ref());
155        m_units_remaining[vnet] += network_message_to_size(net_msg_ptr);
156
157        DEBUG_NEWLINE(NETWORK_COMP,HighPrio);
158        DEBUG_MSG(NETWORK_COMP,HighPrio,"throttle: " + int_to_string(m_node)
159                  + " my bw " + int_to_string(getLinkBandwidth())
160                  + " bw spent enqueueing net msg " + int_to_string(m_units_remaining[vnet])
161                  + " time: " + int_to_string(g_eventQueue_ptr->getTime()) + ".");
162
163        // Move the message
164        m_out[vnet]->enqueue(m_in[vnet]->peekMsgPtr(), m_link_latency);
165        m_in[vnet]->pop();
166
167        // Count the message
168        m_message_counters[net_msg_ptr->getMessageSize()][vnet]++;
169
170        DEBUG_MSG(NETWORK_COMP,LowPrio,*m_out[vnet]);
171        DEBUG_NEWLINE(NETWORK_COMP,HighPrio);
172      }
173
174      // Calculate the amount of bandwidth we spent on this message
175      int diff = m_units_remaining[vnet] - bw_remaining;
176      m_units_remaining[vnet] = max(0, diff);
177      bw_remaining = max(0, -diff);
178    }
179
180    if ((bw_remaining > 0) && ((m_in[vnet]->isReady()) || (m_units_remaining[vnet] > 0)) && !m_out[vnet]->areNSlotsAvailable(1)) {
181      DEBUG_MSG(NETWORK_COMP,LowPrio,vnet);
182      schedule_wakeup = true; // schedule me to wakeup again because I'm waiting for my output queue to become available
183    }
184  }
185
186  // We should only wake up when we use the bandwidth
187  //  assert(bw_remaining != getLinkBandwidth());  // This is only mostly true
188
189  // Record that we used some or all of the link bandwidth this cycle
190  double ratio = 1.0-(double(bw_remaining)/double(getLinkBandwidth()));
191  // If ratio = 0, we used no bandwidth, if ratio = 1, we used all
192  linkUtilized(ratio);
193
194  // Sample the link bandwidth utilization over a number of cycles
195  int bw_used = getLinkBandwidth()-bw_remaining;
196  m_bandwidth_since_sample += bw_used;
197
198  // FIXME - comment out the bash specific code for faster performance
199  // Start Bash code
200  // Update the predictor
201  Time current_time = g_eventQueue_ptr->getTime();
202  while ((current_time - m_last_bandwidth_sample) > ADJUST_INTERVAL) {
203    // Used less bandwidth
204    m_bash_counter--;
205
206    // Make sure we don't overflow
207    m_bash_counter = min(HIGH_RANGE, m_bash_counter);
208    m_bash_counter = max(0, m_bash_counter);
209
210    // Reset samples
211    m_last_bandwidth_sample += ADJUST_INTERVAL;
212    m_bandwidth_since_sample = 0;
213  }
214  // End Bash code
215
216  if ((bw_remaining > 0) && !schedule_wakeup) {
217    // We have extra bandwidth and our output buffer was available, so we must not have anything else to do until another message arrives.
218    DEBUG_MSG(NETWORK_COMP,LowPrio,*this);
219    DEBUG_MSG(NETWORK_COMP,LowPrio,"not scheduled again");
220  } else {
221    DEBUG_MSG(NETWORK_COMP,LowPrio,*this);
222    DEBUG_MSG(NETWORK_COMP,LowPrio,"scheduled again");
223    // We are out of bandwidth for this cycle, so wakeup next cycle and continue
224    g_eventQueue_ptr->scheduleEvent(this, 1);
225  }
226}
227
228bool Throttle::broadcastBandwidthAvailable(int rand) const
229{
230  bool result =  !(m_bash_counter > ((HIGH_RANGE/4) + (rand % (HIGH_RANGE/2))));
231  return result;
232}
233
234void Throttle::printStats(ostream& out) const
235{
236  out << "utilized_percent: " << getUtilization() << endl;
237}
238
239void Throttle::clearStats()
240{
241  m_ruby_start = g_eventQueue_ptr->getTime();
242  m_links_utilized = 0.0;
243
244  for (int i=0; i<m_message_counters.size(); i++) {
245    for (int j=0; j<m_message_counters[i].size(); j++) {
246      m_message_counters[i][j] = 0;
247    }
248  }
249}
250
251void Throttle::printConfig(ostream& out) const
252{
253
254}
255
256double Throttle::getUtilization() const
257{
258  return (100.0 * double(m_links_utilized)) / (double(g_eventQueue_ptr->getTime()-m_ruby_start));
259}
260
261void Throttle::print(ostream& out) const
262{
263  out << "[Throttle: " << m_sID << " " << m_node << " bw: " << getLinkBandwidth() << "]";
264}
265
266// Helper function
267
268static
269int network_message_to_size(NetworkMessage* net_msg_ptr)
270{
271  assert(net_msg_ptr != NULL);
272
273  // Artificially increase the size of broadcast messages
274  if (BROADCAST_SCALING > 1) {
275    if (net_msg_ptr->getDestination().isBroadcast()) {
276      return (RubySystem::getNetwork()->MessageSizeType_to_int(net_msg_ptr->getMessageSize()) * MESSAGE_SIZE_MULTIPLIER * BROADCAST_SCALING);
277    }
278  }
279  return (RubySystem::getNetwork()->MessageSizeType_to_int(net_msg_ptr->getMessageSize()) * MESSAGE_SIZE_MULTIPLIER);
280}
281