dma_device.hh revision 11625:2344c9dcc0d6
/*
 * Copyright (c) 2012-2013, 2015 ARM Limited
 * All rights reserved.
 *
 * The license below extends only to copyright in the software and shall
 * not be construed as granting a license to any other intellectual
 * property including but not limited to intellectual property relating
 * to a hardware implementation of the functionality of the software
 * licensed hereunder. You may use the software subject to the license
 * terms below provided that you ensure that this notice is replicated
 * unmodified and in its entirety in all distributions of the software,
 * modified or unmodified, in source code or in binary form.
 *
 * Copyright (c) 2004-2005 The Regents of The University of Michigan
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are
 * met: redistributions of source code must retain the above copyright
 * notice, this list of conditions and the following disclaimer;
 * redistributions in binary form must reproduce the above copyright
 * notice, this list of conditions and the following disclaimer in the
 * documentation and/or other materials provided with the distribution;
 * neither the name of the copyright holders nor the names of its
 * contributors may be used to endorse or promote products derived from
 * this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 * Authors: Ali Saidi
 *          Nathan Binkert
 *          Andreas Sandberg
 */

#ifndef __DEV_DMA_DEVICE_HH__
#define __DEV_DMA_DEVICE_HH__

#include <deque>
#include <memory>
#include <vector>

#include "base/circlebuf.hh"
#include "dev/io_device.hh"
#include "params/DmaDevice.hh"
#include "sim/drain.hh"
#include "sim/system.hh"

class DmaPort : public MasterPort, public Drainable
{
  private:

    /**
     * Take the first packet of the transmit list and attempt to send
     * it as a timing request. If it is successful, schedule the
     * sending of the next packet, otherwise remember that we are
     * waiting for a retry.
     */
    void trySendTimingReq();

    /**
     * For timing, attempt to send the first item on the transmit
     * list, and if it is successful and there are more packets
     * waiting, then schedule the sending of the next packet. For
     * atomic, simply send and process everything on the transmit
     * list.
     */
    void sendDma();

    /**
     * Handle a response packet by updating the corresponding DMA
     * request state to reflect the bytes received, and also update
     * the pending request counter.
     * If the DMA request that this packet is part of is complete,
     * then signal the completion event if present, potentially with
     * a delay added to it.
     *
     * @param pkt Response packet to handle
     * @param delay Additional delay for scheduling the completion event
     */
    void handleResp(PacketPtr pkt, Tick delay = 0);

    struct DmaReqState : public Packet::SenderState
    {
        /** Event to call on the device when this transaction (all packets)
         * completes. */
        Event *completionEvent;

        /** Total number of bytes that this transaction involves. */
        const Addr totBytes;

        /** Number of bytes that have been acked for this transaction. */
        Addr numBytes;

        /** Amount to delay completion of the DMA by */
        const Tick delay;

        DmaReqState(Event *ce, Addr tb, Tick _delay)
            : completionEvent(ce), totBytes(tb), numBytes(0), delay(_delay)
        {}
    };

  public:
    /** The device that owns this port. */
    MemObject *const device;

    /** The system that device/port are in. This is used to select which mode
     * we are currently operating in. */
    System *const sys;

    /** Id for all requests */
    const MasterID masterId;

  protected:
    /** Use a deque as we never do any insertion or removal in the middle */
    std::deque<PacketPtr> transmitList;

    /** Event used to schedule a future sending from the transmit list. */
    EventWrapper<DmaPort, &DmaPort::sendDma> sendEvent;

    /** Number of outstanding packets the DMA port has. */
    uint32_t pendingCount;

    /** If the port is currently waiting for a retry before it can
     * send whatever it is that it's sending. */
    bool inRetry;

  protected:

    bool recvTimingResp(PacketPtr pkt) override;
    void recvReqRetry() override;

    void queueDma(PacketPtr pkt);

  public:

    DmaPort(MemObject *dev, System *s);

    RequestPtr dmaAction(Packet::Command cmd, Addr addr, int size,
                         Event *event, uint8_t *data, Tick delay,
                         Request::Flags flag = 0);

    bool dmaPending() const { return pendingCount > 0; }

    DrainState drain() override;
};

class DmaDevice : public PioDevice
{
  protected:
    DmaPort dmaPort;

  public:
    typedef DmaDeviceParams Params;
    DmaDevice(const Params *p);
    virtual ~DmaDevice() { }

    void dmaWrite(Addr addr, int size, Event *event, uint8_t *data,
                  Tick delay = 0)
    {
        dmaPort.dmaAction(MemCmd::WriteReq, addr, size, event, data, delay);
    }

    void dmaRead(Addr addr, int size, Event *event, uint8_t *data,
                 Tick delay = 0)
    {
        dmaPort.dmaAction(MemCmd::ReadReq, addr, size, event, data, delay);
    }

    bool dmaPending() const { return dmaPort.dmaPending(); }

    void init() override;

    unsigned int cacheBlockSize() const { return sys->cacheLineSize(); }

    BaseMasterPort &getMasterPort(const std::string &if_name,
                                  PortID idx = InvalidPortID) override;
};
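
/*
 * Example (an illustrative sketch, not part of this header): a device
 * derived from DmaDevice that issues a DMA read and is notified once the
 * whole transaction has completed. MyDevice, startRead(), readDone() and
 * readBuffer are hypothetical names.
 *
 * \code{.cpp}
 * class MyDevice : public DmaDevice
 * {
 *   private:
 *     uint8_t readBuffer[64];
 *
 *     void readDone() { } // readBuffer now holds the transferred data
 *
 *     EventWrapper<MyDevice, &MyDevice::readDone> readDoneEvent;
 *
 *   public:
 *     MyDevice(const Params *p) : DmaDevice(p), readDoneEvent(this) {}
 *
 *     void startRead(Addr addr)
 *     {
 *         // readDoneEvent is scheduled once every response packet of
 *         // this transaction has been received.
 *         dmaRead(addr, sizeof(readBuffer), &readDoneEvent, readBuffer);
 *     }
 * };
 * \endcode
 */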

/**
 * DMA callback class.
 *
 * Allows one to register for a callback event after a sequence of (potentially
 * non-contiguous) DMA transfers on a DmaPort completes. Derived classes must
 * implement the process() method and use getChunkEvent() to allocate a
 * callback event for each participating DMA.
 */
class DmaCallback : public Drainable
{
  public:
    virtual const std::string name() const { return "DmaCallback"; }

    /**
     * DmaPort ensures that all outstanding DMA accesses have completed
     * before it finishes draining. However, DmaChunkEvents scheduled with
     * a delay might still be sitting on the event queue. Therefore,
     * draining is not complete until count is 0, which ensures that all
     * outstanding DmaChunkEvents associated with this DmaCallback have
     * fired.
     */
    DrainState drain() override
    {
        return count ? DrainState::Draining : DrainState::Drained;
    }

  protected:
    int count;

    DmaCallback()
        : count(0)
    { }

    virtual ~DmaCallback() { }

    /**
     * Callback function invoked on completion of all chunks.
     */
    virtual void process() = 0;

  private:
    /**
     * Called by the DMA engine completion event on each chunk completion.
     * Since the object may delete itself here, callers should not use
     * the object pointer after calling this function.
     */
    void chunkComplete()
    {
        if (--count == 0) {
            process();
            // Need to notify DrainManager that this object is finished
            // draining, even though it is immediately deleted.
            signalDrainDone();
            delete this;
        }
    }

    /**
     * Event invoked by DmaDevice on completion of each chunk.
     */
    class DmaChunkEvent : public Event
    {
      private:
        DmaCallback *callback;

      public:
        DmaChunkEvent(DmaCallback *cb)
            : Event(Default_Pri, AutoDelete), callback(cb)
        { }

        void process() { callback->chunkComplete(); }
    };

  public:

    /**
     * Request a chunk event. Chunk events should be provided to each DMA
     * request that wishes to participate in this DmaCallback.
     */
    Event *getChunkEvent()
    {
        ++count;
        return new DmaChunkEvent(this);
    }
};
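
/*
 * Example (an illustrative sketch; MyCallback, port, addr0/addr1 and
 * buf0/buf1 are hypothetical): a single callback that fires only after
 * two scattered DMA reads have both completed.
 *
 * \code{.cpp}
 * class MyCallback : public DmaCallback
 * {
 *   protected:
 *     void process() override
 *     {
 *         // Both chunks have completed; the object deletes itself
 *         // once this method returns.
 *     }
 * };
 *
 * DmaCallback *cb = new MyCallback();
 * port.dmaAction(MemCmd::ReadReq, addr0, 64, cb->getChunkEvent(), buf0, 0);
 * port.dmaAction(MemCmd::ReadReq, addr1, 64, cb->getChunkEvent(), buf1, 0);
 * \endcode
 */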

/**
 * Buffered DMA engine helper class
 *
 * This class implements a simple DMA engine that feeds a FIFO
 * buffer. The size of the buffer, the maximum number of pending
 * requests and the maximum request size are all set when the engine
 * is instantiated.
 *
 * An <i>asynchronous</i> transfer of a <i>block</i> of data
 * (designated by a start address and a size) is started by calling
 * the startFill() method. The DMA engine will aggressively try to
 * keep the internal FIFO full. As soon as there is room in the FIFO
 * for more data <i>and</i> there are free request slots, a new fill
 * will be started.
 *
 * Data in the FIFO can be read back using the get() and tryGet()
 * methods. Both request a block of data from the FIFO. However, get()
 * panics if the block cannot be satisfied, while tryGet() simply
 * returns false. The latter call makes it possible to implement
 * custom buffer underrun handling.
 *
 * A simple use case would be something like this:
 * \code{.cpp}
 *     // Create a DMA engine with a 1KiB buffer. Issue up to 8 concurrent
 *     // uncacheable 64 byte (maximum) requests.
 *     DmaReadFifo *dma = new DmaReadFifo(port, 1024, 64, 8,
 *                                        Request::UNCACHEABLE);
 *
 *     // Start copying 4KiB of data from 0xFF000000
 *     dma->startFill(0xFF000000, 0x1000);
 *
 *     // Some time later, when there is data in the FIFO.
 *     uint8_t data[8];
 *     dma->get(data, sizeof(data));
 * \endcode
 *
 * The DMA engine allows new blocks to be requested as soon as the
 * last request for a block has been sent (i.e., there is no need to
 * wait for pending requests to complete). This can be queried with
 * the atEndOfBlock() method and more advanced implementations may
 * override the onEndOfBlock() callback.
 */
class DmaReadFifo : public Drainable, public Serializable
{
  public:
    DmaReadFifo(DmaPort &port, size_t size,
                unsigned max_req_size,
                unsigned max_pending,
                Request::Flags flags = 0);

    ~DmaReadFifo();

  public: // Serializable
    void serialize(CheckpointOut &cp) const override;
    void unserialize(CheckpointIn &cp) override;

  public: // Drainable
    DrainState drain() override;

  public: // FIFO access
    /**
     * @{
     * @name FIFO access
     */
    /**
     * Try to read data from the FIFO.
     *
     * This method reads len bytes of data from the FIFO and stores
     * them in the memory location pointed to by dst. The method
     * fails, and no data is written to the buffer, if the FIFO
     * doesn't contain enough data to satisfy the request.
     *
     * @param dst Pointer to a destination buffer
     * @param len Amount of data to read.
     * @return true on success, false otherwise.
     */
    bool tryGet(uint8_t *dst, size_t len);

    template<typename T>
    bool tryGet(T &value) {
        return tryGet(reinterpret_cast<uint8_t *>(&value), sizeof(T));
    }

    /**
     * Read data from the FIFO and panic on failure.
     *
     * @see tryGet()
     *
     * @param dst Pointer to a destination buffer
     * @param len Amount of data to read.
     */
    void get(uint8_t *dst, size_t len);

    template<typename T>
    T get() {
        T value;
        get(reinterpret_cast<uint8_t *>(&value), sizeof(T));
        return value;
    }

    /** Get the amount of data stored in the FIFO */
    size_t size() const { return buffer.size(); }
    /** Flush the FIFO */
    void flush() { buffer.flush(); }

    /** @} */
  public: // FIFO fill control
    /**
     * @{
     * @name FIFO fill control
     */
    /**
     * Start filling the FIFO.
     *
     * @warning It's considered an error to call start on an active DMA
     * engine unless the last request from the active block has been
     * sent (i.e., atEndOfBlock() is true).
     *
     * @param start Physical address to copy from.
     * @param size Size of the block to copy.
     */
    void startFill(Addr start, size_t size);

    /**
     * Stop the DMA engine.
     *
     * Stop filling the FIFO and ignore incoming responses for pending
     * requests. The onEndOfBlock() callback will not be called after
     * this method has been invoked. However, once the last response
     * has been received, the onIdle() callback will still be called.
     */
    void stopFill();

    /**
     * Has the DMA engine sent out the last request for the active
     * block?
     */
    bool atEndOfBlock() const {
        return nextAddr == endAddr;
    }

    /**
     * Is the DMA engine active (i.e., are there still in-flight
     * accesses)?
     */
    bool isActive() const {
        return !(pendingRequests.empty() && atEndOfBlock());
    }

    /** @} */
  protected: // Callbacks
    /**
     * @{
     * @name Callbacks
     */
    /**
     * End of block callback
     *
     * This callback is called <i>once</i> after the last access in a
     * block has been sent. It is legal for a derived class to call
     * startFill() from this method to initiate a transfer.
     */
    virtual void onEndOfBlock() {}
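
    /*
     * Example (an illustrative sketch; ChainedReadFifo, nextBlockAddr()
     * and blockSize are hypothetical): a derived engine that starts the
     * next block as soon as the last request of the current one has been
     * sent.
     *
     * \code{.cpp}
     * class ChainedReadFifo : public DmaReadFifo
     * {
     *   public:
     *     using DmaReadFifo::DmaReadFifo;
     *
     *   protected:
     *     void onEndOfBlock() override
     *     {
     *         // atEndOfBlock() is true when this callback runs, so a
     *         // new fill may be started immediately.
     *         startFill(nextBlockAddr(), blockSize);
     *     }
     * };
     * \endcode
     */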

    /**
     * Last response received callback
     *
     * This callback is called when the DMA engine becomes idle (i.e.,
     * there are no pending requests).
     *
     * It is possible for a DMA engine to reach the end of a block and
     * become idle at the same tick. In such a case, the onEndOfBlock()
     * callback will be called first. onIdle() will <i>NOT</i> be called
     * if that callback initiates a new DMA transfer.
     */
    virtual void onIdle() {}

    /** @} */
  private: // Configuration
    /** Maximum request size in bytes */
    const Addr maxReqSize;
    /** Maximum FIFO size in bytes */
    const size_t fifoSize;
    /** Request flags */
    const Request::Flags reqFlags;

    DmaPort &port;

  private:
    class DmaDoneEvent : public Event
    {
      public:
        DmaDoneEvent(DmaReadFifo *_parent, size_t max_size);

        void kill();
        void cancel();
        bool canceled() const { return _canceled; }
        void reset(size_t size);
        void process();

        bool done() const { return _done; }
        size_t requestSize() const { return _requestSize; }
        const uint8_t *data() const { return _data.data(); }
        uint8_t *data() { return _data.data(); }

      private:
        DmaReadFifo *parent;
        bool _done;
        bool _canceled;
        size_t _requestSize;
        std::vector<uint8_t> _data;
    };

    typedef std::unique_ptr<DmaDoneEvent> DmaDoneEventUPtr;

    /**
     * DMA request done, handle incoming data and issue a new
     * request.
     */
    void dmaDone();

    /** Handle pending requests that have been flagged as done. */
    void handlePending();

    /** Try to issue new DMA requests */
    void resumeFill();

  private: // Internal state
    Fifo<uint8_t> buffer;

    Addr nextAddr;
    Addr endAddr;

    std::deque<DmaDoneEventUPtr> pendingRequests;
    std::deque<DmaDoneEventUPtr> freeRequests;
};

#endif // __DEV_DMA_DEVICE_HH__