DRAMCtrl.py revision 10146
19569SN/A# Copyright (c) 2012-2013 ARM Limited
29243SN/A# All rights reserved.
39243SN/A#
49243SN/A# The license below extends only to copyright in the software and shall
59243SN/A# not be construed as granting a license to any other intellectual
69243SN/A# property including but not limited to intellectual property relating
79243SN/A# to a hardware implementation of the functionality of the software
89243SN/A# licensed hereunder.  You may use the software subject to the license
99243SN/A# terms below provided that you ensure that this notice is replicated
109243SN/A# unmodified and in its entirety in all distributions of the software,
119243SN/A# modified or unmodified, in source code or in binary form.
129243SN/A#
139831SN/A# Copyright (c) 2013 Amin Farmahini-Farahani
149831SN/A# All rights reserved.
159831SN/A#
169243SN/A# Redistribution and use in source and binary forms, with or without
179243SN/A# modification, are permitted provided that the following conditions are
189243SN/A# met: redistributions of source code must retain the above copyright
199243SN/A# notice, this list of conditions and the following disclaimer;
209243SN/A# redistributions in binary form must reproduce the above copyright
219243SN/A# notice, this list of conditions and the following disclaimer in the
229243SN/A# documentation and/or other materials provided with the distribution;
239243SN/A# neither the name of the copyright holders nor the names of its
249243SN/A# contributors may be used to endorse or promote products derived from
259243SN/A# this software without specific prior written permission.
269243SN/A#
279243SN/A# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
289243SN/A# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
299243SN/A# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
309243SN/A# A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
319243SN/A# OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
329243SN/A# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
339243SN/A# LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
349243SN/A# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
359243SN/A# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
369243SN/A# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
379243SN/A# OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
389243SN/A#
399243SN/A# Authors: Andreas Hansson
409243SN/A#          Ani Udipi
419243SN/A
429243SN/Afrom m5.params import *
439243SN/Afrom AbstractMemory import *
449243SN/A
459243SN/A# Enum for memory scheduling algorithms, currently First-Come
469243SN/A# First-Served and a First-Row Hit then First-Come First-Served
479243SN/Aclass MemSched(Enum): vals = ['fcfs', 'frfcfs']
489243SN/A
4910136SN/A# Enum for the address mapping. With Ch, Ra, Ba, Ro and Co denoting
5010136SN/A# channel, rank, bank, row and column, respectively, and going from
5110136SN/A# MSB to LSB.  Available are RoRaBaChCo and RoRaBaCoCh, that are
5210136SN/A# suitable for an open-page policy, optimising for sequential accesses
5310136SN/A# hitting in the open row. For a closed-page policy, RoCoRaBaCh
5410136SN/A# maximises parallelism.
5510136SN/Aclass AddrMap(Enum): vals = ['RoRaBaChCo', 'RoRaBaCoCh', 'RoCoRaBaCh']
569243SN/A
5710144SN/A# Enum for the page policy, either open, open_adaptive, close, or
5810144SN/A# close_adaptive.
5910144SN/Aclass PageManage(Enum): vals = ['open', 'open_adaptive', 'close',
6010144SN/A                                'close_adaptive']
619243SN/A
6210146Sandreas.hansson@arm.com# DRAMCtrl is a single-channel single-ported DRAM controller model
639243SN/A# that aims to model the most important system-level performance
649243SN/A# effects of a DRAM without getting into too much detail of the DRAM
659243SN/A# itself.
6610146Sandreas.hansson@arm.comclass DRAMCtrl(AbstractMemory):
6710146Sandreas.hansson@arm.com    type = 'DRAMCtrl'
6810146Sandreas.hansson@arm.com    cxx_header = "mem/dram_ctrl.hh"
699243SN/A
709243SN/A    # single-ported on the system interface side, instantiate with a
719243SN/A    # bus in front of the controller for multiple ports
729243SN/A    port = SlavePort("Slave port")
739243SN/A
749243SN/A    # the basic configuration of the controller architecture
7510145SN/A    write_buffer_size = Param.Unsigned(64, "Number of write queue entries")
769972SN/A    read_buffer_size = Param.Unsigned(32, "Number of read queue entries")
779243SN/A
7810140SN/A    # threshold in percent for when to forcefully trigger writes and
7910140SN/A    # start emptying the write buffer
8010140SN/A    write_high_thresh_perc = Param.Percent(85, "Threshold to force writes")
819972SN/A
8210140SN/A    # threshold in percentage for when to start writes if the read
8310140SN/A    # queue is empty
8410140SN/A    write_low_thresh_perc = Param.Percent(50, "Threshold to start writes")
8510140SN/A
8610140SN/A    # minimum write bursts to schedule before switching back to reads
8710140SN/A    min_writes_per_switch = Param.Unsigned(16, "Minimum write bursts before "
8810140SN/A                                           "switching to reads")
899243SN/A
909243SN/A    # scheduler, address map and page policy
919489SN/A    mem_sched_policy = Param.MemSched('frfcfs', "Memory scheduling policy")
9210136SN/A    addr_mapping = Param.AddrMap('RoRaBaChCo', "Address mapping policy")
9310145SN/A    page_policy = Param.PageManage('open_adaptive', "Page management policy")
949243SN/A
9510141SN/A    # enforce a limit on the number of accesses per row
9610141SN/A    max_accesses_per_row = Param.Unsigned(16, "Max accesses per row before "
9710141SN/A                                          "closing");
9810141SN/A
999726SN/A    # pipeline latency of the controller and PHY, split into a
1009726SN/A    # frontend part and a backend part, with reads and writes serviced
1019726SN/A    # by the queues only seeing the frontend contribution, and reads
1029726SN/A    # serviced by the memory seeing the sum of the two
1039726SN/A    static_frontend_latency = Param.Latency("10ns", "Static frontend latency")
1049726SN/A    static_backend_latency = Param.Latency("10ns", "Static backend latency")
1059726SN/A
1069489SN/A    # the physical organisation of the DRAM
1079831SN/A    device_bus_width = Param.Unsigned("data bus width in bits for each DRAM "\
1089831SN/A                                      "device/chip")
1099831SN/A    burst_length = Param.Unsigned("Burst lenght (BL) in beats")
1109831SN/A    device_rowbuffer_size = Param.MemorySize("Page (row buffer) size per "\
1119831SN/A                                           "device/chip")
1129831SN/A    devices_per_rank = Param.Unsigned("Number of devices/chips per rank")
1139489SN/A    ranks_per_channel = Param.Unsigned("Number of ranks per channel")
1149489SN/A    banks_per_rank = Param.Unsigned("Number of banks per rank")
1159566SN/A    # only used for the address mapping as the controller by
1169566SN/A    # construction is a single channel and multiple controllers have
1179566SN/A    # to be instantiated for a multi-channel configuration
1189566SN/A    channels = Param.Unsigned(1, "Number of channels")
1199489SN/A
1209243SN/A    # timing behaviour and constraints - all in nanoseconds
1219243SN/A
1229243SN/A    # the amount of time in nanoseconds from issuing an activate command
1239243SN/A    # to the data being available in the row buffer for a read/write
1249489SN/A    tRCD = Param.Latency("RAS to CAS delay")
1259243SN/A
1269243SN/A    # the time from issuing a read/write command to seeing the actual data
1279489SN/A    tCL = Param.Latency("CAS latency")
1289243SN/A
1299243SN/A    # minimum time between a precharge and subsequent activate
1309489SN/A    tRP = Param.Latency("Row precharge time")
1319243SN/A
1329963SN/A    # minimum time between an activate and a precharge to the same row
1339963SN/A    tRAS = Param.Latency("ACT to PRE delay")
1349963SN/A
1359243SN/A    # time to complete a burst transfer, typically the burst length
1369243SN/A    # divided by two due to the DDR bus, but by making it a parameter
1379243SN/A    # it is easier to also evaluate SDR memories like WideIO.
1389831SN/A    # This parameter has to account for burst length.
1399831SN/A    # Read/Write requests with data size larger than one full burst are broken
14010146Sandreas.hansson@arm.com    # down into multiple requests in the controller
1419489SN/A    tBURST = Param.Latency("Burst duration (for DDR burst length / 2 cycles)")
1429243SN/A
1439243SN/A    # time taken to complete one refresh cycle (N rows in all banks)
1449489SN/A    tRFC = Param.Latency("Refresh cycle time")
1459243SN/A
1469243SN/A    # refresh command interval, how often a "ref" command needs
1479243SN/A    # to be sent. It is 7.8 us for a 64ms refresh requirement
1489489SN/A    tREFI = Param.Latency("Refresh command interval")
1499243SN/A
1509243SN/A    # write-to-read turn around penalty, assumed same as read-to-write
1519489SN/A    tWTR = Param.Latency("Write to read switching time")
1529243SN/A
1539971SN/A    # minimum row activate to row activate delay time
1549971SN/A    tRRD = Param.Latency("ACT to ACT delay")
1559971SN/A
1569488SN/A    # time window in which a maximum number of activates are allowed
1579488SN/A    # to take place, set to 0 to disable
1589489SN/A    tXAW = Param.Latency("X activation window")
1599489SN/A    activation_limit = Param.Unsigned("Max number of activates in window")
1609488SN/A
1619488SN/A    # Currently rolled into other params
1629243SN/A    ######################################################################
1639243SN/A
1649963SN/A    # tRC  - assumed to be tRAS + tRP
1659243SN/A
1669728SN/A# A single DDR3 x64 interface (one command and address bus), with
1679728SN/A# default timings based on DDR3-1600 4 Gbit parts in an 8x8
1689728SN/A# configuration, which would amount to 4 Gbyte of memory.
16910146Sandreas.hansson@arm.comclass DDR3_1600_x64(DRAMCtrl):
1709831SN/A    # 8x8 configuration, 8 devices each with an 8-bit interface
1719831SN/A    device_bus_width = 8
1729831SN/A
1739831SN/A    # DDR3 is a BL8 device
1749831SN/A    burst_length = 8
1759831SN/A
1769831SN/A    # Each device has a page (row buffer) size of 1KB
1779728SN/A    # (this depends on the memory density)
1789831SN/A    device_rowbuffer_size = '1kB'
1799831SN/A
1809831SN/A    # 8x8 configuration, so 8 devices
1819831SN/A    devices_per_rank = 8
1829489SN/A
1839489SN/A    # Use two ranks
1849489SN/A    ranks_per_channel = 2
1859489SN/A
1869489SN/A    # DDR3 has 8 banks in all configurations
1879489SN/A    banks_per_rank = 8
1889489SN/A
1899970SN/A    # DDR3-1600 11-11-11-28
1909489SN/A    tRCD = '13.75ns'
1919489SN/A    tCL = '13.75ns'
1929489SN/A    tRP = '13.75ns'
1939970SN/A    tRAS = '35ns'
1949489SN/A
1959831SN/A    # 8 beats across an x64 interface translates to 4 clocks @ 800 MHz.
1969831SN/A    # Note this is a BL8 DDR device.
1979489SN/A    tBURST = '5ns'
1989489SN/A
1999728SN/A    # DDR3, 4 Gbit has a tRFC of 240 CK and tCK = 1.25 ns
2009489SN/A    tRFC = '300ns'
2019489SN/A
2029489SN/A    # DDR3, <=85C, half for >85C
2039489SN/A    tREFI = '7.8us'
2049489SN/A
2059489SN/A    # Greater of 4 CK or 7.5 ns, 4 CK @ 800 MHz = 5 ns
2069489SN/A    tWTR = '7.5ns'
2079489SN/A
2089971SN/A    # Assume 5 CK for activate to activate for different banks
2099971SN/A    tRRD = '6.25ns'
2109971SN/A
2119489SN/A    # With a 2kbyte page size, DDR3-1600 lands around 40 ns
2129489SN/A    tXAW = '40ns'
2139489SN/A    activation_limit = 4
2149489SN/A
2159489SN/A
21610137SN/A# A single DDR3 x64 interface (one command and address bus), with
21710137SN/A# default timings based on DDR3-1333 4 Gbit parts in an 8x8
21810137SN/A# configuration, which would amount to 4 GByte of memory.  This
21910137SN/A# configuration is primarily for comparing with DRAMSim2, and all the
22010137SN/A# parameters except ranks_per_channel are based on the DRAMSim2 config
22110137SN/A# file DDR3_micron_32M_8B_x8_sg15.ini. Note that ranks_per_channel has
22210137SN/A# to be manually set, depending on size of the memory to be
22310137SN/A# simulated. By default DRAMSim2 has 2048MB of memory with a single
22410137SN/A# rank. Therefore for 4 GByte memory, set ranks_per_channel = 2
22510146Sandreas.hansson@arm.comclass DDR3_1333_x64_DRAMSim2(DRAMCtrl):
22610137SN/A    # 8x8 configuration, 8 devices each with an 8-bit interface
22710137SN/A    device_bus_width = 8
22810137SN/A
22910137SN/A    # DDR3 is a BL8 device
23010137SN/A    burst_length = 8
23110137SN/A
23210137SN/A    # Each device has a page (row buffer) size of 1KB
23310137SN/A    # (this depends on the memory density)
23410137SN/A    device_rowbuffer_size = '1kB'
23510137SN/A
23610137SN/A    # 8x8 configuration, so 8 devices
23710137SN/A    devices_per_rank = 8
23810137SN/A
23910137SN/A    # Use two ranks
24010137SN/A    ranks_per_channel = 2
24110137SN/A
24210137SN/A    # DDR3 has 8 banks in all configurations
24310137SN/A    banks_per_rank = 8
24410137SN/A
24510137SN/A    tRCD = '15ns'
24610137SN/A    tCL = '15ns'
24710137SN/A    tRP = '15ns'
24810137SN/A    tRAS = '36ns'
24910137SN/A
25010137SN/A    # 8 beats across an x64 interface translates to 4 clocks @ 666.66 MHz.
25110137SN/A    # Note this is a BL8 DDR device.
25210137SN/A    tBURST = '6ns'
25310137SN/A
25410137SN/A    tRFC = '160ns'
25510137SN/A
25610137SN/A    # DDR3, <=85C, half for >85C
25710137SN/A    tREFI = '7.8us'
25810137SN/A
25910137SN/A    # Greater of 4 CK or 7.5 ns, 4 CK @ 666.66 MHz = 6 ns
26010137SN/A    tWTR = '7.5ns'
26110137SN/A
26210137SN/A    tRRD = '6.0ns'
26310137SN/A
26410137SN/A    tXAW = '30ns'
26510137SN/A    activation_limit = 4
26610137SN/A
26710137SN/A
2689728SN/A# A single LPDDR2-S4 x32 interface (one command/address bus), with
2699728SN/A# default timings based on a LPDDR2-1066 4 Gbit part in a 1x32
2709728SN/A# configuration.
27110146Sandreas.hansson@arm.comclass LPDDR2_S4_1066_x32(DRAMCtrl):
2729831SN/A    # 1x32 configuration, 1 device with a 32-bit interface
2739831SN/A    device_bus_width = 32
2749831SN/A
2759831SN/A    # LPDDR2_S4 is a BL4 and BL8 device
2769831SN/A    burst_length = 8
2779831SN/A
2789831SN/A    # Each device has a page (row buffer) size of 1KB
2799831SN/A    # (this depends on the memory density)
2809831SN/A    device_rowbuffer_size = '1kB'
2819831SN/A
2829831SN/A    # 1x32 configuration, so 1 device
2839831SN/A    devices_per_rank = 1
2849489SN/A
2859708SN/A    # Use a single rank
2869708SN/A    ranks_per_channel = 1
2879489SN/A
2889489SN/A    # LPDDR2-S4 has 8 banks in all configurations
2899489SN/A    banks_per_rank = 8
2909489SN/A
2919489SN/A    # Fixed at 15 ns
2929489SN/A    tRCD = '15ns'
2939489SN/A
2949489SN/A    # 8 CK read latency, 4 CK write latency @ 533 MHz, 1.876 ns cycle time
2959489SN/A    tCL = '15ns'
2969489SN/A
2979728SN/A    # Pre-charge one bank 15 ns (all banks 18 ns)
2989728SN/A    tRP = '15ns'
2999489SN/A
3009970SN/A    tRAS = '42ns'
3019963SN/A
3029831SN/A    # 8 beats across an x32 DDR interface translates to 4 clocks @ 533 MHz.
3039831SN/A    # Note this is a BL8 DDR device.
3049831SN/A    # Requests larger than 32 bytes are broken down into multiple requests
30510146Sandreas.hansson@arm.com    # in the controller
3069831SN/A    tBURST = '7.5ns'
3079489SN/A
3089708SN/A    # LPDDR2-S4, 4 Gbit
3099489SN/A    tRFC = '130ns'
3109489SN/A    tREFI = '3.9us'
3119489SN/A
3129489SN/A    # Irrespective of speed grade, tWTR is 7.5 ns
3139489SN/A    tWTR = '7.5ns'
3149489SN/A
3159971SN/A    # Activate to activate irrespective of density and speed grade
3169971SN/A    tRRD = '10.0ns'
3179971SN/A
3189708SN/A    # Irrespective of density, tFAW is 50 ns
3199489SN/A    tXAW = '50ns'
3209489SN/A    activation_limit = 4
3219664SN/A
3229728SN/A# A single WideIO x128 interface (one command and address bus), with
3239728SN/A# default timings based on an estimated WIO-200 8 Gbit part.
32410146Sandreas.hansson@arm.comclass WideIO_200_x128(DRAMCtrl):
3259831SN/A    # 1x128 configuration, 1 device with a 128-bit interface
3269831SN/A    device_bus_width = 128
3279831SN/A
3289831SN/A    # This is a BL4 device
3299831SN/A    burst_length = 4
3309831SN/A
3319831SN/A    # Each device has a page (row buffer) size of 4KB
3329831SN/A    # (this depends on the memory density)
3339831SN/A    device_rowbuffer_size = '4kB'
3349831SN/A
3359831SN/A    # 1x128 configuration, so 1 device
3369831SN/A    devices_per_rank = 1
3379664SN/A
3389664SN/A    # Use one rank for a one-high die stack
3399664SN/A    ranks_per_channel = 1
3409664SN/A
3419664SN/A    # WideIO has 4 banks in all configurations
3429664SN/A    banks_per_rank = 4
3439664SN/A
3449664SN/A    # WIO-200
3459664SN/A    tRCD = '18ns'
3469664SN/A    tCL = '18ns'
3479664SN/A    tRP = '18ns'
3489970SN/A    tRAS = '42ns'
3499664SN/A
3509831SN/A    # 4 beats across an x128 SDR interface translates to 4 clocks @ 200 MHz.
3519831SN/A    # Note this is a BL4 SDR device.
3529664SN/A    tBURST = '20ns'
3539664SN/A
3549664SN/A    # WIO 8 Gb
3559664SN/A    tRFC = '210ns'
3569664SN/A
3579664SN/A    # WIO 8 Gb, <=85C, half for >85C
3589664SN/A    tREFI = '3.9us'
3599664SN/A
3609664SN/A    # Greater of 2 CK or 15 ns, 2 CK @ 200 MHz = 10 ns
3619664SN/A    tWTR = '15ns'
3629664SN/A
3639971SN/A    # Activate to activate irrespective of density and speed grade
3649971SN/A    tRRD = '10.0ns'
3659971SN/A
3669664SN/A    # Two instead of four activation window
3679664SN/A    tXAW = '50ns'
3689664SN/A    activation_limit = 2
3699709SN/A
3709728SN/A# A single LPDDR3 x32 interface (one command/address bus), with
3719728SN/A# default timings based on a LPDDR3-1600 4 Gbit part in a 1x32
3729728SN/A# configuration
37310146Sandreas.hansson@arm.comclass LPDDR3_1600_x32(DRAMCtrl):
3749831SN/A    # 1x32 configuration, 1 device with a 32-bit interface
3759831SN/A    device_bus_width = 32
3769831SN/A
3779831SN/A    # LPDDR3 is a BL8 device
3789831SN/A    burst_length = 8
3799831SN/A
3809976SN/A    # Each device has a page (row buffer) size of 4KB
3819976SN/A    device_rowbuffer_size = '4kB'
3829831SN/A
3839831SN/A    # 1x32 configuration, so 1 device
3849831SN/A    devices_per_rank = 1
3859709SN/A
3869709SN/A    # Use a single rank
3879709SN/A    ranks_per_channel = 1
3889709SN/A
3899709SN/A    # LPDDR3 has 8 banks in all configurations
3909709SN/A    banks_per_rank = 8
3919709SN/A
3929709SN/A    # Fixed at 15 ns
3939709SN/A    tRCD = '15ns'
3949709SN/A
3959709SN/A    # 12 CK read latency, 6 CK write latency @ 800 MHz, 1.25 ns cycle time
3969709SN/A    tCL = '15ns'
3979709SN/A
3989970SN/A    tRAS = '42ns'
3999963SN/A
4009728SN/A    # Pre-charge one bank 15 ns (all banks 18 ns)
4019728SN/A    tRP = '15ns'
4029709SN/A
4039831SN/A    # 8 beats across a x32 DDR interface translates to 4 clocks @ 800 MHz.
4049831SN/A    # Note this is a BL8 DDR device.
4059831SN/A    # Requests larger than 32 bytes are broken down into multiple requests
40610146Sandreas.hansson@arm.com    # in the controller
4079831SN/A    tBURST = '5ns'
4089709SN/A
4099709SN/A    # LPDDR3, 4 Gb
4109709SN/A    tRFC = '130ns'
4119709SN/A    tREFI = '3.9us'
4129709SN/A
4139709SN/A    # Irrespective of speed grade, tWTR is 7.5 ns
4149709SN/A    tWTR = '7.5ns'
4159709SN/A
4169971SN/A    # Activate to activate irrespective of density and speed grade
4179971SN/A    tRRD = '10.0ns'
4189971SN/A
4199709SN/A    # Irrespective of size, tFAW is 50 ns
4209709SN/A    tXAW = '50ns'
4219709SN/A    activation_limit = 4
422