Deleted Added
sdiff udiff text old ( 7720:65d338a8dba4 ) new ( 7901:f9b675da608a )
full compact
1/*
2 * Copyright (c) 2007 The Hewlett-Packard Development Company
3 * All rights reserved.
4 *
5 * The license below extends only to copyright in the software and shall
6 * not be construed as granting a license to any other intellectual
7 * property including but not limited to intellectual property relating
8 * to a hardware implementation of the functionality of the software
9 * licensed hereunder. You may use the software subject to the license
10 * terms below provided that you ensure that this notice is replicated
11 * unmodified and in its entirety in all distributions of the software,
12 * modified or unmodified, in source code or in binary form.
13 *
14 * Redistribution and use in source and binary forms, with or without
15 * modification, are permitted provided that the following conditions are
16 * met: redistributions of source code must retain the above copyright
17 * notice, this list of conditions and the following disclaimer;
18 * redistributions in binary form must reproduce the above copyright
19 * notice, this list of conditions and the following disclaimer in the
20 * documentation and/or other materials provided with the distribution;
21 * neither the name of the copyright holders nor the names of its
22 * contributors may be used to endorse or promote products derived from
23 * this software without specific prior written permission.
24 *
25 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
26 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
27 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
28 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
29 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
30 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
31 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
32 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
33 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
34 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
35 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
36 *
37 * Authors: Gabe Black
38 */
39
40#include "arch/x86/bios/smbios.hh"
41#include "arch/x86/bios/intelmp.hh"
42#include "arch/x86/regs/misc.hh"
43#include "arch/x86/system.hh"
44#include "arch/vtophys.hh"
45#include "base/intmath.hh"
46#include "base/loader/object_file.hh"
47#include "base/loader/symtab.hh"
48#include "base/trace.hh"
49#include "cpu/thread_context.hh"
50#include "mem/physical.hh"
51#include "params/X86System.hh"
52#include "sim/byteswap.hh"
53
54
55using namespace LittleEndianGuest;
56using namespace X86ISA;
57
58X86System::X86System(Params *p) :
59 System(p), smbiosTable(p->smbios_table),
60 mpFloatingPointer(p->intel_mp_pointer),
61 mpConfigTable(p->intel_mp_table),
62 rsdp(p->acpi_description_table_pointer)
63{
64 if (kernel->getArch() == ObjectFile::I386)
65 fatal("Loading a 32 bit x86 kernel is not supported.\n");
66}
67
68static void
69installSegDesc(ThreadContext *tc, SegmentRegIndex seg,
70 SegDescriptor desc, bool longmode)
71{
72 uint64_t base = desc.baseLow + (desc.baseHigh << 24);
73 bool honorBase = !longmode || seg == SEGMENT_REG_FS ||
74 seg == SEGMENT_REG_GS ||
75 seg == SEGMENT_REG_TSL ||
76 seg == SYS_SEGMENT_REG_TR;
77 uint64_t limit = desc.limitLow | (desc.limitHigh << 16);
78
79 SegAttr attr = 0;
80
81 attr.dpl = desc.dpl;
82 attr.unusable = 0;
83 attr.defaultSize = desc.d;
84 attr.longMode = desc.l;
85 attr.avl = desc.avl;
86 attr.granularity = desc.g;
87 attr.present = desc.p;
88 attr.system = desc.s;
89 attr.type = desc.type;
90 if (desc.s) {
91 if (desc.type.codeOrData) {
92 // Code segment
93 attr.expandDown = 0;
94 attr.readable = desc.type.r;
95 attr.writable = 0;
96 } else {
97 // Data segment
98 attr.expandDown = desc.type.e;
99 attr.readable = 1;
100 attr.writable = desc.type.w;
101 }
102 } else {
103 attr.readable = 1;
104 attr.writable = 1;
105 attr.expandDown = 0;
106 }
107
108 tc->setMiscReg(MISCREG_SEG_BASE(seg), base);
109 tc->setMiscReg(MISCREG_SEG_EFF_BASE(seg), honorBase ? base : 0);
110 tc->setMiscReg(MISCREG_SEG_LIMIT(seg), limit);
111 tc->setMiscReg(MISCREG_SEG_ATTR(seg), (MiscReg)attr);
112}
113
114void
115X86System::initState()
116{
117 System::initState();
118
119 ThreadContext *tc = threadContexts[0];
120 // This is the boot strap processor (BSP). Initialize it to look like
121 // the boot loader has just turned control over to the 64 bit OS. We
122 // won't actually set up real mode or legacy protected mode descriptor
123 // tables because we aren't executing any code that would require
124 // them. We do, however toggle the control bits in the correct order
125 // while allowing consistency checks and the underlying mechansims
126 // just to be safe.
127
128 const int NumPDTs = 4;
129
130 const Addr PageMapLevel4 = 0x70000;
131 const Addr PageDirPtrTable = 0x71000;
132 const Addr PageDirTable[NumPDTs] =
133 {0x72000, 0x73000, 0x74000, 0x75000};
134 const Addr GDTBase = 0x76000;
135
136 const int PML4Bits = 9;
137 const int PDPTBits = 9;
138 const int PDTBits = 9;
139
140 // Get a port to write the page tables and descriptor tables.
141 FunctionalPort * physPort = tc->getPhysPort();
142
143 /*
144 * Set up the gdt.
145 */
146 uint8_t numGDTEntries = 0;
147 // Place holder at selector 0
148 uint64_t nullDescriptor = 0;
149 physPort->writeBlob(GDTBase + numGDTEntries * 8,
150 (uint8_t *)(&nullDescriptor), 8);
151 numGDTEntries++;
152
153 //64 bit code segment
154 SegDescriptor csDesc = 0;
155 csDesc.type.codeOrData = 1;
156 csDesc.type.c = 0; // Not conforming
157 csDesc.type.r = 1; // Readable
158 csDesc.dpl = 0; // Privelege level 0
159 csDesc.p = 1; // Present
160 csDesc.l = 1; // 64 bit
161 csDesc.d = 0; // default operand size
162 csDesc.g = 1; // Page granularity
163 csDesc.s = 1; // Not a system segment
164 csDesc.limitHigh = 0xF;
165 csDesc.limitLow = 0xFF;
166 //Because we're dealing with a pointer and I don't think it's
167 //guaranteed that there isn't anything in a nonvirtual class between
168 //it's beginning in memory and it's actual data, we'll use an
169 //intermediary.
170 uint64_t csDescVal = csDesc;
171 physPort->writeBlob(GDTBase + numGDTEntries * 8,
172 (uint8_t *)(&csDescVal), 8);
173
174 numGDTEntries++;
175
176 SegSelector cs = 0;
177 cs.si = numGDTEntries - 1;
178
179 tc->setMiscReg(MISCREG_CS, (MiscReg)cs);
180
181 //32 bit data segment
182 SegDescriptor dsDesc = 0;
183 dsDesc.type.codeOrData = 0;
184 dsDesc.type.e = 0; // Not expand down
185 dsDesc.type.w = 1; // Writable
186 dsDesc.dpl = 0; // Privelege level 0
187 dsDesc.p = 1; // Present
188 dsDesc.d = 1; // default operand size
189 dsDesc.g = 1; // Page granularity
190 dsDesc.s = 1; // Not a system segment
191 dsDesc.limitHigh = 0xF;
192 dsDesc.limitLow = 0xFF;
193 uint64_t dsDescVal = dsDesc;
194 physPort->writeBlob(GDTBase + numGDTEntries * 8,
195 (uint8_t *)(&dsDescVal), 8);
196
197 numGDTEntries++;
198
199 SegSelector ds = 0;
200 ds.si = numGDTEntries - 1;
201
202 tc->setMiscReg(MISCREG_DS, (MiscReg)ds);
203 tc->setMiscReg(MISCREG_ES, (MiscReg)ds);
204 tc->setMiscReg(MISCREG_FS, (MiscReg)ds);
205 tc->setMiscReg(MISCREG_GS, (MiscReg)ds);
206 tc->setMiscReg(MISCREG_SS, (MiscReg)ds);
207
208 tc->setMiscReg(MISCREG_TSL, 0);
209 tc->setMiscReg(MISCREG_TSG_BASE, GDTBase);
210 tc->setMiscReg(MISCREG_TSG_LIMIT, 8 * numGDTEntries - 1);
211
212 SegDescriptor tssDesc = 0;
213 tssDesc.type = 0xB;
214 tssDesc.dpl = 0; // Privelege level 0
215 tssDesc.p = 1; // Present
216 tssDesc.d = 1; // default operand size
217 tssDesc.g = 1; // Page granularity
218 tssDesc.s = 1; // Not a system segment
219 tssDesc.limitHigh = 0xF;
220 tssDesc.limitLow = 0xFF;
221 uint64_t tssDescVal = tssDesc;
222 physPort->writeBlob(GDTBase + numGDTEntries * 8,
223 (uint8_t *)(&tssDescVal), 8);
224
225 numGDTEntries++;
226
227 SegSelector tss = 0;
228 tss.si = numGDTEntries - 1;
229
230 tc->setMiscReg(MISCREG_TR, (MiscReg)tss);
231 installSegDesc(tc, SYS_SEGMENT_REG_TR, tssDesc, true);
232
233 /*
234 * Identity map the first 4GB of memory. In order to map this region
235 * of memory in long mode, there needs to be one actual page map level
236 * 4 entry which points to one page directory pointer table which
237 * points to 4 different page directory tables which are full of two
238 * megabyte pages. All of the other entries in valid tables are set
239 * to indicate that they don't pertain to anything valid and will
240 * cause a fault if used.
241 */
242
243 // Put valid values in all of the various table entries which indicate
244 // that those entries don't point to further tables or pages. Then
245 // set the values of those entries which are needed.
246
247 // Page Map Level 4
248
249 // read/write, user, not present
250 uint64_t pml4e = X86ISA::htog(0x6);
251 for (int offset = 0; offset < (1 << PML4Bits) * 8; offset += 8) {
252 physPort->writeBlob(PageMapLevel4 + offset, (uint8_t *)(&pml4e), 8);
253 }
254 // Point to the only PDPT
255 pml4e = X86ISA::htog(0x7 | PageDirPtrTable);
256 physPort->writeBlob(PageMapLevel4, (uint8_t *)(&pml4e), 8);
257
258 // Page Directory Pointer Table
259
260 // read/write, user, not present
261 uint64_t pdpe = X86ISA::htog(0x6);
262 for (int offset = 0; offset < (1 << PDPTBits) * 8; offset += 8) {
263 physPort->writeBlob(PageDirPtrTable + offset,
264 (uint8_t *)(&pdpe), 8);
265 }
266 // Point to the PDTs
267 for (int table = 0; table < NumPDTs; table++) {
268 pdpe = X86ISA::htog(0x7 | PageDirTable[table]);
269 physPort->writeBlob(PageDirPtrTable + table * 8,
270 (uint8_t *)(&pdpe), 8);
271 }
272
273 // Page Directory Tables
274
275 Addr base = 0;
276 const Addr pageSize = 2 << 20;
277 for (int table = 0; table < NumPDTs; table++) {
278 for (int offset = 0; offset < (1 << PDTBits) * 8; offset += 8) {
279 // read/write, user, present, 4MB
280 uint64_t pdte = X86ISA::htog(0x87 | base);
281 physPort->writeBlob(PageDirTable[table] + offset,
282 (uint8_t *)(&pdte), 8);
283 base += pageSize;
284 }
285 }
286
287 /*
288 * Transition from real mode all the way up to Long mode
289 */
290 CR0 cr0 = tc->readMiscRegNoEffect(MISCREG_CR0);
291 //Turn off paging.
292 cr0.pg = 0;
293 tc->setMiscReg(MISCREG_CR0, cr0);
294 //Turn on protected mode.
295 cr0.pe = 1;
296 tc->setMiscReg(MISCREG_CR0, cr0);
297
298 CR4 cr4 = tc->readMiscRegNoEffect(MISCREG_CR4);
299 //Turn on pae.
300 cr4.pae = 1;
301 tc->setMiscReg(MISCREG_CR4, cr4);
302
303 //Point to the page tables.
304 tc->setMiscReg(MISCREG_CR3, PageMapLevel4);
305
306 Efer efer = tc->readMiscRegNoEffect(MISCREG_EFER);
307 //Enable long mode.
308 efer.lme = 1;
309 tc->setMiscReg(MISCREG_EFER, efer);
310
311 //Start using longmode segments.
312 installSegDesc(tc, SEGMENT_REG_CS, csDesc, true);
313 installSegDesc(tc, SEGMENT_REG_DS, dsDesc, true);
314 installSegDesc(tc, SEGMENT_REG_ES, dsDesc, true);
315 installSegDesc(tc, SEGMENT_REG_FS, dsDesc, true);
316 installSegDesc(tc, SEGMENT_REG_GS, dsDesc, true);
317 installSegDesc(tc, SEGMENT_REG_SS, dsDesc, true);
318
319 //Activate long mode.
320 cr0.pg = 1;
321 tc->setMiscReg(MISCREG_CR0, cr0);
322
323 tc->pcState(tc->getSystemPtr()->kernelEntry);
324
325 // We should now be in long mode. Yay!
326
327 Addr ebdaPos = 0xF0000;
328 Addr fixed, table;
329
330 //Write out the SMBios/DMI table
331 writeOutSMBiosTable(ebdaPos, fixed, table);
332 ebdaPos += (fixed + table);
333 ebdaPos = roundUp(ebdaPos, 16);
334
335 //Write out the Intel MP Specification configuration table
336 writeOutMPTable(ebdaPos, fixed, table);
337 ebdaPos += (fixed + table);
338}
339
340void
341X86System::writeOutSMBiosTable(Addr header,
342 Addr &headerSize, Addr &structSize, Addr table)
343{
344 // Get a port to write the table and header to memory.
345 FunctionalPort * physPort = threadContexts[0]->getPhysPort();
346
347 // If the table location isn't specified, just put it after the header.
348 // The header size as of the 2.5 SMBios specification is 0x1F bytes
349 if (!table)
350 table = header + 0x1F;
351 smbiosTable->setTableAddr(table);
352
353 smbiosTable->writeOut(physPort, header, headerSize, structSize);
354
355 // Do some bounds checking to make sure we at least didn't step on
356 // ourselves.
357 assert(header > table || header + headerSize <= table);
358 assert(table > header || table + structSize <= header);
359}
360
361void
362X86System::writeOutMPTable(Addr fp,
363 Addr &fpSize, Addr &tableSize, Addr table)
364{
365 // Get a port to write the table and header to memory.
366 FunctionalPort * physPort = threadContexts[0]->getPhysPort();
367
368 // If the table location isn't specified and it exists, just put
369 // it after the floating pointer. The fp size as of the 1.4 Intel MP
370 // specification is 0x10 bytes.
371 if (mpConfigTable) {
372 if (!table)
373 table = fp + 0x10;
374 mpFloatingPointer->setTableAddr(table);
375 }
376
377 fpSize = mpFloatingPointer->writeOut(physPort, fp);
378 if (mpConfigTable)
379 tableSize = mpConfigTable->writeOut(physPort, table);
380 else
381 tableSize = 0;
382
383 // Do some bounds checking to make sure we at least didn't step on
384 // ourselves and the fp structure was the size we thought it was.
385 assert(fp > table || fp + fpSize <= table);
386 assert(table > fp || table + tableSize <= fp);
387 assert(fpSize == 0x10);
388}
389
390
391X86System::~X86System()
392{
393 delete smbiosTable;
394}
395
396void
397X86System::serialize(std::ostream &os)
398{
399 System::serialize(os);
400}
401
402
403void
404X86System::unserialize(Checkpoint *cp, const std::string &section)
405{
406 System::unserialize(cp,section);
407}
408
409X86System *
410X86SystemParams::create()
411{
412 return new X86System(this);
413}