blob: 2b9f2510507b4c3faa0dab6dfc9223d461bc9eae [file] [log] [blame]
/*
 *  linux/boot/head.S
 *
 *  Copyright (C) 1991, 1992, 1993  Linus Torvalds
 */
6
/*
 *  head.S contains the 32-bit startup code.
 *
 * NOTE!!! Startup happens at absolute address 0x00001000, which is also where
 * the page directory will exist. The startup code will be overwritten by
 * the page directory. [According to comments etc elsewhere on a compressed
 * kernel it will end up at 0x1000 + 1Mb I hope so as I assume this. - AC]
 *
 * Page 0 is deliberately kept safe, since System Management Mode code in
 * laptops may need to access the BIOS data stored there. This is also
 * useful for future device drivers that access the BIOS via VM86 mode.
 */
20
/*
 * High loaded stuff by Hans Lermen & Werner Almesberger, Feb. 1996
 */
H. Peter Anvinb40d68d2009-05-08 15:59:13 -070024 .code32
25 .text
Linus Torvalds1da177e2005-04-16 15:20:36 -070026
27#include <linux/linkage.h>
28#include <asm/segment.h>
Jeremy Fitzhardinge0341c142009-02-13 11:14:01 -080029#include <asm/pgtable_types.h>
30#include <asm/page_types.h>
Alexander van Heukelum7c539762008-04-08 12:54:30 +020031#include <asm/boot.h>
Vivek Goyal1ab60e02007-05-02 19:27:07 +020032#include <asm/msr.h>
Cyrill Gorcunove83e31f42008-05-12 15:43:39 +020033#include <asm/processor-flags.h>
Eric W. Biedermanbd531472007-10-26 11:29:04 -060034#include <asm/asm-offsets.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035
H. Peter Anvinb40d68d2009-05-08 15:59:13 -070036 .section ".text.head"
Linus Torvalds1da177e2005-04-16 15:20:36 -070037 .code32
ENTRY(startup_32)
	/*
	 * 32-bit entry point.
	 *
	 * In:   %esi = base of the real-mode data block; it is read here
	 *              through BP_loadflags and BP_scratch.
	 * Out:  never returns.  Leaves through lret to startup_64 with
	 *       paging and long mode enabled.
	 */
	cld

	/*
	 * Bit 6 of loadflags is KEEP_SEGMENTS: if the boot loader set it,
	 * the segment registers must not be reloaded.
	 */
	testb	$(1<<6), BP_loadflags(%esi)
	jnz	2f

	cli
	movl	$(__KERNEL_DS), %eax
	movl	%eax, %ds
	movl	%eax, %es
	movl	%eax, %ss
2:

	/*
	 * Work out the difference between the address we were linked at
	 * and the address we are actually executing from.  On x86 the only
	 * way to read the current address is a short local call, which
	 * needs 4 bytes of stack: the scratch field of the real-mode data
	 * is borrowed for that.  Afterwards %ebp holds the delta.
	 */
	leal	(BP_scratch+4)(%esi), %esp
	call	3f
3:	popl	%ebp
	subl	$3b, %ebp

	/* Move onto the real boot stack, rebased by the load delta. */
	movl	$boot_stack_end, %eax
	addl	%ebp, %eax
	movl	%eax, %esp

	/* A non-zero %eax from verify_cpu sends us to no_longmode. */
	call	verify_cpu
	testl	%eax, %eax
	jnz	no_longmode

	/*
	 * %ebp is where the boot loader put us; %ebx becomes the address
	 * the image is temporarily moved to so that it can be decompressed
	 * in place safely.  For a relocatable kernel that is the load
	 * address rounded up to a PMD_PAGE_SIZE boundary, otherwise it is
	 * CONFIG_PHYSICAL_START; z_extract_offset is then added on top.
	 */
#ifdef CONFIG_RELOCATABLE
	movl	%ebp, %ebx
	addl	$(PMD_PAGE_SIZE - 1), %ebx
	andl	$PMD_PAGE_MASK, %ebx
#else
	movl	$CONFIG_PHYSICAL_START, %ebx
#endif

	addl	$z_extract_offset, %ebx

	/*
	 * Get ready for 64-bit mode.
	 */

	/*
	 * Patch the run-time address of gdt into its own base field
	 * (at gdt+2) and load it; it carries the 64-bit segments.
	 */
	leal	gdt(%ebp), %eax
	movl	%eax, gdt+2(%ebp)
	lgdt	gdt(%ebp)

	/* Turn on PAE: %cr4 is written with only X86_CR4_PAE set. */
	xorl	%eax, %eax
	orl	$(X86_CR4_PAE), %eax
	movl	%eax, %cr4

	/*
	 * Construct the early boot page tables (4G worth of 2M pages)
	 * in the six pages at pgtable, relative to %ebx.
	 */

	/* Clear all six pages first: (4096*6)/4 dwords of zero. */
	leal	pgtable(%ebx), %edi
	xorl	%eax, %eax
	movl	$((4096*6)/4), %ecx
	rep	stosl

	/* Level 4: entry 0 -> next page (pgtable + 0x1000), flags 0x007. */
	leal	pgtable + 0(%ebx), %edi
	leal	0x1007(%edi), %eax
	movl	%eax, 0(%edi)

	/* Level 3: four entries, one per following page, flags 0x007. */
	leal	pgtable + 0x1000(%ebx), %edi
	leal	0x1007(%edi), %eax
	movl	$4, %ecx
4:	movl	%eax, 0x00(%edi)
	addl	$0x00001000, %eax
	addl	$8, %edi
	decl	%ecx
	jnz	4b

	/* Level 2: 2048 entries, 2M apart from address 0, flags 0x183. */
	leal	pgtable + 0x2000(%ebx), %edi
	movl	$0x00000183, %eax
	movl	$2048, %ecx
5:	movl	%eax, 0(%edi)
	addl	$0x00200000, %eax
	addl	$8, %edi
	decl	%ecx
	jnz	5b

	/* Point %cr3 at the top-level table just built. */
	leal	pgtable(%ebx), %eax
	movl	%eax, %cr3

	/* Set the LME bit in EFER (Extended Feature Enable Register). */
	movl	$MSR_EFER, %ecx
	rdmsr
	btsl	$_EFER_LME, %eax
	wrmsr

	/*
	 * Prepare the far jump into 64-bit mode.
	 *
	 * Once paging is switched on we are in long mode, but still in
	 * 32-bit compatibility mode: EFER.LME = 1, CS.L = 0, CS.D = 1
	 * (and therefore EFER.LMA = 1).  Real 64-bit mode is entered by
	 * loading __KERNEL_CS, which has CS.L = 1, from the new gdt.
	 * Selector and target are pushed on our small stack so that
	 * lret can be used to perform that far jump.
	 */
	pushl	$__KERNEL_CS
	leal	startup_64(%ebp), %eax
	pushl	%eax

	/* Paging + protected mode on: this is what activates long mode. */
	movl	$(X86_CR0_PG | X86_CR0_PE), %eax
	movl	%eax, %cr0

	/* Leave 32-bit compatibility mode for 64-bit mode. */
	lret
ENDPROC(startup_32)
Vivek Goyal1ab60e02007-05-02 19:27:07 +0200175
no_longmode:
	/*
	 * Reached from startup_32 when verify_cpu reports a problem:
	 * this is not an x86-64 CPU, so halt forever.
	 */
2:	hlt
	jmp	2b

181
Thomas Gleixner250c2272007-10-11 11:17:24 +0200182#include "../../kernel/verify_cpu_64.S"
Vivek Goyala4831e02007-05-02 19:27:08 +0200183
H. Peter Anvinb40d68d2009-05-08 15:59:13 -0700184 /*
185 * Be careful here startup_64 needs to be at a predictable
Vivek Goyal1ab60e02007-05-02 19:27:07 +0200186 * address so I can export it in an ELF header. Bootloaders
187 * should look at the ELF header to find this address, as
188 * it may change in the future.
189 */
190 .code64
Vivek Goyala4831e02007-05-02 19:27:08 +0200191 .org 0x200
ENTRY(startup_64)
	/*
	 * 64-bit entry point.
	 *
	 * We come here either from startup_32 or directly from a
	 * 64bit bootloader.  If we come here from a bootloader we depend on
	 * an identity mapped page table being provided that maps our
	 * entire text+data+bss and hopefully all of memory.
	 *
	 * In:   %rsi = real mode argument; preserved across this routine
	 *              and consumed after the jump to relocated.
	 * Out:  never returns.  Jumps to the relocated copy with
	 *       %rbp = decompressed kernel start address,
	 *       %rbx = address the compressed image was moved to,
	 *       %rsp = boot_stack_end in the relocated image.
	 */

	/* Setup data segments: null selectors everywhere, no LDT. */
	xorl	%eax, %eax
	movl	%eax, %ds
	movl	%eax, %es
	movl	%eax, %ss
	movl	%eax, %fs
	movl	%eax, %gs
	lldt	%ax
	/* Selector 0x20 is the TS descriptor slot in this file's gdt. */
	movl	$0x20, %eax
	ltr	%ax

	/*
	 * Compute the decompressed kernel start address.  It is where
	 * we were loaded at aligned to a 2M boundary.  %rbp contains the
	 * decompressed kernel start address.
	 *
	 * If it is a relocatable kernel then decompress and run the kernel
	 * from load address aligned to 2MB addr, otherwise decompress and
	 * run the kernel from CONFIG_PHYSICAL_START
	 *
	 * We cannot rely on the calculation done in 32-bit mode, since we
	 * may have been invoked via the 64-bit entry point.
	 */

	/* Start with the delta to where the kernel will run at. */
#ifdef CONFIG_RELOCATABLE
	leaq	startup_32(%rip) /* - $startup_32 */, %rbp
	addq	$(PMD_PAGE_SIZE - 1), %rbp
	andq	$PMD_PAGE_MASK, %rbp
#else
	movq	$CONFIG_PHYSICAL_START, %rbp
#endif

	/*
	 * Target address to relocate to for decompression.  %rbx is
	 * written here for the first time: an earlier copy of %rbp into
	 * %rbx would be overwritten before being read, so none is made.
	 */
	leaq	z_extract_offset(%rbp), %rbx

	/* Set up the stack inside the relocated image */
	leaq	boot_stack_end(%rbx), %rsp

	/* Zero EFLAGS */
	pushq	$0
	popfq

/*
 * Copy the compressed kernel to the end of our buffer
 * where decompression in place becomes safe.
 *
 * Everything below _bss is copied as quadwords, backwards (DF set),
 * starting from the last quadword before _bss -- presumably because
 * source and destination may overlap.  %rsi is saved around the copy
 * because the string instruction uses it as the source pointer.
 */
	pushq	%rsi
	leaq	(_bss-8)(%rip), %rsi
	leaq	(_bss-8)(%rbx), %rdi
	movq	$_bss /* - $startup_32 */, %rcx
	shrq	$3, %rcx
	std
	rep	movsq
	cld
	popq	%rsi

/*
 * Jump to the relocated address.
 */
	leaq	relocated(%rbx), %rax
	jmp	*%rax
264
H. Peter Anvinb40d68d2009-05-08 15:59:13 -0700265 .text
relocated:
	/*
	 * Entered by an indirect jump from startup_64, now executing from
	 * the relocated copy of the image.
	 *
	 * In:   %rsi = real mode argument
	 *       %rbp = address the kernel is to be decompressed to
	 * Out:  never returns; ends by jumping to *%rbp with %rsi restored.
	 */

	/*
	 * Zero the BSS, from _bss up to _ebss, one quadword at a time.
	 * Nothing is live on the stack at this point.
	 */
	leaq	_bss(%rip), %rdi
	leaq	_ebss(%rip), %rcx
	xorl	%eax, %eax
	subq	%rdi, %rcx
	shrq	$3, %rcx
	rep	stosq

	/*
	 * Run the decompressor.  %rsi is kept on the stack across the
	 * call because it is reused as the second argument register.
	 */
	pushq	%rsi			/* Save the real mode argument */
	movq	%rbp, %r8		/* arg 5: output target address */
	movl	$z_input_len, %ecx	/* arg 4: input_len */
	leaq	input_data(%rip), %rdx	/* arg 3: input_data */
	movq	%rsi, %rdi		/* arg 1: real mode address */
	leaq	boot_heap(%rip), %rsi	/* arg 2: malloc area for uncompression */
	call	decompress_kernel
	popq	%rsi

	/*
	 * Hand over to the decompressed kernel.
	 */
	jmp	*%rbp
Linus Torvalds1da177e2005-04-16 15:20:36 -0700294
Vivek Goyal1ab60e02007-05-02 19:27:07 +0200295 .data
/*
 * Boot GDT.
 *
 * The first 8 bytes double as the pseudo-descriptor handed to lgdt
 * (16-bit limit followed by a 32-bit base, padded with a zero word).
 * startup_32 stores the run-time address of this table into the base
 * field at gdt+2 before executing lgdt, so the link-time value placed
 * there is only a placeholder.
 *
 * The limit is the offset of the last valid byte of the table, i.e.
 * its size minus one.
 *
 * Byte offsets: 0x08 NULL, 0x10 __KERNEL_CS, 0x18 __KERNEL_DS,
 * 0x20 TS descriptor (16 bytes, loaded with ltr in startup_64).
 */
gdt:
	.word	gdt_end - gdt - 1
	.long	gdt
	.word	0
	.quad	0x0000000000000000	/* NULL descriptor */
	.quad	0x00af9a000000ffff	/* __KERNEL_CS */
	.quad	0x00cf92000000ffff	/* __KERNEL_DS */
	.quad	0x0080890000000000	/* TS descriptor */
	.quad	0x0000000000000000	/* TS continued */
gdt_end:
Alexander van Heukelum7c539762008-04-08 12:54:30 +0200306
/*
 * Heap and stack used while uncompressing.
 *
 * boot_heap is BOOT_HEAP_SIZE bytes and is immediately followed by
 * BOOT_STACK_SIZE bytes of stack; boot_stack_end marks the end of the
 * stack area and is what the stack pointer is initialised to.
 */
	.bss
	.balign 4
boot_heap:
	.skip BOOT_HEAP_SIZE
boot_stack:
	.skip BOOT_STACK_SIZE
boot_stack_end:
H. Peter Anvin5b11f1c2009-05-08 16:20:34 -0700317
/*
 * Room for the early boot page tables: six page-aligned 4096-byte
 * pages.  Kept in its own section rather than .bss, so the BSS clear
 * does not touch it; startup_32 zeroes it explicitly before use.
 */
	.section ".pgtable","a",@nobits
	.balign 4096
pgtable:
	.skip 6*4096