blob: 06cc7e59352b9df8b4a833acbb130e285c446341 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * linux/boot/head.S
3 *
4 * Copyright (C) 1991, 1992, 1993 Linus Torvalds
Linus Torvalds1da177e2005-04-16 15:20:36 -07005 */
6
7/*
8 * head.S contains the 32-bit startup code.
9 *
10 * NOTE!!! Startup happens at absolute address 0x00001000, which is also where
11 * the page directory will exist. The startup code will be overwritten by
12 * the page directory. [According to comments etc elsewhere on a compressed
13 * kernel it will end up at 0x1000 + 1Mb I hope so as I assume this. - AC]
14 *
15 * Page 0 is deliberately kept safe, since System Management Mode code in
16 * laptops may need to access the BIOS data stored there. This is also
17 * useful for future device drivers that access the BIOS via VM86
18 * mode.
19 */
20
21/*
Domen Puncerf4549442005-06-25 14:58:59 -070022 * High loaded stuff by Hans Lermen & Werner Almesberger, Feb. 1996
Linus Torvalds1da177e2005-04-16 15:20:36 -070023 */
24.code32
25.text
26
27#include <linux/linkage.h>
28#include <asm/segment.h>
Jeremy Fitzhardinge0341c142009-02-13 11:14:01 -080029#include <asm/pgtable_types.h>
30#include <asm/page_types.h>
Alexander van Heukelum7c539762008-04-08 12:54:30 +020031#include <asm/boot.h>
Vivek Goyal1ab60e02007-05-02 19:27:07 +020032#include <asm/msr.h>
Cyrill Gorcunove83e31f42008-05-12 15:43:39 +020033#include <asm/processor-flags.h>
Eric W. Biedermanbd531472007-10-26 11:29:04 -060034#include <asm/asm-offsets.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070035
.section ".text.head"
	.code32
/*
 * startup_32 - 32-bit entry point of the compressed kernel.
 *
 * In:   %esi  base of the boot parameter block (BP_loadflags and
 *             BP_scratch are addressed relative to it); it is not
 *             written anywhere in this routine.
 *
 * Register roles established below:
 *   %ebp  load delta = run-time address - link-time address
 *   %ebx  base used to place the boot page tables (pgtable(%ebx));
 *         derived from the address the image will be moved to for
 *         safe in-place decompression
 *
 * Sequence: optionally reload the data segments, find the load delta,
 * switch to the boot stack, check for long mode support, load the boot
 * GDT, enable PAE, build identity page tables covering the first 4G,
 * set EFER.LME, enable paging and far-return into startup_64.
 * This routine does not return.
 */
ENTRY(startup_32)
	cld

	/*
	 * Bit 6 of loadflags is KEEP_SEGMENTS: when the boot loader sets
	 * it we must leave the segment registers alone.
	 */
	testb	$(1<<6), BP_loadflags(%esi)
	jnz	.Ls32_segments_ready

	cli
	movl	$(__KERNEL_DS), %eax
	movl	%eax, %ds
	movl	%eax, %es
	movl	%eax, %ss
.Ls32_segments_ready:

	/*
	 * Work out how far we were loaded from our link address.  On
	 * 32-bit x86 the only way to read the current address is a short
	 * call followed by a pop of the return address.  The 4-byte
	 * scratch field of the boot parameters serves as the one-slot
	 * stack for that call (%esp starts just past it).
	 */
	leal	(BP_scratch+4)(%esi), %esp
	call	.Ls32_got_eip
.Ls32_got_eip:
	popl	%ebp				/* run-time address of the label */
	subl	$.Ls32_got_eip, %ebp		/* minus link-time address = delta */

	/* Switch to the real boot stack, relocated by the load delta. */
	movl	$boot_stack_end, %eax
	addl	%ebp, %eax
	movl	%eax, %esp

	/* A non-zero result from verify_cpu means no long mode: hang. */
	call	verify_cpu
	testl	%eax, %eax
	jnz	no_longmode

	/*
	 * %ebp is where the boot loader put us.  Compute in %ebx the
	 * address the kernel image is moved to temporarily so that
	 * decompression in place is safe.
	 */
#ifdef CONFIG_RELOCATABLE
	/* Round the load address up to the next PMD_PAGE_SIZE boundary. */
	movl	%ebp, %ebx
	addl	$(PMD_PAGE_SIZE -1), %ebx
	andl	$PMD_PAGE_MASK, %ebx
#else
	movl	$CONFIG_PHYSICAL_START, %ebx
#endif

	/* Swap the compressed size for the uncompressed size ... */
	subl	input_len(%ebp), %ebx
	movl	output_len(%ebp), %eax
	addl	%eax, %ebx
	/* ... add 8 bytes per 32K block (output_len >> 12) ... */
	shrl	$12, %eax
	addl	%eax, %ebx
	/* ... plus 32K + 18 bytes of slack, rounded up to a 4K boundary. */
	addl	$(32768 + 18 + 4095), %ebx
	andl	$~4095, %ebx

/*
 * Prepare for entering 64 bit mode
 */

	/*
	 * Load the new GDT holding the 64-bit segments.  The base field
	 * at gdt+2 is patched with the run-time address of the table
	 * before lgdt reads the limit/base pair stored at gdt.
	 */
	leal	gdt(%ebp), %eax
	movl	%eax, gdt+2(%ebp)
	lgdt	gdt(%ebp)

	/* Enable PAE: %cr4 is loaded with exactly X86_CR4_PAE. */
	movl	$(X86_CR4_PAE), %eax
	movl	%eax, %cr4

	/*
	 * Build the early 4G boot page table: six 4K pages starting at
	 * pgtable(%ebx) -- one level-4 table, one level-3 table and four
	 * level-2 tables.
	 */

	/* Zero all six pages (counted in 32-bit words). */
	leal	pgtable(%ebx), %edi
	xorl	%eax, %eax
	movl	$((4096*6)/4), %ecx
	rep	stosl

	/*
	 * Level 4: entry 0 points at the level-3 table in the next page.
	 * The low bits 0x007 are the entry flags (Present | Writable |
	 * User in the x86 paging format).
	 */
	leal	pgtable + 0(%ebx), %edi
	leal	0x1007 (%edi), %eax
	movl	%eax, 0(%edi)

	/* Level 3: four entries, one per level-2 table (4K apart). */
	leal	pgtable + 0x1000(%ebx), %edi
	leal	0x1007(%edi), %eax
	movl	$4, %ecx
.Ls32_fill_level3:
	movl	%eax, 0x00(%edi)
	addl	$0x00001000, %eax		/* next level-2 table */
	addl	$8, %edi			/* next 8-byte entry */
	decl	%ecx
	jnz	.Ls32_fill_level3

	/*
	 * Level 2: 2048 entries, each mapping 2M starting at physical
	 * address 0, i.e. an identity map of 4G.  Flags 0x183 are
	 * Present | Writable | PageSize(2M) | Global in the x86 paging
	 * format.
	 */
	leal	pgtable + 0x2000(%ebx), %edi
	movl	$0x00000183, %eax
	movl	$2048, %ecx
.Ls32_fill_level2:
	movl	%eax, 0(%edi)
	addl	$0x00200000, %eax		/* next 2M frame */
	addl	$8, %edi			/* next 8-byte entry */
	decl	%ecx
	jnz	.Ls32_fill_level2

	/* Point %cr3 at the level-4 table. */
	leal	pgtable(%ebx), %eax
	movl	%eax, %cr3

	/* Set the LME bit in EFER (Extended Feature Enable Register). */
	movl	$MSR_EFER, %ecx
	rdmsr
	btsl	$_EFER_LME, %eax
	wrmsr

	/*
	 * Set up the jump to 64-bit mode.
	 *
	 * Once paging is switched on we are in long mode, but still in
	 * 32-bit compatibility mode: EFER.LME = 1, CS.L = 0, CS.D = 1
	 * (and in turn EFER.LMA = 1).  To reach 64-bit mode we must load
	 * __KERNEL_CS from the new GDT, which has CS.L = 1.  Selector and
	 * target address are pushed on our mini stack so that lret can be
	 * used to perform that far jump.
	 */
	pushl	$__KERNEL_CS
	leal	startup_64(%ebp), %eax
	pushl	%eax

	/* Enable paging and protected mode, which activates long mode. */
	movl	$(X86_CR0_PG | X86_CR0_PE), %eax
	movl	%eax, %cr0

	/* Far return: leaves compatibility mode for startup_64. */
	lret
ENDPROC(startup_32)
Vivek Goyal1ab60e02007-05-02 19:27:07 +0200178
no_longmode:
	/*
	 * Reached from startup_32 when verify_cpu reports failure: this
	 * is not an x86-64 CPU, so halt forever.  The jump re-enters hlt
	 * whenever the CPU wakes up again.
	 */
	hlt
	jmp	no_longmode
184
Thomas Gleixner250c2272007-10-11 11:17:24 +0200185#include "../../kernel/verify_cpu_64.S"
Vivek Goyala4831e02007-05-02 19:27:08 +0200186
/*
 * startup_64 has to live at a predictable address so that it can be
 * exported in an ELF header; hence the fixed .org below.  Boot loaders
 * should read the address from the ELF header rather than hard-code
 * it, as it may change in the future.
 */
	.code64
	.org 0x200
/*
 * startup_64 - 64-bit entry point of the compressed kernel.
 *
 * Reached either through the lret at the end of startup_32 or directly
 * from a 64-bit boot loader.  In the latter case we rely on the loader
 * having provided an identity-mapped page table that covers our whole
 * text+data+bss and hopefully all of memory.
 *
 * Register roles established below:
 *   %rbp  address the decompressed kernel will start at
 *   %rbx  address the compressed image is copied to before decompression
 * %rsi is not written in this routine.
 *
 * Ends by jumping to `relocated' inside the copied image.
 */
ENTRY(startup_64)

	/* Null all data segment selectors and the LDT. */
	xorl	%eax, %eax
	movl	%eax, %ds
	movl	%eax, %es
	movl	%eax, %ss
	movl	%eax, %fs
	movl	%eax, %gs
	lldt	%ax
	/*
	 * Load the task register with selector 0x20.
	 * NOTE(review): 0x20 is the offset of the TS descriptor in this
	 * file's gdt; when entered directly from a 64-bit loader the GDT
	 * in effect is the loader's -- confirm the selector is valid there.
	 */
	movl	$0x20, %eax
	ltr	%ax

	/*
	 * Compute the decompressed kernel start address into %rbp.
	 *
	 * For a relocatable kernel this is the load address rounded up to
	 * a PMD_PAGE_SIZE (2M) boundary; otherwise the kernel is
	 * decompressed to and run from CONFIG_PHYSICAL_START.
	 */
#ifdef CONFIG_RELOCATABLE
	leaq	startup_32(%rip) /* - $startup_32 */, %rbp
	addq	$(PMD_PAGE_SIZE - 1), %rbp
	andq	$PMD_PAGE_MASK, %rbp
#else
	movq	$CONFIG_PHYSICAL_START, %rbp
#endif
	/* %rbx starts from the same address and is adjusted below. */
	movq	%rbp, %rbx

	/* Swap the compressed size for the uncompressed size ... */
	movl	input_len(%rip), %eax
	subq	%rax, %rbx
	movl	output_len(%rip), %eax
	addq	%rax, %rbx
	/* ... add 8 bytes per 32K block (output_len >> 12) ... */
	shrq	$12, %rax
	addq	%rax, %rbx
	/* ... plus 32K + 18 bytes of slack, rounded up to a 4K boundary. */
	addq	$(32768 + 18 + 4095), %rbx
	andq	$~4095, %rbx

	/*
	 * Copy the compressed kernel to the end of our buffer, where
	 * decompression in place becomes safe.  The copy runs backwards,
	 * 8 bytes at a time, from the _end_before_pgt offset down to
	 * offset 0:
	 *   %r8  source cursor, %r9  destination cursor,
	 *   %rcx bytes remaining.
	 * The loop exits only when %rcx reaches exactly zero, so
	 * _end_before_pgt has to be a multiple of 8 -- presumably ensured
	 * by the linker script; verify if the layout changes.
	 */
	leaq	_end_before_pgt(%rip), %r8
	leaq	_end_before_pgt(%rbx), %r9
	movq	$_end_before_pgt /* - $startup_32 */, %rcx
.Ls64_copy_qword:
	subq	$8, %r8
	subq	$8, %r9
	movq	0(%r8), %rax
	movq	%rax, 0(%r9)
	subq	$8, %rcx
	jnz	.Ls64_copy_qword

	/* Continue in the copy we just made. */
	leaq	relocated(%rbx), %rax
	jmp	*%rax
262
.section ".text"
/*
 * relocated - runs from the copy of the image made by startup_64.
 *
 * In:   %rbx  base address of the copied image
 *       %rbp  address to decompress the kernel to
 *       %rsi  real mode argument, handed on to the kernel
 *
 * Clears the range _edata .. _end_before_pgt, switches to the boot
 * stack, zeroes EFLAGS, calls decompress_kernel and finally jumps to
 * the decompressed kernel at %rbp with %rsi restored.  Never returns.
 */
relocated:

	/*
	 * Clear BSS: byte-wise zero fill of
	 * [_edata, _end_before_pgt) within the copied image.
	 */
	cld
	xorl	%eax, %eax			/* fill value 0 (clears all of %rax) */
	leaq	_edata(%rbx), %rdi		/* start of the range */
	leaq	_end_before_pgt(%rbx), %rcx
	subq	%rdi, %rcx			/* length in bytes */
	rep	stosb

	/* Set up the stack. */
	leaq	boot_stack_end(%rip), %rsp

	/* Zero EFLAGS; needs the stack, so only after %rsp is valid. */
	pushq	$0
	popfq

	/*
	 * Do the decompression.  Arguments for decompress_kernel:
	 *   %rdi  real mode address
	 *   %rsi  malloc area for uncompression (boot_heap)
	 *   %rdx  input_data
	 *   %rcx  input_len (32-bit value, zero-extended)
	 *   %r8   output address
	 * The real mode argument is kept on the stack across the call.
	 */
	pushq	%rsi
	movq	%rsi, %rdi
	leaq	boot_heap(%rip), %rsi
	leaq	input_data(%rip), %rdx
	movl	input_len(%rip), %eax
	movq	%rax, %rcx
	movq	%rbp, %r8
	call	decompress_kernel
	popq	%rsi

	/* Jump to the decompressed kernel. */
	jmp	*%rbp
Linus Torvalds1da177e2005-04-16 15:20:36 -0700301
/*
 * Boot GDT, loaded by `lgdt gdt(%ebp)' in startup_32.
 *
 * The first 8 bytes double as the lgdt operand (16-bit limit, 32-bit
 * base, 16-bit pad) and as descriptor slot 0, which the CPU never
 * dereferences.  The base is only a link-time value here; startup_32
 * overwrites gdt+2 with the run-time address before executing lgdt.
 *
 * Layout by byte offset (= selector value):
 *   0x00  limit/base pseudo-descriptor (slot 0)
 *   0x08  all-zero descriptor
 *   0x10  64-bit code segment (L bit set), labelled __KERNEL_CS
 *   0x18  flat data segment, labelled __KERNEL_DS
 *   0x20  TS descriptor, 16 bytes (loaded with `ltr' using 0x20)
 * The offsets 0x10/0x18 presumably match the __KERNEL_CS/__KERNEL_DS
 * selectors from <asm/segment.h> -- confirm if either changes.
 *
 * The GDTR limit is the offset of the LAST valid byte of the table,
 * so it must be the table size minus one, not the size itself.
 */
	.data
gdt:
	.word	gdt_end - gdt - 1		/* limit = size - 1 */
	.long	gdt				/* base, patched at run time */
	.word	0				/* pad slot 0 out to 8 bytes */
	.quad	0x0000000000000000	/* NULL descriptor */
	.quad	0x00af9a000000ffff	/* __KERNEL_CS */
	.quad	0x00cf92000000ffff	/* __KERNEL_DS */
	.quad	0x0080890000000000	/* TS descriptor */
	.quad	0x0000000000000000	/* TS continued */
gdt_end:
Alexander van Heukelum7c539762008-04-08 12:54:30 +0200313
.bss
/*
 * Working memory for the decompressor, zero-filled storage in .bss:
 *   boot_heap       BOOT_HEAP_SIZE bytes, handed to decompress_kernel
 *                   as its malloc area
 *   boot_stack      BOOT_STACK_SIZE bytes; the stack grows down from
 *                   boot_stack_end, which marks the first byte past it
 */
.balign 4
boot_heap:
	.skip	BOOT_HEAP_SIZE
boot_stack:
	.skip	BOOT_STACK_SIZE
boot_stack_end: