2005-04-16 15:20:36 -07:00
/*
2007-10-12 21:10:53 -04:00
* prepare to run common code
2005-04-16 15:20:36 -07:00
*
 *  Copyright (C) 2000 Andrea Arcangeli <andrea@suse.de> SuSE
*/
# include <linux/init.h>
# include <linux/linkage.h>
# include <linux/types.h>
# include <linux/kernel.h>
# include <linux/string.h>
# include <linux/percpu.h>
2008-01-30 13:30:19 +01:00
# include <linux/start_kernel.h>
2008-03-28 10:49:44 +08:00
# include <linux/io.h>
2005-04-16 15:20:36 -07:00
# include <asm/processor.h>
# include <asm/proto.h>
# include <asm/smp.h>
# include <asm/setup.h>
# include <asm/desc.h>
2005-11-05 17:25:53 +01:00
# include <asm/pgtable.h>
2007-05-02 19:27:07 +02:00
# include <asm/tlbflush.h>
2005-11-05 17:25:53 +01:00
# include <asm/sections.h>
2008-01-30 13:30:17 +01:00
# include <asm/kdebug.h>
2008-01-30 13:33:17 +01:00
# include <asm/e820.h>
2008-12-08 00:50:22 +01:00
# include <asm/trampoline.h>
2009-08-29 15:03:59 +02:00
# include <asm/bios_ebda.h>
2005-04-16 15:20:36 -07:00
2007-05-02 19:27:07 +02:00
/*
 * Drop the kernel page-table entry that covers virtual address 0 and
 * flush the TLB afterwards.  The caller uses this so that NULL pointer
 * dereferences fault instead of hitting the identity mapping.
 */
static void __init zap_identity_mappings(void)
{
	pgd_clear(pgd_offset_k(0UL));
	__flush_tlb_all();
}
2005-04-16 15:20:36 -07:00
/*
 * Zero the range [__bss_start, __bss_stop).
 *
 * Do not add a printk in here: printk relies on the PDA, which is not
 * initialized yet.
 */
static void __init clear_bss(void)
{
	unsigned long bss_bytes;

	bss_bytes = (unsigned long)__bss_stop - (unsigned long)__bss_start;
	memset(__bss_start, 0, bss_bytes);
}
/*
 * Copy the boot parameter block into boot_params and, when the header
 * carries a command line pointer, copy COMMAND_LINE_SIZE bytes from it
 * into boot_command_line.
 *
 * @real_mode_data: address the boot parameters are read from; the
 *                  caller in this file passes an already __va()-converted
 *                  pointer.
 */
static void __init copy_bootdata(char *real_mode_data)
{
	char *cmdline;

	memcpy(&boot_params, real_mode_data, sizeof(boot_params));

	/* No command line pointer in the header: nothing more to copy. */
	if (!boot_params.hdr.cmd_line_ptr)
		return;

	/* cmd_line_ptr is run through __va() before it is dereferenced. */
	cmdline = __va(boot_params.hdr.cmd_line_ptr);
	memcpy(boot_command_line, cmdline, COMMAND_LINE_SIZE);
}
/*
 * Early C entry point: validate the address-space layout at build time,
 * clear the bss, remove the identity mapping and the over-mapped high
 * alias, install the early exception handlers, then continue in
 * x86_64_start_reservations().
 *
 * @real_mode_data: passed through unchanged to
 *                  x86_64_start_reservations(), which converts it with
 *                  __va() before reading the boot parameters.
 */
void __init x86_64_start_kernel(char *real_mode_data)
{
	int i;

	/*
	 * Build-time sanity checks on the kernel image and module
	 * area mappings. (these are purely build-time and produce no code)
	 */
	BUILD_BUG_ON(MODULES_VADDR < KERNEL_IMAGE_START);
	BUILD_BUG_ON(MODULES_VADDR - KERNEL_IMAGE_START < KERNEL_IMAGE_SIZE);
	BUILD_BUG_ON(MODULES_LEN + KERNEL_IMAGE_SIZE > 2 * PUD_SIZE);
	BUILD_BUG_ON((KERNEL_IMAGE_START & ~PMD_MASK) != 0);
	BUILD_BUG_ON((MODULES_VADDR & ~PMD_MASK) != 0);
	BUILD_BUG_ON(!(MODULES_VADDR > __START_KERNEL));
	BUILD_BUG_ON(!(((MODULES_END - 1) & PGDIR_MASK) ==
				(__START_KERNEL & PGDIR_MASK)));
	BUILD_BUG_ON(__fix_to_virt(__end_of_fixed_addresses) <= MODULES_END);

	/* clear bss before set_intr_gate with early_idt_handler */
	clear_bss();

	/* Make NULL pointers segfault */
	zap_identity_mappings();

	/* Cleanup the over mapped high alias */
	cleanup_highmap();

	/*
	 * Point every exception vector at an early handler.  With
	 * CONFIG_EARLY_PRINTK each vector gets its own entry from
	 * early_idt_handlers[]; otherwise all vectors share one handler.
	 */
	for (i = 0; i < NUM_EXCEPTION_VECTORS; i++) {
#ifdef CONFIG_EARLY_PRINTK
		set_intr_gate(i, &early_idt_handlers[i]);
#else
		set_intr_gate(i, early_idt_handler);
#endif
	}
	load_idt((const struct desc_ptr *)&idt_descr);

	/* Sign of life, printed only when console_loglevel is exactly 10. */
	if (console_loglevel == 10)
		early_printk("Kernel alive\n");

	x86_64_start_reservations(real_mode_data);
}
/*
 * Copy the boot data, early-reserve the memory ranges that must survive
 * (kernel text/data/bss, the initrd if one was supplied, the EBDA
 * region), then hand over to start_kernel().
 *
 * @real_mode_data: address of the boot parameter block; it is converted
 *                  with __va() before being read.
 */
void __init x86_64_start_reservations(char *real_mode_data)
{
	copy_bootdata(__va(real_mode_data));

	/*
	 * Reserve text, data and bss only up to __bss_stop.  The brk area
	 * (__brk_base to __brk_limit) lies beyond that; brk-allocated data
	 * is reserved separately, just before the kernel pagetable is
	 * built, and any unused brk memory ends up in the general kernel
	 * memory pool.
	 */
	reserve_early(__pa_symbol(&_text), __pa_symbol(&__bss_stop), "TEXT DATA BSS");

#ifdef CONFIG_BLK_DEV_INITRD
	/* Reserve INITRD */
	if (boot_params.hdr.type_of_loader && boot_params.hdr.ramdisk_image) {
		/*
		 * Assume only end is not page aligned.
		 *
		 * The end is rounded up to a page boundary so the ramdisk's
		 * last page is never shared with another user: when the
		 * initrd pages are later released by free_init_pages(), a
		 * shared partial page would be freed as a whole page and
		 * could corrupt the other user's data.
		 */
		unsigned long ramdisk_image = boot_params.hdr.ramdisk_image;
		unsigned long ramdisk_size  = boot_params.hdr.ramdisk_size;
		unsigned long ramdisk_end   = PAGE_ALIGN(ramdisk_image + ramdisk_size);

		reserve_early(ramdisk_image, ramdisk_end, "RAMDISK");
	}
#endif

	reserve_ebda_region();

	/*
	 * At this point everything still needed from the boot loader
	 * or BIOS or kernel text should be early reserved or marked not
	 * RAM in e820. All other memory is free game.
	 */

	start_kernel();
}