mirror of https://github.com/ipxe/ipxe.git
612 lines
15 KiB
ArmAsm
612 lines
15 KiB
ArmAsm
/*
|
|
Copyright (C) 2000, Entity Cyber, Inc.
|
|
|
|
Authors: Gary Byers (gb@thinguin.org)
|
|
Marty Connor (mdc@thinguin.org)
|
|
Eric Biederman (ebiederman@lnxi.com)
|
|
|
|
This code also derives a lot from arch/i386/boot/setup.S in
|
|
the linux kernel.
|
|
|
|
This software may be used and distributed according to the terms
|
|
of the GNU Public License (GPL), incorporated herein by reference.
|
|
|
|
Description:
|
|
|
|
This is just a little bit of code and data that can get prepended
|
|
to an Etherboot ROM image in order to allow LILO to load the
|
|
result as if it were a Linux kernel image.
|
|
|
|
A real Linux kernel image consists of a one-sector boot loader
|
|
(to load the image from a floppy disk), followed a few sectors
|
|
of setup code, followed by the kernel code itself. There's
|
|
a table in the first sector (starting at offset 497) that indicates
|
|
how many sectors of setup code follow the first sector and which
|
|
contains some other parameters that aren't interesting in this
|
|
case.
|
|
|
|
When LILO loads the sectors that comprise a kernel image, it doesn't
|
|
execute the code in the first sector (since that code would try to
|
|
load the image from a floppy disk.) The code in the first sector
|
|
below doesn't expect to get executed (and prints an error message
|
|
if it ever -is- executed.) LILO's only interested in knowing the
|
|
number of setup sectors advertised in the table (at offset 497 in
|
|
the first sector.)
|
|
|
|
Etherboot doesn't require much in the way of setup code.
|
|
Historically, the Linux kernel required at least 4 sectors of
|
|
setup code. Current versions of LILO look at the byte at
|
|
offset 497 in the first sector to indicate how many sectors
|
|
of setup code are contained in the image.
|
|
|
|
The setup code that is present here does a lot of things
|
|
exactly the way the linux kernel does them instead of in
|
|
ways more typical of etherboot. Generally this is so
|
|
the code can be strongly compatible with the linux kernel.
|
|
In addition the general etherboot technique of enabling the a20
|
|
after we switch into protected mode does not work if etherboot
|
|
is being loaded at 1MB.
|
|
*/
|
|
|
|
.equ CR0_PE,1
|
|
|
|
#ifdef GAS291
|
|
#define DATA32 data32;
|
|
#define ADDR32 addr32;
|
|
#define LJMPI(x) ljmp x
|
|
#else
|
|
#define DATA32 data32
|
|
#define ADDR32 addr32
|
|
/* newer GAS295 require #define LJMPI(x) ljmp *x */
|
|
#define LJMPI(x) ljmp x
|
|
#endif
|
|
|
|
/* Simple and small GDT entries for booting only */
|
|
#define GDT_ENTRY_BOOT_CS 2
|
|
#define GDT_ENTRY_BOOT_DS (GDT_ENTRY_BOOT_CS + 1)
|
|
#define __BOOT_CS (GDT_ENTRY_BOOT_CS * 8)
|
|
#define __BOOT_DS (GDT_ENTRY_BOOT_DS * 8)
|
|
|
|
|
|
#define SETUPSECS 4 /* Minimal nr of setup-sectors */
|
|
#define PREFIXSIZE ((SETUPSECS+1)*512)
|
|
#define PREFIXPGH (PREFIXSIZE / 16 )
|
|
#define BOOTSEG 0x07C0 /* original address of boot-sector */
|
|
#define INITSEG 0x9000 /* we move boot here - out of the way */
|
|
#define SETUPSEG 0x9020 /* setup starts here */
|
|
#define SYSSEG 0x1000 /* system loaded at 0x10000 (65536). */
|
|
|
|
#define DELTA_INITSEG (SETUPSEG - INITSEG) /* 0x0020 */
|
|
|
|
/* Signature words to ensure LILO loaded us right */
|
|
#define SIG1 0xAA55
|
|
#define SIG2 0x5A5A
|
|
|
|
.text
|
|
.code16
|
|
.arch i386
|
|
.org 0
|
|
.section ".prefix", "ax", @progbits
|
|
_prefix:
|
|
|
|
/*
|
|
This is a minimal boot sector. If anyone tries to execute it (e.g., if
|
|
a .lilo file is dd'ed to a floppy), print an error message.
|
|
*/
|
|
|
|
bootsector:
|
|
jmp $BOOTSEG, $go - _prefix /* reload cs:ip to match relocation addr */
|
|
go:
|
|
movw $0x2000, %di /* 0x2000 is arbitrary value >= length
|
|
of bootsect + room for stack */
|
|
|
|
movw $BOOTSEG, %ax
|
|
movw %ax,%ds
|
|
movw %ax,%es
|
|
|
|
cli
|
|
movw %ax, %ss /* put stack at BOOTSEG:0x2000. */
|
|
movw %di,%sp
|
|
sti
|
|
|
|
movw $why_end-why, %cx
|
|
movw $why - _prefix, %si
|
|
|
|
movw $0x0007, %bx /* page 0, attribute 7 (normal) */
|
|
movb $0x0e, %ah /* write char, tty mode */
|
|
prloop:
|
|
lodsb
|
|
int $0x10
|
|
loop prloop
|
|
freeze: jmp freeze
|
|
|
|
why: .ascii "This image cannot be loaded from a floppy disk.\r\n"
|
|
why_end:
|
|
|
|
|
|
.org 497
|
|
setup_sects:
|
|
.byte SETUPSECS
|
|
root_flags:
|
|
.word 0
|
|
syssize:
|
|
.word _verbatim_size_pgh - PREFIXPGH
|
|
swap_dev:
|
|
.word 0
|
|
ram_size:
|
|
.word 0
|
|
vid_mode:
|
|
.word 0
|
|
root_dev:
|
|
.word 0
|
|
boot_flag:
|
|
.word 0xAA55
|
|
|
|
/*
|
|
We're now at the beginning of the second sector of the image -
|
|
where the setup code goes.
|
|
|
|
We don't need to do too much setup for Etherboot.
|
|
|
|
This code gets loaded at SETUPSEG:0. It wants to start
|
|
executing the Etherboot image that's loaded at SYSSEG:0 and
|
|
whose entry point is SYSSEG:0.
|
|
*/
|
|
setup_code:
|
|
jmp trampoline
|
|
# This is the setup header, and it must start at %cs:2 (old 0x9020:2)
|
|
|
|
.ascii "HdrS" # header signature
|
|
.word 0x0203 # header version number (>= 0x0105)
|
|
# or else old loadlin-1.5 will fail)
|
|
realmode_swtch: .word 0, 0 # default_switch, SETUPSEG
|
|
start_sys_seg: .word SYSSEG # low load segment (obsolete)
|
|
.word kernel_version - setup_code
|
|
# pointing to kernel version string
|
|
# above section of header is compatible
|
|
# with loadlin-1.5 (header v1.5). Don't
|
|
# change it.
|
|
|
|
type_of_loader: .byte 0 # = 0, old one (LILO, Loadlin,
|
|
# Bootlin, SYSLX, bootsect...)
|
|
# See Documentation/i386/boot.txt for
|
|
# assigned ids
|
|
|
|
# flags, unused bits must be zero (RFU) bit within loadflags
|
|
loadflags:
|
|
LOADED_HIGH = 1 # If set, the kernel is loaded high
|
|
CAN_USE_HEAP = 0x80 # If set, the loader also has set
|
|
# heap_end_ptr to tell how much
|
|
# space behind setup.S can be used for
|
|
# heap purposes.
|
|
# Only the loader knows what is free
|
|
.byte LOADED_HIGH
|
|
|
|
setup_move_size: .word 0x8000 # size to move, when setup is not
|
|
# loaded at 0x90000. We will move setup
|
|
# to 0x90000 then just before jumping
|
|
# into the kernel. However, only the
|
|
# loader knows how much data behind
|
|
# us also needs to be loaded.
|
|
|
|
code32_start: # here loaders can put a different
|
|
# start address for 32-bit code.
|
|
.long 0x100000 # 0x100000 = default for big kernel
|
|
|
|
ramdisk_image: .long 0 # address of loaded ramdisk image
|
|
# Here the loader puts the 32-bit
|
|
# address where it loaded the image.
|
|
# This only will be read by the kernel.
|
|
|
|
ramdisk_size: .long 0 # its size in bytes
|
|
|
|
bootsect_kludge:
|
|
.long 0 # obsolete
|
|
|
|
heap_end_ptr: .word 0 # (Header version 0x0201 or later)
|
|
# space from here (exclusive) down to
|
|
# end of setup code can be used by setup
|
|
# for local heap purposes.
|
|
|
|
pad1: .word 0
|
|
cmd_line_ptr: .long 0 # (Header version 0x0202 or later)
|
|
# If nonzero, a 32-bit pointer
|
|
# to the kernel command line.
|
|
# The command line should be
|
|
# located between the start of
|
|
# setup and the end of low
|
|
# memory (0xa0000), or it may
|
|
# get overwritten before it
|
|
# gets read. If this field is
|
|
# used, there is no longer
|
|
# anything magical about the
|
|
# 0x90000 segment; the setup
|
|
# can be located anywhere in
|
|
# low memory 0x10000 or higher.
|
|
|
|
ramdisk_max: .long 0 # (Header version 0x0203 or later)
|
|
# The highest safe address for
|
|
# the contents of an initrd
|
|
|
|
trampoline: call start_of_setup
|
|
trampoline_end:
|
|
.space 1024
|
|
# End of setup header #####################################################
|
|
|
|
start_of_setup:
|
|
# Set %ds = %cs, we know that SETUPSEG = %cs at this point
|
|
movw %cs, %ax # aka SETUPSEG
|
|
movw %ax, %ds
|
|
# Check signature at end of setup
|
|
cmpw $SIG1, (setup_sig1 - setup_code)
|
|
jne bad_sig
|
|
|
|
cmpw $SIG2, (setup_sig2 - setup_code)
|
|
jne bad_sig
|
|
|
|
jmp good_sig1
|
|
|
|
# Routine to print asciiz string at ds:si
|
|
prtstr:
|
|
lodsb
|
|
andb %al, %al
|
|
jz fin
|
|
|
|
call prtchr
|
|
jmp prtstr
|
|
|
|
fin: ret
|
|
|
|
# Part of above routine, this one just prints ascii al
|
|
prtchr: pushw %ax
|
|
pushw %cx
|
|
movw $7,%bx
|
|
movw $0x01, %cx
|
|
movb $0x0e, %ah
|
|
int $0x10
|
|
popw %cx
|
|
popw %ax
|
|
ret
|
|
|
|
no_sig_mess: .string "No setup signature found ..."
|
|
|
|
good_sig1:
|
|
jmp good_sig
|
|
|
|
# We now have to find the rest of the setup code/data
|
|
bad_sig:
|
|
movw %cs, %ax # SETUPSEG
|
|
subw $DELTA_INITSEG, %ax # INITSEG
|
|
movw %ax, %ds
|
|
xorb %bh, %bh
|
|
movb (497), %bl # get setup sect from bootsect
|
|
subw $4, %bx # LILO loads 4 sectors of setup
|
|
shlw $8, %bx # convert to words (1sect=2^8 words)
|
|
movw %bx, %cx
|
|
shrw $3, %bx # convert to segment
|
|
addw $SYSSEG, %bx
|
|
movw %bx, %cs:(start_sys_seg - setup_code)
|
|
# Move rest of setup code/data to here
|
|
movw $2048, %di # four sectors loaded by LILO
|
|
subw %si, %si
|
|
pushw %cs
|
|
popw %es
|
|
movw $SYSSEG, %ax
|
|
movw %ax, %ds
|
|
rep
|
|
movsw
|
|
movw %cs, %ax # aka SETUPSEG
|
|
movw %ax, %ds
|
|
cmpw $SIG1, (setup_sig1 - setup_code)
|
|
jne no_sig
|
|
|
|
cmpw $SIG2, (setup_sig2 - setup_code)
|
|
jne no_sig
|
|
|
|
jmp good_sig
|
|
|
|
no_sig:
|
|
lea (no_sig_mess - setup_code), %si
|
|
call prtstr
|
|
|
|
no_sig_loop:
|
|
hlt
|
|
jmp no_sig_loop
|
|
|
|
good_sig:
|
|
cmpw $0, %cs:(realmode_swtch - setup_code)
|
|
jz rmodeswtch_normal
|
|
|
|
lcall *%cs:(realmode_swtch - setup_code)
|
|
jmp rmodeswtch_end
|
|
|
|
rmodeswtch_normal:
|
|
pushw %cs
|
|
call default_switch
|
|
|
|
rmodeswtch_end:
|
|
# we get the code32 start address and modify the below 'jmpi'
|
|
# (loader may have changed it)
|
|
movl %cs:(code32_start - setup_code), %eax
|
|
movl %eax, %cs:(code32 - setup_code)
|
|
|
|
# then we load the segment descriptors
|
|
movw %cs, %ax # aka SETUPSEG
|
|
movw %ax, %ds
|
|
|
|
#
|
|
# Enable A20. This is at the very best an annoying procedure.
|
|
# A20 code ported from SYSLINUX 1.52-1.63 by H. Peter Anvin.
|
|
#
|
|
|
|
A20_TEST_LOOPS = 32 # Iterations per wait
|
|
A20_ENABLE_LOOPS = 255 # Total loops to try
|
|
|
|
a20_try_loop:
|
|
|
|
# First, see if we are on a system with no A20 gate.
|
|
a20_none:
|
|
call a20_test
|
|
jnz a20_done
|
|
|
|
# Next, try the BIOS (INT 0x15, AX=0x2401)
|
|
a20_bios:
|
|
movw $0x2401, %ax
|
|
pushfl # Be paranoid about flags
|
|
int $0x15
|
|
popfl
|
|
|
|
call a20_test
|
|
jnz a20_done
|
|
|
|
# Try enabling A20 through the keyboard controller
|
|
a20_kbc:
|
|
call empty_8042
|
|
|
|
call a20_test # Just in case the BIOS worked
|
|
jnz a20_done # but had a delayed reaction.
|
|
|
|
movb $0xD1, %al # command write
|
|
outb %al, $0x64
|
|
call empty_8042
|
|
|
|
movb $0xDF, %al # A20 on
|
|
outb %al, $0x60
|
|
call empty_8042
|
|
|
|
# Wait until a20 really *is* enabled; it can take a fair amount of
|
|
# time on certain systems; Toshiba Tecras are known to have this
|
|
# problem.
|
|
a20_kbc_wait:
|
|
xorw %cx, %cx
|
|
a20_kbc_wait_loop:
|
|
call a20_test
|
|
jnz a20_done
|
|
loop a20_kbc_wait_loop
|
|
|
|
# Final attempt: use "configuration port A"
|
|
a20_fast:
|
|
inb $0x92, %al # Configuration Port A
|
|
orb $0x02, %al # "fast A20" version
|
|
andb $0xFE, %al # don't accidentally reset
|
|
outb %al, $0x92
|
|
|
|
# Wait for configuration port A to take effect
|
|
a20_fast_wait:
|
|
xorw %cx, %cx
|
|
a20_fast_wait_loop:
|
|
call a20_test
|
|
jnz a20_done
|
|
loop a20_fast_wait_loop
|
|
|
|
# A20 is still not responding. Try frobbing it again.
|
|
#
|
|
decb (a20_tries - setup_code)
|
|
jnz a20_try_loop
|
|
|
|
movw $(a20_err_msg - setup_code), %si
|
|
call prtstr
|
|
|
|
a20_die:
|
|
hlt
|
|
jmp a20_die
|
|
|
|
a20_tries:
|
|
.byte A20_ENABLE_LOOPS
|
|
|
|
a20_err_msg:
|
|
.ascii "linux: fatal error: A20 gate not responding!"
|
|
.byte 13, 10, 0
|
|
|
|
# If we get here, all is good
|
|
a20_done:
|
|
# Leave the idt alone
|
|
|
|
# set up gdt
|
|
xorl %eax, %eax # Compute gdt_base
|
|
movw %ds, %ax # (Convert %ds:gdt to a linear ptr)
|
|
shll $4, %eax
|
|
addl $(bImage_gdt - setup_code), %eax
|
|
movl %eax, (bImage_gdt_48+2 - setup_code)
|
|
DATA32 lgdt %ds:(bImage_gdt_48 - setup_code) # load gdt with whatever is
|
|
# appropriate
|
|
|
|
# Switch to protected mode
|
|
movl %cr0, %eax
|
|
orb $CR0_PE, %al
|
|
movl %eax, %cr0
|
|
|
|
DATA32 ljmp %ds:(code32 - setup_code)
|
|
code32:
|
|
.long 0x100000
|
|
.word __BOOT_CS, 0
|
|
|
|
# Here's a bunch of information about your current kernel..
|
|
kernel_version: .ascii "Etherboot "
|
|
.ascii VERSION
|
|
.byte 0
|
|
|
|
# This is the default real mode switch routine.
|
|
# to be called just before protected mode transition
|
|
default_switch:
|
|
cli # no interrupts allowed !
|
|
movb $0x80, %al # disable NMI for bootup
|
|
# sequence
|
|
outb %al, $0x70
|
|
lret
|
|
|
|
# This routine tests whether or not A20 is enabled. If so, it
|
|
# exits with zf = 0.
|
|
#
|
|
# The memory address used, 0x200, is the int $0x80 vector, which
|
|
# should be safe.
|
|
|
|
A20_TEST_ADDR = 4*0x80
|
|
|
|
a20_test:
|
|
pushw %cx
|
|
pushw %ax
|
|
xorw %cx, %cx
|
|
movw %cx, %fs # Low memory
|
|
decw %cx
|
|
movw %cx, %gs # High memory area
|
|
movw $A20_TEST_LOOPS, %cx
|
|
movw %fs:(A20_TEST_ADDR), %ax
|
|
pushw %ax
|
|
a20_test_wait:
|
|
incw %ax
|
|
movw %ax, %fs:(A20_TEST_ADDR)
|
|
call delay # Serialize and make delay constant
|
|
cmpw %gs:(A20_TEST_ADDR+0x10), %ax
|
|
loope a20_test_wait
|
|
|
|
popw %fs:(A20_TEST_ADDR)
|
|
popw %ax
|
|
popw %cx
|
|
ret
|
|
|
|
|
|
# This routine checks that the keyboard command queue is empty
|
|
# (after emptying the output buffers)
|
|
#
|
|
# Some machines have delusions that the keyboard buffer is always full
|
|
# with no keyboard attached...
|
|
#
|
|
# If there is no keyboard controller, we will usually get 0xff
|
|
# to all the reads. With each IO taking a microsecond and
|
|
# a timeout of 100,000 iterations, this can take about half a
|
|
# second ("delay" == outb to port 0x80). That should be ok,
|
|
# and should also be plenty of time for a real keyboard controller
|
|
# to empty.
|
|
#
|
|
|
|
empty_8042:
|
|
pushl %ecx
|
|
movl $100000, %ecx
|
|
|
|
empty_8042_loop:
|
|
decl %ecx
|
|
jz empty_8042_end_loop
|
|
|
|
call delay
|
|
|
|
inb $0x64, %al # 8042 status port
|
|
testb $1, %al # output buffer?
|
|
jz no_output
|
|
|
|
call delay
|
|
inb $0x60, %al # read it
|
|
jmp empty_8042_loop
|
|
|
|
no_output:
|
|
testb $2, %al # is input buffer full?
|
|
jnz empty_8042_loop # yes - loop
|
|
empty_8042_end_loop:
|
|
popl %ecx
|
|
|
|
|
|
# Delay is needed after doing I/O
|
|
delay:
|
|
outb %al,$0x80
|
|
ret
|
|
|
|
# Descriptor tables
|
|
#
|
|
# NOTE: The intel manual says gdt should be sixteen bytes aligned for
|
|
# efficiency reasons. However, there are machines which are known not
|
|
# to boot with misaligned GDTs, so alter this at your peril! If you alter
|
|
# GDT_ENTRY_BOOT_CS (in asm/segment.h) remember to leave at least two
|
|
# empty GDT entries (one for NULL and one reserved).
|
|
#
|
|
# NOTE: On some CPUs, the GDT must be 8 byte aligned. This is
|
|
# true for the Voyager Quad CPU card which will not boot without
|
|
# This directive. 16 byte aligment is recommended by intel.
|
|
#
|
|
.balign 16
|
|
bImage_gdt:
|
|
.fill GDT_ENTRY_BOOT_CS,8,0
|
|
|
|
.word 0xFFFF # 4Gb - (0x100000*0x1000 = 4Gb)
|
|
.word 0 # base address = 0
|
|
.word 0x9A00 # code read/exec
|
|
.word 0x00CF # granularity = 4096, 386
|
|
# (+5th nibble of limit)
|
|
|
|
.word 0xFFFF # 4Gb - (0x100000*0x1000 = 4Gb)
|
|
.word 0 # base address = 0
|
|
.word 0x9200 # data read/write
|
|
.word 0x00CF # granularity = 4096, 386
|
|
# (+5th nibble of limit)
|
|
bImage_gdt_end:
|
|
.balign 4
|
|
|
|
.word 0 # alignment byte
|
|
bImage_idt_48:
|
|
.word 0 # idt limit = 0
|
|
.long 0 # idt base = 0L
|
|
|
|
.word 0 # alignment byte
|
|
bImage_gdt_48:
|
|
.word bImage_gdt_end - bImage_gdt - 1 # gdt limit
|
|
.long bImage_gdt_48 - setup_code # gdt base (filled in later)
|
|
|
|
.section ".text16", "ax", @progbits
|
|
prefix_exit:
|
|
int $0x19 /* should try to boot machine */
|
|
prefix_exit_end:
|
|
.previous
|
|
|
|
|
|
.org (PREFIXSIZE - 4)
|
|
# Setup signature -- must be last
|
|
setup_sig1: .word SIG1
|
|
setup_sig2: .word SIG2
|
|
/* Etherboot expects to be contiguous in memory once loaded.
|
|
* The linux bImage protocol does not do this, but since we
|
|
* don't need any information that's left in the prefix, it
|
|
* doesn't matter: we just have to ensure that we make it to _start
|
|
*
|
|
* protected_start will live at 0x100000 and it will be the
|
|
* the first code called as we enter protected mode.
|
|
*/
|
|
.code32
|
|
protected_start:
|
|
/* Load segment registers */
|
|
movw $__BOOT_DS, %ax
|
|
movw %ax, %ss
|
|
movw %ax, %ds
|
|
movw %ax, %es
|
|
movw %ax, %fs
|
|
movw %ax, %gs
|
|
|
|
/* Use the internal etherboot stack */
|
|
movl $(_prefix_stack_end - protected_start + 0x100000), %esp
|
|
|
|
pushl $0 /* No parameters to preserve for exit path */
|
|
pushl $0 /* Use prefix exit path mechanism */
|
|
|
|
jmp _start
|
|
/*
|
|
That's about it.
|
|
*/
|