File: [local] / sys / arch / amd64 / amd64 / locore.S (download)
Revision 1.1.1.1 (vendor branch), Tue Mar 4 16:04:59 2008 UTC (16 years, 6 months ago) by nbrk
Branch: OPENBSD_4_2_BASE, MAIN
CVS Tags: jornada-partial-support-wip, HEAD Changes since 1.1: +0 -0 lines
Import of OpenBSD 4.2 release kernel tree with initial code to support
Jornada 720/728, StrongARM 1110-based handheld PC.
At this point kernel roots on NFS and boots into vfs_mountroot() and traps.
What is supported:
- glass console, Jornada framebuffer (jfb) works in 16bpp direct color mode
(needs some palette tweaks for non black/white/blue colors, i think)
- saic, SA11x0 interrupt controller (needs cleanup)
- sacom, SA11x0 UART (supported only as boot console for now)
- SA11x0 GPIO controller fully supported (but can't handle multiple interrupt
handlers on one gpio pin)
- sassp, SSP port on SA11x0 that attaches spibus
- Jornada microcontroller (jmcu) to control kbd, battery, etc throught
the SPI bus (wskbd attaches on jmcu, but not tested)
- tod functions seem work
- initial code for SA-1111 (chip companion) : this is TODO
Next important steps, i think:
- gpio and intc on sa1111
- pcmcia support for sa11x0 (and sa1111 help logic)
- REAL root on nfs when we have PCMCIA support (we may use any of supported pccard NICs)
- root on wd0! (using already supported PCMCIA-ATA)
|
/* $OpenBSD: locore.S,v 1.22 2007/05/27 08:58:31 art Exp $ */
/* $NetBSD: locore.S,v 1.13 2004/03/25 18:33:17 drochner Exp $ */
/*
* Copyright-o-rama!
*/
/*
* Copyright (c) 2001 Wasabi Systems, Inc.
* All rights reserved.
*
* Written by Frank van der Linden for Wasabi Systems, Inc.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 3. All advertising materials mentioning features or use of this software
* must display the following acknowledgement:
* This product includes software developed for the NetBSD Project by
* Wasabi Systems, Inc.
* 4. The name of Wasabi Systems, Inc. may not be used to endorse
* or promote products derived from this software without specific prior
* written permission.
*
* THIS SOFTWARE IS PROVIDED BY WASABI SYSTEMS, INC. ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
* TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL WASABI SYSTEMS, INC
* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
* POSSIBILITY OF SUCH DAMAGE.
*/
/*-
* Copyright (c) 1998, 2000 The NetBSD Foundation, Inc.
* All rights reserved.
*
* This code is derived from software contributed to The NetBSD Foundation
* by Charles M. Hannum.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 3. All advertising materials mentioning features or use of this software
* must display the following acknowledgement:
* This product includes software developed by the NetBSD
* Foundation, Inc. and its contributors.
* 4. Neither the name of The NetBSD Foundation nor the names of its
* contributors may be used to endorse or promote products derived
* from this software without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
* ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
* TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
* POSSIBILITY OF SUCH DAMAGE.
*/
/*-
* Copyright (c) 1990 The Regents of the University of California.
* All rights reserved.
*
* This code is derived from software contributed to Berkeley by
* William Jolitz.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
* 3. Neither the name of the University nor the names of its contributors
* may be used to endorse or promote products derived from this software
* without specific prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
* ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
* ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
* FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
* DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
* OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
*
* @(#)locore.s 7.3 (Berkeley) 5/13/91
*/
#include "assym.h"
#include "lapic.h"
#include "ioapic.h"
#include "ksyms.h"
#include <sys/errno.h>
#include <sys/syscall.h>
#include <machine/param.h>
#include <machine/segments.h>
#include <machine/specialreg.h>
#include <machine/trap.h>
#include <machine/frameasm.h>
#if NLAPIC > 0
#include <machine/i82489reg.h>
#endif
/*
* override user-land alignment before including asm.h
*/
#define ALIGN_DATA .align 8
#define ALIGN_TEXT .align 16,0x90
#define _ALIGN_TEXT ALIGN_TEXT
#include <machine/asm.h>
#define SET_CURPROC(proc,cpu) \
movq CPUVAR(SELF),cpu ; \
movq proc,CPUVAR(CURPROC) ; \
movq cpu,P_CPU(proc)
#define GET_CURPCB(reg) movq CPUVAR(CURPCB),reg
#define SET_CURPCB(reg) movq reg,CPUVAR(CURPCB)
/* XXX temporary kluge; these should not be here */
/* Get definitions for IOM_BEGIN, IOM_END, and IOM_SIZE */
#include <dev/isa/isareg.h>
/*
* Initialization
*/
.data
#if NLAPIC > 0
.align NBPG
.globl _C_LABEL(local_apic), _C_LABEL(lapic_id), _C_LABEL(lapic_tpr)
_C_LABEL(local_apic):
.space LAPIC_ID
_C_LABEL(lapic_id):
.long 0x00000000
.space LAPIC_TPRI-(LAPIC_ID+4)
_C_LABEL(lapic_tpr):
.space LAPIC_PPRI-LAPIC_TPRI
_C_LABEL(lapic_ppr):
.space LAPIC_ISR-LAPIC_PPRI
_C_LABEL(lapic_isr):
.space NBPG-LAPIC_ISR
#endif
.globl _C_LABEL(cpu_id),_C_LABEL(cpu_vendor), _C_LABEL(cpu_brand_id)
.globl _C_LABEL(cpuid_level),_C_LABEL(cpu_feature)
.globl _C_LABEL(cpu_ecxfeature)
.globl _C_LABEL(esym),_C_LABEL(boothowto),_C_LABEL(bootdev)
.globl _C_LABEL(bootinfo), _C_LABEL(bootinfo_size), _C_LABEL(atdevbase)
.globl _C_LABEL(proc0paddr),_C_LABEL(PTDpaddr)
.globl _C_LABEL(biosbasemem),_C_LABEL(biosextmem)
.globl _C_LABEL(bootapiver)
_C_LABEL(cpu): .long 0 # are we 386, 386sx, or 486,
# or Pentium, or..
_C_LABEL(cpu_id): .long 0 # saved from `cpuid' instruction
_C_LABEL(cpu_feature): .long 0 # feature flags from 'cpuid'
# instruction
_C_LABEL(cpu_ecxfeature):.long 0 # extended feature flags from 'cpuid'
_C_LABEL(cpuid_level): .long -1 # max. level accepted by 'cpuid'
# instruction
_C_LABEL(cpu_vendor): .space 16 # vendor string returned by `cpuid'
# instruction
_C_LABEL(cpu_brand_id): .long 0 # brand ID from 'cpuid' instruction
_C_LABEL(esym): .quad 0 # ptr to end of syms
_C_LABEL(atdevbase): .quad 0 # location of start of iomem in virtual
_C_LABEL(bootapiver): .long 0 # /boot API version
_C_LABEL(bootdev): .long 0 # device we booted from
_C_LABEL(proc0paddr): .quad 0
_C_LABEL(PTDpaddr): .quad 0 # paddr of PTD, for libkvm
#ifndef REALBASEMEM
_C_LABEL(biosbasemem): .long 0 # base memory reported by BIOS
#else
_C_LABEL(biosbasemem): .long REALBASEMEM
#endif
#ifndef REALEXTMEM
_C_LABEL(biosextmem): .long 0 # extended memory reported by BIOS
#else
_C_LABEL(biosextmem): .long REALEXTMEM
#endif
#define _RELOC(x) ((x) - KERNBASE)
#define RELOC(x) _RELOC(_C_LABEL(x))
.globl gdt64
gdt64:
.word gdt64_end-gdt64_start
.quad _RELOC(gdt64_start)
.align 64
gdt64_start:
.quad 0x0000000000000000 /* always empty */
.quad 0x00af9a000000ffff /* kernel CS */
.quad 0x00cf92000000ffff /* kernel DS */
gdt64_end:
farjmp64:
.long longmode-KERNBASE
.word GSEL(GCODE_SEL, SEL_KPL)
.space 512
tmpstk:
.globl _C_LABEL(cpu_private)
.comm _C_LABEL(cpu_private),NBPG,NBPG
/*
* Some hackage to deal with 64bit symbols in 32 bit mode.
* This may not be needed if things are cleaned up a little.
*/
.text
.globl _C_LABEL(kernel_text)
.set _C_LABEL(kernel_text),KERNTEXTOFF
.code32
.globl start
start: movw $0x1234,0x472 # warm boot
/*
* Load parameters from stack
* (howto, bootdev, bootapiver, esym, extmem, cnvmem, ac, av)
*/
movl 4(%esp),%eax
movl %eax, RELOC(boothowto)
movl 8(%esp),%eax
movl %eax, RELOC(bootdev)
movl 16(%esp), %eax
testl %eax,%eax
jz 1f
addl $KERNBASE_LO,%eax
movl $RELOC(esym),%ebp
movl %eax,(%ebp)
movl $KERNBASE_HI,4(%ebp)
1:
movl 20(%esp), %eax
movl %eax, RELOC(biosextmem)
movl 24(%esp), %eax
movl %eax, RELOC(biosbasemem)
movl 12(%esp), %eax
movl %eax, RELOC(bootapiver)
/*
* Copy the boot arguments to bootinfo[] in machdep.c.
*
* We are passed the size of bootinfo[] in bootinfo_size, and
* we report how much data /boot passed us back in the same variable.
*
* machdep.c can then take action if bootinfo_size >= bootinfo[]
* (which would meant that we may have been passed too much data).
*/
movl 28(%esp), %eax
movl %eax, %ecx
cmpl RELOC(bootinfo_size), %ecx /* Too much? */
jnc bi_size_ok
movl RELOC(bootinfo_size), %ecx /* Only copy this much */
bi_size_ok:
movl %eax, RELOC(bootinfo_size) /* Report full amount */
movl $RELOC(bootinfo), %edi /* Destination */
movl 32(%esp), %esi /* Source */
rep movsb /* Copy this many bytes */
/* First, reset the PSL. */
pushl $PSL_MBO
popfl
xorl %eax,%eax
cpuid
movl %eax,RELOC(cpuid_level)
movl $RELOC(cpu_vendor),%ebp
movl %ebx,(%ebp)
movl %edx,4(%ebp)
movl %ecx,8(%ebp)
movl $0, 12(%ebp)
movl $1,%eax
cpuid
movl %eax,RELOC(cpu_id)
movl %ecx,RELOC(cpu_ecxfeature)
movl %edx,RELOC(cpu_feature)
movl $0x80000001, %eax
cpuid
andl $CPUID_NXE, %edx /* other bits may clash */
orl %edx, RELOC(cpu_feature)
/* Brand ID is bits 0-7 of %ebx */
andl $255,%ebx
movl %ebx,RELOC(cpu_brand_id)
/*
* Finished with old stack; load new %esp now instead of later so we
* can trace this code without having to worry about the trace trap
* clobbering the memory test or the zeroing of the bss+bootstrap page
* tables.
*
* The boot program should check:
* text+data <= &stack_variable - more_space_for_stack
* text+data+bss+pad+space_for_page_tables <= end_of_memory
* Oops, the gdt is in the carcass of the boot program so clearing
* the rest of memory is still not possible.
*/
movl $RELOC(tmpstk),%esp
/*
* Virtual address space of kernel:
*
* text | data | bss | [syms] | page dir | proc0 kstack | L1 ptp | L2 ptp | L3
* 0 1 2 3
*/
#if L2_SLOT_KERNBASE > 0
#define TABLE_L2_ENTRIES (2 * (NKL2_KIMG_ENTRIES + 1))
#else
#define TABLE_L2_ENTRIES (NKL2_KIMG_ENTRIES + 1)
#endif
#if L3_SLOT_KERNBASE > 0
#define TABLE_L3_ENTRIES (2 * NKL3_KIMG_ENTRIES)
#else
#define TABLE_L3_ENTRIES NKL3_KIMG_ENTRIES
#endif
#define PROC0_PML4_OFF 0
#define PROC0_STK_OFF (PROC0_PML4_OFF + NBPG)
#define PROC0_PTP3_OFF (PROC0_STK_OFF + UPAGES * NBPG)
#define PROC0_PTP2_OFF (PROC0_PTP3_OFF + NKL4_KIMG_ENTRIES * NBPG)
#define PROC0_PTP1_OFF (PROC0_PTP2_OFF + TABLE_L3_ENTRIES * NBPG)
#define PROC0_DMP3_OFF (PROC0_PTP1_OFF + TABLE_L2_ENTRIES * NBPG)
#define PROC0_DMP2_OFF (PROC0_DMP3_OFF + NDML3_ENTRIES * NBPG)
#define TABLESIZE \
((NKL4_KIMG_ENTRIES + TABLE_L3_ENTRIES + TABLE_L2_ENTRIES + 1 + UPAGES + \
NDML3_ENTRIES + NDML2_ENTRIES) * NBPG)
#define fillkpt \
1: movl %eax,(%ebx) ; /* store phys addr */ \
movl $0,4(%ebx) ; /* upper 32 bits 0 */ \
addl $8,%ebx ; /* next pte/pde */ \
addl $NBPG,%eax ; /* next phys page */ \
loop 1b ; \
/* Find end of kernel image. */
movl $RELOC(end),%edi
#if (NKSYMS || defined(DDB) || defined(LKM)) && !defined(SYMTAB_SPACE)
/* Save the symbols (if loaded). */
movl RELOC(esym),%eax
testl %eax,%eax
jz 1f
subl $KERNBASE_LO,%eax /* XXX */
movl %eax,%edi
1:
#endif
/* Clear tables */
movl %edi,%esi
addl $PGOFSET,%esi
andl $~PGOFSET,%esi
movl %esi,%edi
xorl %eax,%eax
cld
movl $TABLESIZE,%ecx
shrl $2,%ecx
rep
stosl
leal (PROC0_PTP1_OFF)(%esi), %ebx
/*
* Compute etext - KERNBASE. This can't be > 4G, or we can't deal
* with it anyway, since we can't load it in 32 bit mode. So use
* the bottom 32 bits.
*/
movl $RELOC(etext),%edx
addl $PGOFSET,%edx
andl $~PGOFSET,%edx
/*
* Skip the first MB.
*/
movl $(KERNTEXTOFF_LO - KERNBASE_LO),%eax
movl %eax,%ecx
shrl $(PGSHIFT-3),%ecx /* ((n >> PGSHIFT) << 3) for # pdes */
addl %ecx,%ebx
/* Map kernel text read-only */
movl %edx,%ecx
subl %eax,%ecx
shrl $PGSHIFT,%ecx
orl $(PG_V|PG_KR),%eax
fillkpt
/* Map the data, BSS, and bootstrap tables read-write. */
leal (PG_V|PG_KW)(%edx),%eax
movl $TABLESIZE,%ecx
addl %esi,%ecx /* %ecx = &end[TABLESIZE] */
subl %edx,%ecx /* %ecx = %ecx - etext */
shrl $PGSHIFT,%ecx
fillkpt
/* Map ISA I/O mem (later atdevbase) */
movl $(IOM_BEGIN|PG_V|PG_KW/*|PG_N*/),%eax
movl $(IOM_SIZE>>PGSHIFT),%ecx
fillkpt
/* Set up level 2 pages */
leal (PROC0_PTP2_OFF)(%esi),%ebx
leal (PROC0_PTP1_OFF)(%esi),%eax
orl $(PG_V|PG_KW), %eax
movl $(NKL2_KIMG_ENTRIES+1),%ecx
fillkpt
#if L2_SLOT_KERNBASE > 0
/* If needed, set up level 2 entries for actual kernel mapping */
leal (PROC0_PTP2_OFF+ L2_SLOT_KERNBASE*8)(%esi),%ebx
leal (PROC0_PTP1_OFF)(%esi),%eax
orl $(PG_V|PG_KW), %eax
movl $(NKL2_KIMG_ENTRIES+1),%ecx
fillkpt
#endif
/* Set up level 3 pages */
leal (PROC0_PTP3_OFF)(%esi),%ebx
leal (PROC0_PTP2_OFF)(%esi),%eax
orl $(PG_V|PG_KW), %eax
movl $NKL3_KIMG_ENTRIES,%ecx
fillkpt
#if L3_SLOT_KERNBASE > 0
/* If needed, set up level 3 entries for actual kernel mapping */
leal (PROC0_PTP3_OFF+ L3_SLOT_KERNBASE*8)(%esi),%ebx
leal (PROC0_PTP2_OFF)(%esi),%eax
orl $(PG_V|PG_KW), %eax
movl $NKL3_KIMG_ENTRIES,%ecx
fillkpt
#endif
/* Set up top level entries for identity mapping */
leal (PROC0_PML4_OFF)(%esi),%ebx
leal (PROC0_PTP3_OFF)(%esi),%eax
orl $(PG_V|PG_KW), %eax
movl $NKL4_KIMG_ENTRIES,%ecx
fillkpt
/* Set up top level entries for actual kernel mapping */
leal (PROC0_PML4_OFF + L4_SLOT_KERNBASE*8)(%esi),%ebx
leal (PROC0_PTP3_OFF)(%esi),%eax
orl $(PG_V|PG_KW), %eax
movl $NKL4_KIMG_ENTRIES,%ecx
fillkpt
/*
* Map the first 4 GB with the direct map. We'll map the rest
* in pmap_bootstrap. But we always need the first 4GB during
* bootstrap.
*/
leal (PROC0_DMP2_OFF)(%esi), %ebx
xorl %eax, %eax
orl $(PG_V|PG_KW|PG_PS|PG_G), %eax
movl $(NDML2_ENTRIES * NPDPG), %ecx
1: movl %eax, (%ebx)
movl $0, 4(%ebx)
addl $8, %ebx
addl $NBPD_L2, %eax
loop 1b
leal (PROC0_DMP3_OFF)(%esi), %ebx
leal (PROC0_DMP2_OFF)(%esi), %eax
orl $(PG_V|PG_KW), %eax
movl $NDML2_ENTRIES, %ecx
fillkpt
leal (PROC0_PML4_OFF + PDIR_SLOT_DIRECT * 8)(%esi), %ebx
leal (PROC0_DMP3_OFF)(%esi), %eax
orl $(PG_V|PG_KW), %eax
movl $NDML3_ENTRIES, %ecx
fillkpt
/* Install recursive top level PDE */
leal (PROC0_PML4_OFF + PDIR_SLOT_PTE*8)(%esi),%ebx
leal (PROC0_PML4_OFF)(%esi),%eax
orl $(PG_V|PG_KW),%eax
movl %eax,(%ebx)
movl $0, 4(%ebx)
/* Save phys. addr of PTD, for libkvm. */
movl $RELOC(PTDpaddr),%ebp
movl %esi,(%ebp)
movl $0,4(%ebp)
/*
* Startup checklist:
* 1. Enable PAE (and SSE while here).
*/
movl %cr4,%eax
orl $(CR4_DEFAULT),%eax
movl %eax,%cr4
/*
* 2. Set Long Mode Enable in EFER. Also enable the
* syscall extensions.
*/
movl $MSR_EFER,%ecx
rdmsr
xorl %eax,%eax /* XXX */
orl $(EFER_LME|EFER_SCE),%eax
wrmsr
/*
* 3. Load %cr3 with pointer to PML4.
*/
movl %esi,%eax
movl %eax,%cr3
/*
* 4. Enable paging and the rest of it.
*/
movl %cr0,%eax
orl $(CR0_PE|CR0_PG|CR0_NE|CR0_TS|CR0_MP|CR0_WP),%eax
movl %eax,%cr0
jmp compat
compat:
/*
* 5.
* Not quite done yet, we're now in a compatibility segment,
* in legacy mode. We must jump to a long mode segment.
* Need to set up a temporary GDT with a long mode segment
* in it to do that.
*/
movl $RELOC(gdt64),%eax
lgdt (%eax)
movl $RELOC(farjmp64),%eax
ljmp *(%eax)
.code64
longmode:
/*
* 6.
* Finally, we're in long mode. However, we're still
* in the identity mapped area (could not jump out
* of that earlier because it would have been a > 32bit
* jump). We can do that now, so here we go.
*/
movabsq $longmode_hi,%rax
jmp *%rax
longmode_hi:
/*
* We have arrived.
* There's no need anymore for the identity mapping in low
* memory, remove it.
*/
movq $KERNBASE,%r8
#if L2_SLOT_KERNBASE > 0
movq $(NKL2_KIMG_ENTRIES+1),%rcx
leaq (PROC0_PTP2_OFF)(%rsi),%rbx
addq %r8, %rbx
1: movq $0,(%rbx)
addq $8,%rbx
loop 1b
#endif
#if L3_SLOT_KERNBASE > 0
movq $NKL3_KIMG_ENTRIES,%rcx
leaq (PROC0_PTP3_OFF)(%rsi),%rbx
addq %r8, %rbx
1: movq $0,(%rbx)
addq $8,%rbx
loop 1b
#endif
movq $NKL4_KIMG_ENTRIES,%rcx
leaq (PROC0_PML4_OFF)(%rsi),%rbx # old, phys address of PML4
addq %r8, %rbx # new, virtual address of PML4
1: movq $0,(%rbx)
addq $8,%rbx
loop 1b
/* Relocate atdevbase. */
movq $(TABLESIZE+KERNBASE),%rdx
addq %rsi,%rdx
movq %rdx,_C_LABEL(atdevbase)(%rip)
/* Set up bootstrap stack. */
leaq (PROC0_STK_OFF)(%rsi),%rax
addq %r8,%rax
movq %rax,_C_LABEL(proc0paddr)(%rip)
leaq (USPACE-FRAMESIZE)(%rax),%rsp
movq %rsi,PCB_CR3(%rax) # pcb->pcb_cr3
xorq %rbp,%rbp # mark end of frames
xorw %ax,%ax
movw %ax,%gs
movw %ax,%fs
/* XXX merge these */
leaq TABLESIZE(%rsi),%rdi
call _C_LABEL(init_x86_64)
call _C_LABEL(main)
/*****************************************************************************/
/*
* Signal trampoline; copied to top of user stack.
*/
NENTRY(sigcode)
call *%rax
movq %rsp,%rdi
pushq %rdi /* fake return address */
movq $SYS_sigreturn,%rax
int $0x80
movq $SYS_exit,%rax
syscall
.globl _C_LABEL(esigcode)
_C_LABEL(esigcode):
/*
* void lgdt(struct region_descriptor *rdp);
* Change the global descriptor table.
*/
NENTRY(lgdt)
/* Reload the descriptor table. */
movq %rdi,%rax
lgdt (%rax)
/* Flush the prefetch q. */
jmp 1f
nop
1: /* Reload "stale" selectors. */
movl $GSEL(GDATA_SEL, SEL_KPL),%eax
movl %eax,%ds
movl %eax,%es
movl %eax,%ss
/* Reload code selector by doing intersegment return. */
popq %rax
pushq $GSEL(GCODE_SEL, SEL_KPL)
pushq %rax
lretq
ENTRY(setjmp)
/*
* Only save registers that must be preserved across function
* calls according to the ABI (%rbx, %rsp, %rbp, %r12-%r15)
* and %rip.
*/
movq %rdi,%rax
movq %rbx,(%rax)
movq %rsp,8(%rax)
movq %rbp,16(%rax)
movq %r12,24(%rax)
movq %r13,32(%rax)
movq %r14,40(%rax)
movq %r15,48(%rax)
movq (%rsp),%rdx
movq %rdx,56(%rax)
xorl %eax,%eax
ret
ENTRY(longjmp)
movq %rdi,%rax
movq (%rax),%rbx
movq 8(%rax),%rsp
movq 16(%rax),%rbp
movq 24(%rax),%r12
movq 32(%rax),%r13
movq 40(%rax),%r14
movq 48(%rax),%r15
movq 56(%rax),%rdx
movq %rdx,(%rsp)
xorl %eax,%eax
incl %eax
ret
/*****************************************************************************/
/*
* The following primitives manipulate the run queues.
* _whichqs tells which of the 32 queues _qs
* have processes in them. Setrq puts processes into queues, Remrq
* removes them from queues. The running process is on no queue,
* other processes are on a queue related to p->p_pri, divided by 4
* actually to shrink the 0-127 range of priorities into the 32 available
* queues.
*/
.globl _C_LABEL(whichqs),_C_LABEL(qs)
.globl _C_LABEL(uvmexp),_C_LABEL(panic)
#if NAPM > 0
.globl _C_LABEL(apm_cpu_idle),_C_LABEL(apm_cpu_busy)
#endif
#ifdef DIAGNOSTIC
NENTRY(switch_error1)
movabsq $1f,%rdi
call _C_LABEL(panic)
/* NOTREACHED */
1: .asciz "cpu_switch 1"
NENTRY(switch_error2)
movabsq $1f,%rdi
call _C_LABEL(panic)
/* NOTREACHED */
1: .asciz "cpu_switch 2"
NENTRY(switch_error3)
movabsq $1f,%rdi
call _C_LABEL(panic)
/* NOTREACHED */
1: .asciz "cpu_switch 3"
#endif /* DIAGNOSTIC */
/*
* int cpu_switch(struct proc *)
* Find a runnable process and switch to it. Wait if necessary. If the new
* proc is the same as the old one, we short-circuit the context save and
* restore.
*/
ENTRY(cpu_switch)
pushq %rbx
pushq %rbp
pushq %r12
pushq %r13
pushq %r14
pushq %r15
movq %rdi,%r13
/*
* Clear curproc so that we don't accumulate system time while idle.
* This also insures that schedcpu() will move the old proc to
* the correct queue if it happens to get called from the spllower()
* below and changes the priority. (See corresponding comment in
* userret()).
*/
movq $0,CPUVAR(CURPROC)
/*
* First phase: find new proc.
*
* Registers:
* %rax - queue head, scratch, then zero
* %r8 - queue number
* %ecx - cached value of whichqs
* %rdx - next process in queue
* %r13 - old proc
* %r12 - new proc
*/
/* Look for new proc. */
cli # splhigh doesn't do a cli
movl _C_LABEL(whichqs)(%rip),%ecx
bsfl %ecx,%r8d # find a full q
jnz switch_dequeue
/*
* idling: save old context
*
* Registers:
* %rax, %rcx - scratch
* %r13 - old proc, then old pcb
* %r12 - idle pcb
*/
/* old proc still in %rdi */
call _C_LABEL(pmap_deactivate)
movq P_ADDR(%r13),%r13
/* Save stack pointers */
movq %rsp,PCB_RSP(%r13)
movq %rbp,PCB_RBP(%r13)
/* Find idle PCB for this CPU */
#ifndef MULTIPROCESSOR
leaq _C_LABEL(proc0)(%rip),%rcx
movq P_ADDR(%rcx),%r12
movl P_MD_TSS_SEL(%rcx),%edx
#else
movq CPUVAR(IDLE_PCB),%r12
movl CPUVAR(IDLE_TSS_SEL),%edx
#endif
movq $0,CPUVAR(CURPROC)
/* Restore the idle context (avoid interrupts) */
cli
/* Restore stack pointers. */
movq PCB_RSP(%r12),%rsp
movq PCB_RBP(%r12),%rbp
/* Switch address space. */
movq PCB_CR3(%r12),%rcx
movq %rcx,%cr3
#ifdef MULTIPROCESSOR
movq CPUVAR(GDT),%rax
#else
movq _C_LABEL(gdtstore)(%rip),%rax
#endif
/* Switch TSS. Reset "task busy" flag before */
andl $~0x0200,4(%rax,%rdx, 1)
ltr %dx
/* Restore cr0 (including FPU state). */
movl PCB_CR0(%r12),%ecx
movq %rcx,%cr0
SET_CURPCB(%r12)
xorq %r13,%r13
sti
idle_unlock:
#if defined(MULTIPROCESSOR) || defined(LOCKDEBUG)
call _C_LABEL(sched_unlock_idle)
#endif
/* Interrupts are okay again. */
movl $IPL_NONE,%edi
call _C_LABEL(Xspllower)
jmp idle_start
idle_zero:
sti
call _C_LABEL(uvm_pageidlezero)
cli
cmpl $0,_C_LABEL(whichqs)(%rip)
jnz idle_exit
idle_loop:
/* Try to zero some pages. */
movl _C_LABEL(uvm)+UVM_PAGE_IDLE_ZERO(%rip),%ecx
testl %ecx,%ecx
jnz idle_zero
sti
hlt
NENTRY(mpidle)
idle_start:
cli
cmpl $0,_C_LABEL(whichqs)(%rip)
jz idle_loop
idle_exit:
movl $IPL_HIGH,CPUVAR(ILEVEL)
sti
#if defined(MULTIPROCESSOR) || defined(LOCKDEBUG)
call _C_LABEL(sched_lock_idle)
#endif
switch_search:
movl _C_LABEL(whichqs)(%rip),%ecx
bsfl %ecx,%r8d
jz idle_unlock
switch_dequeue:
sti
movq %r8,%r9
shlq $4, %r9
leaq _C_LABEL(qs)(%rip),%rax
addq %r9,%rax
/* movq (%rax),%rax */
movq P_FORW(%rax),%r12 # unlink from front of process q
#ifdef DIAGNOSTIC
cmpq %r12,%rax # linked to self (i.e. nothing queued)?
je _C_LABEL(switch_error1) # not possible
#endif /* DIAGNOSTIC */
movq P_FORW(%r12),%rdx
movq %rdx,P_FORW(%rax)
movq %rax,P_BACK(%rdx)
cmpq %rdx,%rax # q empty?
jne 3f
btrl %r8d,%ecx # yes, clear to indicate empty
movl %ecx,_C_LABEL(whichqs)(%rip) # update q status
3: /* We just did it. */
xorq %rax,%rax
movl %eax,CPUVAR(RESCHED)
switch_resume:
#ifdef DIAGNOSTIC
cmpq %rax,P_WCHAN(%r12)
jne _C_LABEL(switch_error2)
cmpb $SRUN,P_STAT(%r12)
jne _C_LABEL(switch_error3)
#endif
/* Isolate proc. XXX Is this necessary? */
movq %rax,P_BACK(%r12)
/* Record new proc. */
movb $SONPROC,P_STAT(%r12) # p->p_stat = SONPROC
SET_CURPROC(%r12,%rcx)
/* Skip context switch if same proc. */
xorl %ebx,%ebx
cmpq %r12,%r13
je switch_return
/* If old proc exited, don't bother. */
testq %r13,%r13
jz switch_exited
/*
* Second phase: save old context.
*
* Registers:
* %rax, %rcx - scratch
* %r13 - old proc, then old pcb
* %r12 - new proc
*/
movq %r13,%rdi
call pmap_deactivate
movq P_ADDR(%r13),%r13
/* Save stack pointers. */
movq %rsp,PCB_RSP(%r13)
movq %rbp,PCB_RBP(%r13)
switch_exited:
/*
* Third phase: restore saved context.
*
* Registers:
* %rax, %rcx, %rdx - scratch
* %r13 - new pcb
* %r12 - new process
*/
/* No interrupts while loading new state. */
cli
movq P_ADDR(%r12),%r13
/* Restore stack pointers. */
movq PCB_RSP(%r13),%rsp
movq PCB_RBP(%r13),%rbp
#if 0
/* Don't bother with the rest if switching to a system process. */
testl $P_SYSTEM,P_FLAG(%r12)
jnz switch_restored
#endif
/* Load TSS info. */
#ifdef MULTIPROCESSOR
movq CPUVAR(GDT),%rax
#else
movq _C_LABEL(gdtstore)(%rip),%rax
#endif
movl P_MD_TSS_SEL(%r12),%edx
/* Switch TSS. Reset "task busy" flag before */
andl $~0x0200,4(%rax,%rdx, 1)
ltr %dx
movq %r12,%rdi
call _C_LABEL(pmap_activate)
#if 0
switch_restored:
#endif
/* Restore cr0 (including FPU state). */
movl PCB_CR0(%r13),%ecx
#ifdef MULTIPROCESSOR
movq PCB_FPCPU(%r13),%r8
cmpq CPUVAR(SELF),%r8
jz 1f
orl $CR0_TS,%ecx
1:
#endif
movq %rcx,%cr0
SET_CURPCB(%r13)
/* Interrupts are okay again. */
sti
switch_return:
#if defined(MULTIPROCESSOR) || defined(LOCKDEBUG)
call _C_LABEL(sched_unlock_idle)
#endif
movl $IPL_NONE,%edi
call _C_LABEL(Xspllower)
movl $IPL_HIGH,CPUVAR(ILEVEL)
movl %ebx,%eax
popq %r15
popq %r14
popq %r13
popq %r12
popq %rbp
popq %rbx
ret
ENTRY(cpu_switchto)
pushq %rbx
pushq %rbp
pushq %r12
pushq %r13
pushq %r14
pushq %r15
movq %rdi,%r13
movq %rsi,%r12
movq $0,CPUVAR(CURPROC)
xorq %rax,%rax
jmp switch_resume
/*
* void switch_exit(struct proc *l, void (*exit)(struct proc *));
* Switch to proc0's saved context and deallocate the address space and kernel
* stack for p. Then jump into cpu_switch(), as if we were in proc0 all along.
*/
.globl _C_LABEL(proc0)
ENTRY(switch_exit)
#ifdef MULTIPROCESSOR
movq CPUVAR(IDLE_PCB),%r8
movl CPUVAR(IDLE_TSS_SEL),%edx
#else
leaq _C_LABEL(proc0)(%rip),%r9
movq P_ADDR(%r9),%r8
movl P_MD_TSS_SEL(%r9),%edx
#endif
/* In case we fault... */
movq $0,CPUVAR(CURPROC)
cli
/* Restore stack pointers. */
movq PCB_RSP(%r8),%rsp
movq PCB_RBP(%r8),%rbp
/* Load TSS info. */
#ifdef MULTIPROCESSOR
movq CPUVAR(GDT),%rax
#else
movq _C_LABEL(gdtstore)(%rip),%rax
#endif
/* Switch address space. */
movq PCB_CR3(%r8),%rcx
movq %rcx,%cr3
/* Switch TSS. */
andl $~0x0200,4-SEL_KPL(%rax,%rdx,1)
ltr %dx
/* We're always in the kernel, so we don't need the LDT. */
/* Restore cr0 (including FPU state). */
movl PCB_CR0(%r8),%ecx
movq %rcx,%cr0
/* Record new pcb. */
SET_CURPCB(%r8)
/* Interrupts are okay again. */
sti
/*
* Schedule the dead process's vmspace and stack to be freed.
* {lpw_}exit2(l). Function still in %rsi (2nd arg), proc in
* %rdi (first arg).
*/
call *%rsi
/* Jump into cpu_switch() with the right state. */
xorq %r13,%r13
movq %r13, CPUVAR(CURPROC)
jmp switch_search
/*
* savectx(struct pcb *pcb);
* Update pcb, saving current processor state.
*/
ENTRY(savectx)
/* Save stack pointers. */
movq %rsp,PCB_RSP(%rdi)
movq %rbp,PCB_RBP(%rdi)
ret
IDTVEC(syscall32)
sysret /* go away please */
/*
* syscall insn entry. This currently isn't much faster, but
* it can be made faster in the future.
*/
IDTVEC(syscall)
swapgs
movq %r15,CPUVAR(SCRATCH)
movq CPUVAR(CURPCB),%r15
movq PCB_RSP0(%r15),%r15
xchgq %r15,%rsp
sti
/*
* XXX don't need this whole frame, split of the
* syscall frame and trapframe is needed.
* First, leave some room for the trapno, error,
* ss:rsp, etc, so that all GP registers can be
* saved. Then, fill in the rest.
*/
pushq $(LSEL(LUDATA_SEL, SEL_UPL))
pushq %r15
subq $(TF_RSP-TF_TRAPNO),%rsp
movq CPUVAR(SCRATCH),%r15
subq $32,%rsp
INTR_SAVE_GPRS
movw %fs,TF_FS(%rsp)
movw %gs,TF_GS(%rsp)
movw %es,TF_ES(%rsp)
movw $(LSEL(LUDATA_SEL, SEL_UPL)),TF_DS(%rsp)
movq %r11, TF_RFLAGS(%rsp) /* old rflags from syscall insn */
movq $(LSEL(LUCODE_SEL, SEL_UPL)), TF_CS(%rsp)
movq %rcx,TF_RIP(%rsp)
movq $2,TF_ERR(%rsp)
movq $T_ASTFLT, TF_TRAPNO(%rsp)
movq CPUVAR(CURPROC),%r14
movq %rsp,P_MD_REGS(%r14) # save pointer to frame
andl $~MDP_IRET,P_MD_FLAGS(%r14)
movq %rsp,%rdi
call _C_LABEL(syscall)
1: /* Check for ASTs on exit to user mode. */
cli
CHECK_ASTPENDING(%r11)
je 2f
/* Always returning to user mode here. */
CLEAR_ASTPENDING(%r11)
sti
/* Pushed T_ASTFLT into tf_trapno on entry. */
movq %rsp,%rdi
call _C_LABEL(trap)
jmp 1b
2:
sti
testl $MDP_IRET, P_MD_FLAGS(%r14)
jne iret_return;
syscall_return:
#ifdef DIAGNOSTIC
cmpl $IPL_NONE,CPUVAR(ILEVEL)
jne 3f
#endif
/*
* XXX interrupts off longer than they should be here.
*/
cli
swapgs
movw TF_ES(%rsp),%es
movw TF_FS(%rsp),%fs
movw TF_GS(%rsp),%gs
INTR_RESTORE_GPRS
movw $(LSEL(LUDATA_SEL, SEL_UPL)),%r11
movw %r11,%ds
addq $48,%rsp
popq %rcx /* return rip */
addq $8,%rsp
popq %r11 /* flags as set by sysret insn */
movq %ss:(%rsp),%rsp
sysretq
#ifdef DIAGNOSTIC
3: movabsq $4f, %rdi
movl TF_RAX(%rsp),%esi
movl TF_RDI(%rsp),%edx
movl %ebx,%ecx
movl CPUVAR(ILEVEL),%r8d
xorq %rax,%rax
call _C_LABEL(printf)
#ifdef DDB
int $3
#endif /* DDB */
movl $IPL_NONE,CPUVAR(ILEVEL)
jmp 1b
4: .asciz "WARNING: SPL NOT LOWERED ON SYSCALL %d %d EXIT %x %x\n"
#endif
NENTRY(proc_trampoline)
#ifdef MULTIPROCESSOR
call _C_LABEL(proc_trampoline_mp)
#endif
movl $IPL_NONE,CPUVAR(ILEVEL)
movq %r13,%rdi
call *%r12
INTRFASTEXIT
/* NOTREACHED */
NENTRY(child_trampoline)
#ifdef MULTIPROCESSOR
call _C_LABEL(proc_trampoline_mp)
#endif
movl $IPL_NONE,CPUVAR(ILEVEL)
movq %r13,%rdi
call *%r12
jmp syscall_return
.globl _C_LABEL(osyscall_return)
/* XXX - can we zap the following two? */
/*
* Old call gate entry for syscall. only needed if we're
* going to support running old NetBSD or ibcs2 binaries, etc,
* on NetBSD/amd64.
*/
IDTVEC(oosyscall)
/* Set rflags in trap frame. */
pushfq
popq 8(%rsp)
pushq $7 # size of instruction for restart
jmp osyscall1
/*
* Trap gate entry for int $80 syscall, also used by sigreturn.
*/
IDTVEC(osyscall)
pushq $2 # size of instruction for restart
osyscall1:
pushq $T_ASTFLT # trap # for doing ASTs
INTRENTRY
sti
movq CPUVAR(CURPROC),%rdx
movq %rsp,P_MD_REGS(%rdx) # save pointer to frame
movq %rsp,%rdi
call _C_LABEL(syscall)
_C_LABEL(osyscall_return):
2: /* Check for ASTs on exit to user mode. */
cli
CHECK_ASTPENDING(%r11)
je 1f
/* Always returning to user mode here. */
CLEAR_ASTPENDING(%r11)
sti
/* Pushed T_ASTFLT into tf_trapno on entry. */
movq %rsp,%rdi
call _C_LABEL(trap)
jmp 2b
iret_return:
#ifndef DIAGNOSTIC
1: INTRFASTEXIT
#else /* DIAGNOSTIC */
1: cmpl $IPL_NONE,CPUVAR(ILEVEL)
jne 3f
INTRFASTEXIT
3: sti
movabsq $4f, %rdi
xorq %rax,%rax
call _C_LABEL(printf)
#ifdef DDB
int $3
#endif /* DDB */
movl $IPL_NONE,CPUVAR(ILEVEL)
jmp 2b
4: .asciz "WARNING: SPL NOT LOWERED ON SYSCALL EXIT\n"
#endif /* DIAGNOSTIC */
ENTRY(pagezero)
movq $-PAGE_SIZE,%rdx
subq %rdx,%rdi
xorq %rax,%rax
1:
movnti %rax,(%rdi,%rdx)
movnti %rax,8(%rdi,%rdx)
movnti %rax,16(%rdi,%rdx)
movnti %rax,24(%rdi,%rdx)
addq $32,%rdx
jne 1b
sfence
ret