main.c revision 203829
166458Sdfr/*-
266458Sdfr * Initial implementation:
366458Sdfr * Copyright (c) 2001 Robert Drehmel
466458Sdfr * All rights reserved.
566458Sdfr *
666458Sdfr * As long as the above copyright statement and this notice remain
766458Sdfr * unchanged, you can do what ever you want with this file.
866458Sdfr */
966458Sdfr/*-
1066458Sdfr * Copyright (c) 2008 Marius Strobl <marius@FreeBSD.org>
1166458Sdfr * All rights reserved.
1266458Sdfr *
1366458Sdfr * Redistribution and use in source and binary forms, with or without
1466458Sdfr * modification, are permitted provided that the following conditions
1566458Sdfr * are met:
1666458Sdfr * 1. Redistributions of source code must retain the above copyright
1766458Sdfr *    notice, this list of conditions and the following disclaimer.
1866458Sdfr * 2. Redistributions in binary form must reproduce the above copyright
1966458Sdfr *    notice, this list of conditions and the following disclaimer in the
2066458Sdfr *    documentation and/or other materials provided with the distribution.
2166458Sdfr *
2266458Sdfr * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
2366458Sdfr * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
2466458Sdfr * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
2566458Sdfr * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
2666458Sdfr * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
2766458Sdfr * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
2866458Sdfr * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
2966458Sdfr * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
3066458Sdfr * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
3166458Sdfr * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
3266458Sdfr * SUCH DAMAGE.
3366458Sdfr */
3466458Sdfr
3566458Sdfr#include <sys/cdefs.h>
3666458Sdfr__FBSDID("$FreeBSD: head/sys/boot/sparc64/loader/main.c 203829 2010-02-13 14:13:39Z marius $");
3766458Sdfr
/*
 * FreeBSD/sparc64 kernel loader - machine dependent part
 *
 *  - implements copyin and readin functions that map kernel
 *    pages on demand.  The machine independent code does not
 *    know the size of the kernel early enough to pre-enter
 *    TTEs, and installing just one 4MB mapping seemed too
 *    limiting to me.
 */
4766458Sdfr
4866458Sdfr#include <stand.h>
4966458Sdfr#include <sys/param.h>
50117126Sscottl#include <sys/exec.h>
51117126Sscottl#include <sys/linker.h>
5266458Sdfr#include <sys/queue.h>
5366458Sdfr#include <sys/types.h>
5466458Sdfr
5566458Sdfr#include <vm/vm.h>
5666458Sdfr#include <machine/asi.h>
5766458Sdfr#include <machine/cmt.h>
58146214Snyan#include <machine/cpufunc.h>
5966458Sdfr#include <machine/elf.h>
6066458Sdfr#include <machine/fireplane.h>
6166458Sdfr#include <machine/jbus.h>
6266458Sdfr#include <machine/lsu.h>
6366458Sdfr#include <machine/metadata.h>
6466458Sdfr#include <machine/tte.h>
6566458Sdfr#include <machine/tlb.h>
6666458Sdfr#include <machine/upa.h>
6766458Sdfr#include <machine/ver.h>
6866458Sdfr#include <machine/vmparam.h>
6966458Sdfr
7066458Sdfr#include "bootstrap.h"
7166458Sdfr#include "libofw.h"
7266458Sdfr#include "dev_net.h"
7366458Sdfr
7466458Sdfr#ifndef CTASSERT
7566458Sdfr#define	CTASSERT(x)		_CTASSERT(x, __LINE__)
76135262Sphk#define	_CTASSERT(x, y)		__CTASSERT(x, y)
77135262Sphk#define	__CTASSERT(x, y)	typedef char __assert ## y[(x) ? 1 : -1]
7866458Sdfr#endif
7966458Sdfr
8066458Sdfrextern char bootprog_name[], bootprog_rev[], bootprog_date[], bootprog_maker[];
8166458Sdfr
/* Placement and size constants for the loader heap and the load area. */
enum {
	HEAPVA		= 0x800000,	/* virtual address requested for the heap */
	HEAPSZ		= 0x1000000,	/* size of the claimed heap (16MB) */
	LOADSZ		= 0x1000000	/* for kernel and modules */
};
8766458Sdfr
/* At least Sun Fire V1280 requires page sized allocations to be claimed. */
8966458SdfrCTASSERT(HEAPSZ % PAGE_SIZE == 0);
9066458Sdfr
/*
 * Platform specific MMU operations.  The global pointer is set in main()
 * to either the sun4u or the sun4v implementation and is used by the
 * copyin/readin hooks to map memory on demand.
 */
static struct mmu_ops {
	/* One-time set up of the TLB bookkeeping. */
	void (*tlb_init)(void);
	/* Make sure [va, va + len) is backed by mapped 4MB pages. */
	int (*mmu_mapin)(vm_offset_t va, vm_size_t len);
} *mmu_ops;

/* Signature used by __elfN(exec)() to call the kernel entry point. */
typedef void kernel_entry_t(vm_offset_t mdp, u_long o1, u_long o2, u_long o3,
    void *openfirmware);
98135262Sphk
9966458Sdfrstatic inline u_long dtlb_get_data_sun4u(u_int);
10066458Sdfrstatic void dtlb_enter_sun4u(u_long, u_long);
10166458Sdfrstatic vm_offset_t dtlb_va_to_pa_sun4u(vm_offset_t);
10266458Sdfrstatic inline u_long itlb_get_data_sun4u(u_int);
10366458Sdfrstatic void itlb_enter_sun4u(u_long, u_long);
10466458Sdfrstatic vm_offset_t itlb_va_to_pa_sun4u(vm_offset_t);
10566458Sdfrstatic void itlb_relocate_locked0_sun4u(void);
10666458Sdfrextern vm_offset_t md_load(char *, vm_offset_t *);
10766458Sdfrstatic int sparc64_autoload(void);
10866458Sdfrstatic ssize_t sparc64_readin(const int, vm_offset_t, const size_t);
109177215Simpstatic ssize_t sparc64_copyin(const void *, vm_offset_t, size_t);
110117126Sscottlstatic void sparc64_maphint(vm_offset_t, size_t);
111117126Sscottlstatic vm_offset_t claim_virt(vm_offset_t, size_t, int);
11266458Sdfrstatic vm_offset_t alloc_phys(size_t, int);
113135262Sphkstatic int map_phys(int, size_t, vm_offset_t, vm_offset_t);
11466458Sdfrstatic void release_phys(vm_offset_t, u_int);
11566458Sdfrstatic int __elfN(exec)(struct preloaded_file *);
11666458Sdfrstatic int mmu_mapin_sun4u(vm_offset_t, vm_size_t);
117135262Sphkstatic int mmu_mapin_sun4v(vm_offset_t, vm_size_t);
11866458Sdfrstatic vm_offset_t init_heap(void);
11966458Sdfrstatic phandle_t find_bsp_sun4u(phandle_t, uint32_t);
120135262Sphkconst char *cpu_cpuid_prop_sun4u(void);
12166458Sdfruint32_t cpu_get_mid_sun4u(void);
12266458Sdfrstatic void tlb_init_sun4u(void);
12366458Sdfrstatic void tlb_init_sun4v(void);
12466458Sdfr
12566458Sdfr#ifdef LOADER_DEBUG
12666458Sdfrtypedef u_int64_t tte_t;
12766458Sdfr
12866458Sdfrstatic void pmap_print_tlb_sun4u(void);
12966458Sdfrstatic void pmap_print_tte_sun4u(tte_t, tte_t);
13066458Sdfr#endif
13166458Sdfr
/* The two MMU back ends main() chooses between. */
static struct mmu_ops mmu_ops_sun4u = { tlb_init_sun4u, mmu_mapin_sun4u };
static struct mmu_ops mmu_ops_sun4v = { tlb_init_sun4v, mmu_mapin_sun4v };

/* sun4u */
/* Records of the locked mappings entered by mmu_mapin_sun4u(). */
struct tlb_entry *dtlb_store;
struct tlb_entry *itlb_store;
/* Index of the next unused record in dtlb_store/itlb_store. */
u_int dtlb_slot;
u_int itlb_slot;
/* CPU implementation, taken from the version register in tlb_init_sun4u(). */
int cpu_impl;
/* TLB sizes read from the "#dtlb-entries"/"#itlb-entries" properties. */
static u_int dtlb_slot_max;
static u_int itlb_slot_max;

/* sun4v */
/* Indexed by (va >> 22); a te_pa of -1 marks a 4MB page as not yet mapped. */
static struct tlb_entry *tlb_store;
static int is_sun4v = 0;
/*
 * no direct TLB access on sun4v
 * we somewhat arbitrarily declare enough
 * slots to cover a 4GB AS with 4MB pages
 */
#define	SUN4V_TLB_SLOT_MAX	(1 << 10)

/* Highest end address (va + len) passed to the mapin functions so far. */
static vm_offset_t curkva = 0;
/* Base of the heap as returned by OF_claim() in init_heap(). */
static vm_offset_t heapva;

/* Root node of the Open Firmware device tree, obtained in main(). */
static phandle_t root;
15866458Sdfr
15966458Sdfr/*
16066458Sdfr * Machine dependent structures that the machine independent
16166458Sdfr * loader part uses.
16266458Sdfr */
/* Device switch; which entries exist depends on the LOADER_*_SUPPORT knobs. */
struct devsw *devsw[] = {
#ifdef LOADER_DISK_SUPPORT
	&ofwdisk,
#endif
#ifdef LOADER_NET_SUPPORT
	&netdev,
#endif
	0
};
/* Architecture hooks; filled in by main(). */
struct arch_switch archsw;

/* The only supported executable format: ELF, started via __elfN(exec)(). */
static struct file_format sparc64_elf = {
	__elfN(loadfile),
	__elfN(exec)
};
struct file_format *file_formats[] = {
	&sparc64_elf,
	0
};
/* Zero-terminated list of the compiled-in file systems. */
struct fs_ops *file_system[] = {
#ifdef LOADER_UFS_SUPPORT
	&ufs_fsops,
#endif
#ifdef LOADER_CD9660_SUPPORT
	&cd9660_fsops,
#endif
#ifdef LOADER_ZIP_SUPPORT
	&zipfs_fsops,
#endif
#ifdef LOADER_GZIP_SUPPORT
	&gzipfs_fsops,
#endif
#ifdef LOADER_BZIP2_SUPPORT
	&bzipfs_fsops,
#endif
#ifdef LOADER_NFS_SUPPORT
	&nfs_fsops,
#endif
#ifdef LOADER_TFTP_SUPPORT
	&tftp_fsops,
#endif
	0
};
/* Zero-terminated list of the compiled-in network interface drivers. */
struct netif_driver *netif_drivers[] = {
#ifdef LOADER_NET_SUPPORT
	&ofwnet,
#endif
	0
};

/* The Open Firmware console is the only console offered. */
extern struct console ofwconsole;
struct console *consoles[] = {
	&ofwconsole,
	0
};
21866458Sdfr
21966458Sdfr#ifdef LOADER_DEBUG
22066458Sdfrstatic int
22166458Sdfrwatch_phys_set_mask(vm_offset_t pa, u_long mask)
22266458Sdfr{
22366458Sdfr	u_long lsucr;
22466458Sdfr
22566458Sdfr	stxa(AA_DMMU_PWPR, ASI_DMMU, pa & (((2UL << 38) - 1) << 3));
22695710Speter	lsucr = ldxa(0, ASI_LSU_CTL_REG);
22766458Sdfr	lsucr = ((lsucr | LSU_PW) & ~LSU_PM_MASK) |
22866458Sdfr	    (mask << LSU_PM_SHIFT);
22966458Sdfr	stxa(0, ASI_LSU_CTL_REG, lsucr);
23066458Sdfr	return (0);
23166458Sdfr}
23266458Sdfr
23366458Sdfrstatic int
23466458Sdfrwatch_phys_set(vm_offset_t pa, int sz)
23566458Sdfr{
23666458Sdfr	u_long off;
23766458Sdfr
23866458Sdfr	off = (u_long)pa & 7;
23966458Sdfr	/* Test for misaligned watch points. */
24066458Sdfr	if (off + sz > 8)
24166458Sdfr		return (-1);
24266458Sdfr	return (watch_phys_set_mask(pa, ((1 << sz) - 1) << off));
24366458Sdfr}
24466458Sdfr
24566458Sdfr
24666458Sdfrstatic int
24766458Sdfrwatch_virt_set_mask(vm_offset_t va, u_long mask)
24866458Sdfr{
24966458Sdfr	u_long lsucr;
25066458Sdfr
25166458Sdfr	stxa(AA_DMMU_VWPR, ASI_DMMU, va & (((2UL << 41) - 1) << 3));
25266458Sdfr	lsucr = ldxa(0, ASI_LSU_CTL_REG);
25366458Sdfr	lsucr = ((lsucr | LSU_VW) & ~LSU_VM_MASK) |
25466458Sdfr	    (mask << LSU_VM_SHIFT);
25566458Sdfr	stxa(0, ASI_LSU_CTL_REG, lsucr);
25666458Sdfr	return (0);
25766458Sdfr}
25866458Sdfr
25966458Sdfrstatic int
26066458Sdfrwatch_virt_set(vm_offset_t va, int sz)
26166458Sdfr{
26266458Sdfr	u_long off;
26366458Sdfr
26466458Sdfr	off = (u_long)va & 7;
26566458Sdfr	/* Test for misaligned watch points. */
26666458Sdfr	if (off + sz > 8)
26766458Sdfr		return (-1);
26866458Sdfr	return (watch_virt_set_mask(va, ((1 << sz) - 1) << off));
26966458Sdfr}
27066458Sdfr#endif
27166458Sdfr
27266458Sdfr/*
27366458Sdfr * archsw functions
27466458Sdfr */
/*
 * archsw autoload hook.  Nothing is loaded automatically on sparc64, so
 * this just reports success (0).
 */
static int
sparc64_autoload(void)
{

	return (0);
}
28166458Sdfr
28266458Sdfrstatic ssize_t
28366458Sdfrsparc64_readin(const int fd, vm_offset_t va, const size_t len)
28466458Sdfr{
28566458Sdfr
28666458Sdfr	mmu_ops->mmu_mapin(va, len);
28766458Sdfr	return (read(fd, (void *)va, len));
28866458Sdfr}
28966458Sdfr
29066458Sdfrstatic ssize_t
29166458Sdfrsparc64_copyin(const void *src, vm_offset_t dest, size_t len)
29266458Sdfr{
29366458Sdfr
29466458Sdfr	mmu_ops->mmu_mapin(dest, len);
29566458Sdfr	memcpy((void *)dest, src, len);
29666458Sdfr	return (len);
29766458Sdfr}
29866458Sdfr
29966458Sdfrstatic void
30066458Sdfrsparc64_maphint(vm_offset_t va, size_t len)
30166458Sdfr{
30266458Sdfr	vm_paddr_t pa;
30366458Sdfr	vm_offset_t mva;
30466458Sdfr	size_t size;
30566458Sdfr	int i, free_excess = 0;
30666458Sdfr
30766458Sdfr	if (!is_sun4v)
30866458Sdfr		return;
30966458Sdfr
31066458Sdfr	if (tlb_store[va >> 22].te_pa != -1)
31166458Sdfr		return;
31266458Sdfr
31366458Sdfr	/* round up to nearest 4MB page */
31466458Sdfr	size = (len + PAGE_MASK_4M) & ~PAGE_MASK_4M;
31566458Sdfr#if 0
31666458Sdfr	pa = alloc_phys(PAGE_SIZE_256M, PAGE_SIZE_256M);
31766458Sdfr
31866458Sdfr	if (pa != -1)
31966458Sdfr		free_excess = 1;
32066458Sdfr	else
32166458Sdfr#endif
32266458Sdfr		pa = alloc_phys(size, PAGE_SIZE_256M);
32366458Sdfr	if (pa == -1)
32466458Sdfr		pa = alloc_phys(size, PAGE_SIZE_4M);
32566458Sdfr	if (pa == -1)
32666458Sdfr		panic("%s: out of memory", __func__);
32766458Sdfr
32866458Sdfr	for (i = 0; i < size; i += PAGE_SIZE_4M) {
32966458Sdfr		mva = claim_virt(va + i, PAGE_SIZE_4M, 0);
33066458Sdfr		if (mva != (va + i))
33166458Sdfr			panic("%s: can't claim virtual page "
33266458Sdfr			    "(wanted %#lx, got %#lx)",
33366458Sdfr			    __func__, va, mva);
334171312Smarcel
335135262Sphk		tlb_store[mva >> 22].te_pa = pa + i;
33666458Sdfr		if (map_phys(-1, PAGE_SIZE_4M, mva, pa + i) != 0)
33766458Sdfr			printf("%s: can't map physical page\n", __func__);
33866458Sdfr	}
33966458Sdfr	if (free_excess)
34066458Sdfr		release_phys(pa, PAGE_SIZE_256M);
34166458Sdfr}
34266458Sdfr
34366458Sdfr/*
34466458Sdfr * other MD functions
34566458Sdfr */
34666458Sdfrstatic vm_offset_t
34766458Sdfrclaim_virt(vm_offset_t virt, size_t size, int align)
34866458Sdfr{
34966458Sdfr	vm_offset_t mva;
35066458Sdfr
35166458Sdfr	if (OF_call_method("claim", mmu, 3, 1, virt, size, align, &mva) == -1)
35266458Sdfr		return ((vm_offset_t)-1);
35366458Sdfr	return (mva);
35466458Sdfr}
35566458Sdfr
35666458Sdfrstatic vm_offset_t
35766458Sdfralloc_phys(size_t size, int align)
35866458Sdfr{
35966458Sdfr	cell_t phys_hi, phys_low;
36066458Sdfr
36166458Sdfr	if (OF_call_method("claim", memory, 2, 2, size, align, &phys_low,
36266458Sdfr	    &phys_hi) == -1)
36366458Sdfr		return ((vm_offset_t)-1);
36466458Sdfr	return ((vm_offset_t)phys_hi << 32 | phys_low);
36566458Sdfr}
36666458Sdfr
36766458Sdfrstatic int
36866458Sdfrmap_phys(int mode, size_t size, vm_offset_t virt, vm_offset_t phys)
36966458Sdfr{
37066458Sdfr
37166458Sdfr	return (OF_call_method("map", mmu, 5, 0, (uint32_t)phys,
37266458Sdfr	    (uint32_t)(phys >> 32), virt, size, mode));
37366458Sdfr}
37466458Sdfr
37566458Sdfrstatic void
37666458Sdfrrelease_phys(vm_offset_t phys, u_int size)
37766458Sdfr{
37866458Sdfr
37966458Sdfr	(void)OF_call_method("release", memory, 3, 0, (uint32_t)phys,
38066458Sdfr	    (uint32_t)(phys >> 32), size);
38166458Sdfr}
38266458Sdfr
38366458Sdfrstatic int
38466458Sdfr__elfN(exec)(struct preloaded_file *fp)
38566458Sdfr{
38666458Sdfr	struct file_metadata *fmp;
38766458Sdfr	vm_offset_t mdp;
38866458Sdfr	Elf_Addr entry;
38966458Sdfr	Elf_Ehdr *e;
39066458Sdfr	int error;
39166458Sdfr
39266458Sdfr	if ((fmp = file_findmetadata(fp, MODINFOMD_ELFHDR)) == 0)
39366458Sdfr		return (EFTYPE);
39466458Sdfr	e = (Elf_Ehdr *)&fmp->md_data;
39566458Sdfr
39666458Sdfr	if ((error = md_load(fp->f_args, &mdp)) != 0)
39766458Sdfr		return (error);
39866458Sdfr
39966458Sdfr	printf("jumping to kernel entry at %#lx.\n", e->e_entry);
40066458Sdfr#ifdef LOADER_DEBUG
40166458Sdfr	pmap_print_tlb_sun4u();
40266458Sdfr#endif
40366458Sdfr
40466458Sdfr	dev_cleanup();
40566458Sdfr
40666458Sdfr	entry = e->e_entry;
40766458Sdfr
40866458Sdfr	OF_release((void *)heapva, HEAPSZ);
40966458Sdfr
41066458Sdfr	((kernel_entry_t *)entry)(mdp, 0, 0, 0, openfirmware);
41166458Sdfr
41266458Sdfr	panic("%s: exec returned", __func__);
41366458Sdfr}
41466458Sdfr
41566458Sdfrstatic inline u_long
41666458Sdfrdtlb_get_data_sun4u(u_int slot)
41766458Sdfr{
41866458Sdfr
41966458Sdfr	/*
42066458Sdfr	 * We read ASI_DTLB_DATA_ACCESS_REG twice in order to work
42166458Sdfr	 * around errata of USIII and beyond.
42266458Sdfr	 */
42366458Sdfr	(void)ldxa(TLB_DAR_SLOT(slot), ASI_DTLB_DATA_ACCESS_REG);
42466458Sdfr	return (ldxa(TLB_DAR_SLOT(slot), ASI_DTLB_DATA_ACCESS_REG));
42566458Sdfr}
42666458Sdfr
42766458Sdfrstatic inline u_long
42866458Sdfritlb_get_data_sun4u(u_int slot)
42966458Sdfr{
43066458Sdfr
43166458Sdfr	/*
43266458Sdfr	 * We read ASI_ITLB_DATA_ACCESS_REG twice in order to work
43366458Sdfr	 * around errata of USIII and beyond.
43466458Sdfr	 */
43566458Sdfr	(void)ldxa(TLB_DAR_SLOT(slot), ASI_ITLB_DATA_ACCESS_REG);
43666458Sdfr	return (ldxa(TLB_DAR_SLOT(slot), ASI_ITLB_DATA_ACCESS_REG));
43766458Sdfr}
43866458Sdfr
43966458Sdfrstatic vm_offset_t
44066458Sdfrdtlb_va_to_pa_sun4u(vm_offset_t va)
44166458Sdfr{
44266458Sdfr	u_long pstate, reg;
44366458Sdfr	int i;
44466458Sdfr
44566458Sdfr	pstate = rdpr(pstate);
44666458Sdfr	wrpr(pstate, pstate & ~PSTATE_IE, 0);
44766458Sdfr	for (i = 0; i < dtlb_slot_max; i++) {
44866458Sdfr		reg = ldxa(TLB_DAR_SLOT(i), ASI_DTLB_TAG_READ_REG);
44966458Sdfr		if (TLB_TAR_VA(reg) != va)
45066458Sdfr			continue;
45166458Sdfr		reg = dtlb_get_data_sun4u(i);
45266458Sdfr		wrpr(pstate, pstate, 0);
45366458Sdfr		reg >>= TD_PA_SHIFT;
45466458Sdfr		if (cpu_impl >= CPU_IMPL_ULTRASPARCIII)
45566458Sdfr			return (reg & TD_PA_CH_MASK);
45666458Sdfr		return (reg & TD_PA_SF_MASK);
45766458Sdfr	}
45866458Sdfr	wrpr(pstate, pstate, 0);
45966458Sdfr	return (-1);
46066458Sdfr}
46166458Sdfr
46266458Sdfrstatic vm_offset_t
46366458Sdfritlb_va_to_pa_sun4u(vm_offset_t va)
46466458Sdfr{
46566458Sdfr	u_long pstate, reg;
46666458Sdfr	int i;
46766458Sdfr
46866458Sdfr	pstate = rdpr(pstate);
46966458Sdfr	wrpr(pstate, pstate & ~PSTATE_IE, 0);
47066458Sdfr	for (i = 0; i < itlb_slot_max; i++) {
47166458Sdfr		reg = ldxa(TLB_DAR_SLOT(i), ASI_ITLB_TAG_READ_REG);
47266458Sdfr		if (TLB_TAR_VA(reg) != va)
47366458Sdfr			continue;
47466458Sdfr		reg = itlb_get_data_sun4u(i);
475141391Sphk		wrpr(pstate, pstate, 0);
476141391Sphk		reg >>= TD_PA_SHIFT;
477141391Sphk		if (cpu_impl >= CPU_IMPL_ULTRASPARCIII)
478141391Sphk			return (reg & TD_PA_CH_MASK);
479141391Sphk		return (reg & TD_PA_SF_MASK);
480141391Sphk	}
481141391Sphk	wrpr(pstate, pstate, 0);
482141391Sphk	return (-1);
483141391Sphk}
484141391Sphk
485141391Sphkstatic void
486141391Sphkdtlb_enter_sun4u(u_long vpn, u_long data)
487141391Sphk{
48866458Sdfr	u_long reg;
48966458Sdfr
49066458Sdfr	reg = rdpr(pstate);
49166458Sdfr	wrpr(pstate, reg & ~PSTATE_IE, 0);
49266458Sdfr	stxa(AA_DMMU_TAR, ASI_DMMU,
49366458Sdfr	    TLB_TAR_VA(vpn) | TLB_TAR_CTX(TLB_CTX_KERNEL));
49466458Sdfr	stxa(0, ASI_DTLB_DATA_IN_REG, data);
49566458Sdfr	membar(Sync);
49666458Sdfr	wrpr(pstate, reg, 0);
49766458Sdfr}
49866458Sdfr
49966458Sdfrstatic void
50066458Sdfritlb_enter_sun4u(u_long vpn, u_long data)
50166458Sdfr{
50266458Sdfr	u_long reg;
50366458Sdfr	int i;
50466458Sdfr
50566458Sdfr	reg = rdpr(pstate);
50666458Sdfr	wrpr(pstate, reg & ~PSTATE_IE, 0);
50766458Sdfr
50866458Sdfr	if (cpu_impl == CPU_IMPL_ULTRASPARCIIIp) {
509		/*
510		 * Search an unused slot != 0 and explicitly enter the data
511		 * and tag there in order to avoid Cheetah+ erratum 34.
512		 */
513		for (i = 1; i < itlb_slot_max; i++) {
514			if ((itlb_get_data_sun4u(i) & TD_V) != 0)
515				continue;
516
517			stxa(AA_IMMU_TAR, ASI_IMMU,
518			    TLB_TAR_VA(vpn) | TLB_TAR_CTX(TLB_CTX_KERNEL));
519			stxa(TLB_DAR_SLOT(i), ASI_ITLB_DATA_ACCESS_REG, data);
520			flush(PROMBASE);
521			break;
522		}
523		wrpr(pstate, reg, 0);
524		if (i == itlb_slot_max)
525			panic("%s: could not find an unused slot", __func__);
526		return;
527	}
528
529	stxa(AA_IMMU_TAR, ASI_IMMU,
530	    TLB_TAR_VA(vpn) | TLB_TAR_CTX(TLB_CTX_KERNEL));
531	stxa(0, ASI_ITLB_DATA_IN_REG, data);
532	flush(PROMBASE);
533	wrpr(pstate, reg, 0);
534}
535
536static void
537itlb_relocate_locked0_sun4u(void)
538{
539	u_long data, pstate, tag;
540	int i;
541
542	if (cpu_impl != CPU_IMPL_ULTRASPARCIIIp)
543		return;
544
545	pstate = rdpr(pstate);
546	wrpr(pstate, pstate & ~PSTATE_IE, 0);
547
548	data = itlb_get_data_sun4u(0);
549	if ((data & (TD_V | TD_L)) != (TD_V | TD_L)) {
550		wrpr(pstate, pstate, 0);
551		return;
552	}
553
554	/* Flush the mapping of slot 0. */
555	tag = ldxa(TLB_DAR_SLOT(0), ASI_ITLB_TAG_READ_REG);
556	stxa(TLB_DEMAP_VA(TLB_TAR_VA(tag)) | TLB_DEMAP_PRIMARY |
557	    TLB_DEMAP_PAGE, ASI_IMMU_DEMAP, 0);
558	flush(0);	/* The USIII-family ignores the address. */
559
560	/*
561	 * Search a replacement slot != 0 and enter the data and tag
562	 * that formerly were in slot 0.
563	 */
564	for (i = 1; i < itlb_slot_max; i++) {
565		if ((itlb_get_data_sun4u(i) & TD_V) != 0)
566			continue;
567
568		stxa(AA_IMMU_TAR, ASI_IMMU, tag);
569		stxa(TLB_DAR_SLOT(i), ASI_ITLB_DATA_ACCESS_REG, data);
570		flush(0);	/* The USIII-family ignores the address. */
571		break;
572	}
573	wrpr(pstate, pstate, 0);
574	if (i == itlb_slot_max)
575		panic("%s: could not find a replacement slot", __func__);
576}
577
/*
 * sun4u mapin: make sure [va, va + len) is covered by locked 4MB mappings
 * in both the dTLB and the iTLB.
 *
 * The range is widened to 4MB boundaries and walked page by page.  For
 * each page lacking a mapping in either TLB, a 4MB physical page is
 * allocated, the virtual page is claimed, the mapping is recorded in
 * dtlb_store/itlb_store and then entered into both TLBs.  curkva is
 * raised to the end of the range if necessary.
 *
 * Always returns 0; every failure results in a panic.
 */
static int
mmu_mapin_sun4u(vm_offset_t va, vm_size_t len)
{
	vm_offset_t pa, mva;
	u_long data;

	if (va + len > curkva)
		curkva = va + len;

	/* pa == -1 means that no physical page is currently held in reserve. */
	pa = (vm_offset_t)-1;
	/* Extend the length by the offset into the first page, then align va. */
	len += va & PAGE_MASK_4M;
	va &= ~PAGE_MASK_4M;
	while (len) {
		if (dtlb_va_to_pa_sun4u(va) == (vm_offset_t)-1 ||
		    itlb_va_to_pa_sun4u(va) == (vm_offset_t)-1) {
			/* Allocate a physical page, claim the virtual area. */
			if (pa == (vm_offset_t)-1) {
				pa = alloc_phys(PAGE_SIZE_4M, PAGE_SIZE_4M);
				if (pa == (vm_offset_t)-1)
					panic("%s: out of memory", __func__);
				mva = claim_virt(va, PAGE_SIZE_4M, 0);
				if (mva != va)
					panic("%s: can't claim virtual page "
					    "(wanted %#lx, got %#lx)",
					    __func__, va, mva);
				/*
				 * The mappings may have changed, be paranoid.
				 */
				/* Re-run the TLB check for the same va. */
				continue;
			}
			/*
			 * Actually, we can only allocate two pages less at
			 * most (depending on the kernel TSB size).
			 */
			if (dtlb_slot >= dtlb_slot_max)
				panic("%s: out of dtlb_slots", __func__);
			if (itlb_slot >= itlb_slot_max)
				panic("%s: out of itlb_slots", __func__);
			data = TD_V | TD_4M | TD_PA(pa) | TD_L | TD_CP |
			    TD_CV | TD_P | TD_W;
			/* Record the mapping before entering it into the TLBs. */
			dtlb_store[dtlb_slot].te_pa = pa;
			dtlb_store[dtlb_slot].te_va = va;
			itlb_store[itlb_slot].te_pa = pa;
			itlb_store[itlb_slot].te_va = va;
			dtlb_slot++;
			itlb_slot++;
			dtlb_enter_sun4u(va, data);
			itlb_enter_sun4u(va, data);
			/* The reserved page has been consumed. */
			pa = (vm_offset_t)-1;
		}
		/* Advance by one page; the last step may be a partial page. */
		len -= len > PAGE_SIZE_4M ? PAGE_SIZE_4M : len;
		va += PAGE_SIZE_4M;
	}
	/* Hand back a page that was allocated but turned out not to be needed. */
	if (pa != (vm_offset_t)-1)
		release_phys(pa, PAGE_SIZE_4M);
	return (0);
}
635
636static int
637mmu_mapin_sun4v(vm_offset_t va, vm_size_t len)
638{
639	vm_offset_t pa, mva;
640
641	if (va + len > curkva)
642		curkva = va + len;
643
644	pa = (vm_offset_t)-1;
645	len += va & PAGE_MASK_4M;
646	va &= ~PAGE_MASK_4M;
647	while (len) {
648		if ((va >> 22) > SUN4V_TLB_SLOT_MAX)
649			panic("%s: trying to map more than 4GB", __func__);
650		if (tlb_store[va >> 22].te_pa == -1) {
651			/* Allocate a physical page, claim the virtual area */
652			if (pa == (vm_offset_t)-1) {
653				pa = alloc_phys(PAGE_SIZE_4M, PAGE_SIZE_4M);
654				if (pa == (vm_offset_t)-1)
655				    panic("%s: out of memory", __func__);
656				mva = claim_virt(va, PAGE_SIZE_4M, 0);
657				if (mva != va)
658					panic("%s: can't claim virtual page "
659					    "(wanted %#lx, got %#lx)",
660					    __func__, va, mva);
661			}
662
663			tlb_store[va >> 22].te_pa = pa;
664			if (map_phys(-1, PAGE_SIZE_4M, va, pa) == -1)
665				printf("%s: can't map physical page\n",
666				    __func__);
667			pa = (vm_offset_t)-1;
668		}
669		len -= len > PAGE_SIZE_4M ? PAGE_SIZE_4M : len;
670		va += PAGE_SIZE_4M;
671	}
672	if (pa != (vm_offset_t)-1)
673		release_phys(pa, PAGE_SIZE_4M);
674	return (0);
675}
676
677static vm_offset_t
678init_heap(void)
679{
680
681	/* There is no need for continuous physical heap memory. */
682	heapva = (vm_offset_t)OF_claim((void *)HEAPVA, HEAPSZ, 32);
683	return (heapva);
684}
685
686static phandle_t
687find_bsp_sun4u(phandle_t node, uint32_t bspid)
688{
689	char type[sizeof("cpu")];
690	phandle_t child;
691	uint32_t cpuid;
692
693	for (; node > 0; node = OF_peer(node)) {
694		child = OF_child(node);
695		if (child > 0) {
696			child = find_bsp_sun4u(child, bspid);
697			if (child > 0)
698				return (child);
699		} else {
700			if (OF_getprop(node, "device_type", type,
701			    sizeof(type)) <= 0)
702				continue;
703			if (strcmp(type, "cpu") != 0)
704				continue;
705			if (OF_getprop(node, cpu_cpuid_prop_sun4u(), &cpuid,
706			    sizeof(cpuid)) <= 0)
707				continue;
708			if (cpuid == bspid)
709				return (node);
710		}
711	}
712	return (0);
713}
714
715const char *
716cpu_cpuid_prop_sun4u(void)
717{
718
719	switch (cpu_impl) {
720	case CPU_IMPL_SPARC64:
721	case CPU_IMPL_ULTRASPARCI:
722	case CPU_IMPL_ULTRASPARCII:
723	case CPU_IMPL_ULTRASPARCIIi:
724	case CPU_IMPL_ULTRASPARCIIe:
725		return ("upa-portid");
726	case CPU_IMPL_ULTRASPARCIII:
727	case CPU_IMPL_ULTRASPARCIIIp:
728	case CPU_IMPL_ULTRASPARCIIIi:
729	case CPU_IMPL_ULTRASPARCIIIip:
730		return ("portid");
731	case CPU_IMPL_ULTRASPARCIV:
732	case CPU_IMPL_ULTRASPARCIVp:
733		return ("cpuid");
734	default:
735		return ("");
736	}
737}
738
739uint32_t
740cpu_get_mid_sun4u(void)
741{
742
743	switch (cpu_impl) {
744	case CPU_IMPL_SPARC64:
745	case CPU_IMPL_ULTRASPARCI:
746	case CPU_IMPL_ULTRASPARCII:
747	case CPU_IMPL_ULTRASPARCIIi:
748	case CPU_IMPL_ULTRASPARCIIe:
749		return (UPA_CR_GET_MID(ldxa(0, ASI_UPA_CONFIG_REG)));
750	case CPU_IMPL_ULTRASPARCIII:
751	case CPU_IMPL_ULTRASPARCIIIp:
752		return (FIREPLANE_CR_GET_AID(ldxa(AA_FIREPLANE_CONFIG,
753		    ASI_FIREPLANE_CONFIG_REG)));
754	case CPU_IMPL_ULTRASPARCIIIi:
755	case CPU_IMPL_ULTRASPARCIIIip:
756		return (JBUS_CR_GET_JID(ldxa(0, ASI_JBUS_CONFIG_REG)));
757	case CPU_IMPL_ULTRASPARCIV:
758	case CPU_IMPL_ULTRASPARCIVp:
759		return (INTR_ID_GET_ID(ldxa(AA_INTR_ID, ASI_INTR_ID)));
760	default:
761		return (0);
762	}
763}
764
765static void
766tlb_init_sun4u(void)
767{
768	phandle_t bsp;
769
770	cpu_impl = VER_IMPL(rdpr(ver));
771	bsp = find_bsp_sun4u(OF_child(root), cpu_get_mid_sun4u());
772	if (bsp == 0)
773		panic("%s: no node for bootcpu?!?!", __func__);
774
775	if (OF_getprop(bsp, "#dtlb-entries", &dtlb_slot_max,
776	    sizeof(dtlb_slot_max)) == -1 ||
777	    OF_getprop(bsp, "#itlb-entries", &itlb_slot_max,
778	    sizeof(itlb_slot_max)) == -1)
779		panic("%s: can't get TLB slot max.", __func__);
780
781	if (cpu_impl == CPU_IMPL_ULTRASPARCIIIp) {
782#ifdef LOADER_DEBUG
783		printf("pre fixup:\n");
784		pmap_print_tlb_sun4u();
785#endif
786
787		/*
788		 * Relocate the locked entry in it16 slot 0 (if existent)
789		 * as part of working around Cheetah+ erratum 34.
790		 */
791		itlb_relocate_locked0_sun4u();
792
793#ifdef LOADER_DEBUG
794		printf("post fixup:\n");
795		pmap_print_tlb_sun4u();
796#endif
797	}
798
799	dtlb_store = malloc(dtlb_slot_max * sizeof(*dtlb_store));
800	itlb_store = malloc(itlb_slot_max * sizeof(*itlb_store));
801	if (dtlb_store == NULL || itlb_store == NULL)
802		panic("%s: can't allocate TLB store", __func__);
803}
804
805static void
806tlb_init_sun4v(void)
807{
808
809	tlb_store = malloc(SUN4V_TLB_SLOT_MAX * sizeof(*tlb_store));
810	memset(tlb_store, 0xFF, SUN4V_TLB_SLOT_MAX * sizeof(*tlb_store));
811}
812
813int
814main(int (*openfirm)(void *))
815{
816	char bootpath[64];
817	char compatible[32];
818	struct devsw **dp;
819
820	/*
821	 * Tell the Open Firmware functions where they find the OFW gate.
822	 */
823	OF_init(openfirm);
824
825	archsw.arch_getdev = ofw_getdev;
826	archsw.arch_copyin = sparc64_copyin;
827	archsw.arch_copyout = ofw_copyout;
828	archsw.arch_readin = sparc64_readin;
829	archsw.arch_autoload = sparc64_autoload;
830	archsw.arch_maphint = sparc64_maphint;
831
832	/*
833	 * Probe for a console.
834	 */
835	cons_probe();
836
837	if (init_heap() == (vm_offset_t)-1)
838		panic("%s: can't claim heap", __func__);
839	setheap((void *)heapva, (void *)(heapva + HEAPSZ));
840
841	if ((root = OF_peer(0)) == -1)
842		panic("%s: can't get root phandle", __func__);
843	OF_getprop(root, "compatible", compatible, sizeof(compatible));
844	if (!strcmp(compatible, "sun4v")) {
845		printf("\nBooting with sun4v support.\n");
846		mmu_ops = &mmu_ops_sun4v;
847		is_sun4v = 1;
848	} else {
849		printf("\nBooting with sun4u support.\n");
850		mmu_ops = &mmu_ops_sun4u;
851	}
852
853	mmu_ops->tlb_init();
854
855	/*
856	 * Initialize devices.
857	 */
858	for (dp = devsw; *dp != 0; dp++) {
859		if ((*dp)->dv_init != 0)
860			(*dp)->dv_init();
861	}
862
863	/*
864	 * Set up the current device.
865	 */
866	OF_getprop(chosen, "bootpath", bootpath, sizeof(bootpath));
867
868	/*
869	 * Sun compatible bootable CD-ROMs have a disk label placed
870	 * before the cd9660 data, with the actual filesystem being
871	 * in the first partition, while the other partitions contain
872	 * pseudo disk labels with embedded boot blocks for different
873	 * architectures, which may be followed by UFS filesystems.
874	 * The firmware will set the boot path to the partition it
875	 * boots from ('f' in the sun4u case), but we want the kernel
876	 * to be loaded from the cd9660 fs ('a'), so the boot path
877	 * needs to be altered.
878	 */
879	if (bootpath[strlen(bootpath) - 2] == ':' &&
880	    bootpath[strlen(bootpath) - 1] == 'f') {
881		bootpath[strlen(bootpath) - 1] = 'a';
882		printf("Boot path set to %s\n", bootpath);
883	}
884
885	env_setenv("currdev", EV_VOLATILE, bootpath,
886	    ofw_setcurrdev, env_nounset);
887	env_setenv("loaddev", EV_VOLATILE, bootpath,
888	    env_noset, env_nounset);
889
890	printf("\n");
891	printf("%s, Revision %s\n", bootprog_name, bootprog_rev);
892	printf("(%s, %s)\n", bootprog_maker, bootprog_date);
893	printf("bootpath=\"%s\"\n", bootpath);
894
895	/* Give control to the machine independent loader code. */
896	interact();
897	return (1);
898}
899
900COMMAND_SET(reboot, "reboot", "reboot the system", command_reboot);
901
902static int
903command_reboot(int argc, char *argv[])
904{
905	int i;
906
907	for (i = 0; devsw[i] != NULL; ++i)
908		if (devsw[i]->dv_cleanup != NULL)
909			(devsw[i]->dv_cleanup)();
910
911	printf("Rebooting...\n");
912	OF_exit();
913}
914
/*
 * Provide this for panic, as it's not in the startup code.  The exit code
 * is ignored; the function simply calls OF_exit().
 */
void
exit(int code)
{

	OF_exit();
}
922
923#ifdef LOADER_DEBUG
/*
 * Printable page sizes, indexed by the size field extracted from a TTE in
 * pmap_print_tte_sun4u().
 */
static const char *const page_sizes[] = {
	"  8k", " 64k", "512k", "  4m"
};
927
928static void
929pmap_print_tte_sun4u(tte_t tag, tte_t tte)
930{
931
932	printf("%s %s ",
933	    page_sizes[(tte >> TD_SIZE_SHIFT) & TD_SIZE_MASK],
934	    tag & TD_G ? "G" : " ");
935	printf(tte & TD_W ? "W " : "  ");
936	printf(tte & TD_P ? "\e[33mP\e[0m " : "  ");
937	printf(tte & TD_E ? "E " : "  ");
938	printf(tte & TD_CV ? "CV " : "   ");
939	printf(tte & TD_CP ? "CP " : "   ");
940	printf(tte & TD_L ? "\e[32mL\e[0m " : "  ");
941	printf(tte & TD_IE ? "IE " : "   ");
942	printf(tte & TD_NFO ? "NFO " : "    ");
943	printf("pa=0x%lx va=0x%lx ctx=%ld\n",
944	    TD_PA(tte), TLB_TAR_VA(tag), TLB_TAR_CTX(tag));
945}
946
947static void
948pmap_print_tlb_sun4u(void)
949{
950	tte_t tag, tte;
951	u_long pstate;
952	int i;
953
954	pstate = rdpr(pstate);
955	for (i = 0; i < itlb_slot_max; i++) {
956		wrpr(pstate, pstate & ~PSTATE_IE, 0);
957		tte = itlb_get_data_sun4u(i);
958		wrpr(pstate, pstate, 0);
959		if (!(tte & TD_V))
960			continue;
961		tag = ldxa(TLB_DAR_SLOT(i), ASI_ITLB_TAG_READ_REG);
962		printf("iTLB-%2u: ", i);
963		pmap_print_tte_sun4u(tag, tte);
964	}
965	for (i = 0; i < dtlb_slot_max; i++) {
966		wrpr(pstate, pstate & ~PSTATE_IE, 0);
967		tte = dtlb_get_data_sun4u(i);
968		wrpr(pstate, pstate, 0);
969		if (!(tte & TD_V))
970			continue;
971		tag = ldxa(TLB_DAR_SLOT(i), ASI_DTLB_TAG_READ_REG);
972		printf("dTLB-%2u: ", i);
973		pmap_print_tte_sun4u(tag, tte);
974	}
975}
976#endif
977