kernel - Fix auto port assignment collision in network code
[dragonfly.git] / sys / platform / pc64 / x86_64 / efirt.c
blob1cf80e031b142b8e4f0368edae7142a474723289
1 /*-
2 * Copyright (c) 2004 Marcel Moolenaar
3 * Copyright (c) 2001 Doug Rabson
4 * Copyright (c) 2016 The FreeBSD Foundation
5 * All rights reserved.
7 * Portions of this software were developed by Konstantin Belousov
8 * under sponsorship from the FreeBSD Foundation.
10 * Redistribution and use in source and binary forms, with or without
11 * modification, are permitted provided that the following conditions
12 * are met:
13 * 1. Redistributions of source code must retain the above copyright
14 * notice, this list of conditions and the following disclaimer.
15 * 2. Redistributions in binary form must reproduce the above copyright
16 * notice, this list of conditions and the following disclaimer in the
17 * documentation and/or other materials provided with the distribution.
19 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
20 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29 * SUCH DAMAGE.
31 * $FreeBSD: head/sys/amd64/amd64/efirt.c 307391 2016-10-16 06:07:43Z kib $
34 #include <sys/param.h>
35 #include <sys/efi.h>
36 #include <sys/kernel.h>
37 #include <sys/linker.h>
38 #include <sys/lock.h>
39 #include <sys/malloc.h>
40 #include <sys/module.h>
41 #include <sys/proc.h>
42 #include <sys/sched.h>
43 #include <sys/sysctl.h>
44 #include <sys/systm.h>
45 #include <sys/thread.h>
46 #include <sys/globaldata.h>
48 #include <vm/vm.h>
49 #include <vm/pmap.h>
50 #include <vm/vm_map.h>
51 #include <vm/vm_object.h>
52 #include <vm/vm_param.h>
53 #include <vm/vm_page.h>
54 #include <vm/vm_pager.h>
55 #include <vm/vm_extern.h>
57 #include <vm/vm_page2.h>
59 #include <machine/efi.h>
60 #include <machine/metadata.h>
61 #include <machine/md_var.h>
62 #include <machine/smp.h>
63 #include <machine/vmparam.h>
65 static struct efi_systbl *efi_systbl;
66 static struct efi_cfgtbl *efi_cfgtbl;
67 static struct efi_rt *efi_runtime;
69 static int efi_status2err[25] = {
70 0, /* EFI_SUCCESS */
71 ENOEXEC, /* EFI_LOAD_ERROR */
72 EINVAL, /* EFI_INVALID_PARAMETER */
73 ENOSYS, /* EFI_UNSUPPORTED */
74 EMSGSIZE, /* EFI_BAD_BUFFER_SIZE */
75 EOVERFLOW, /* EFI_BUFFER_TOO_SMALL */
76 EBUSY, /* EFI_NOT_READY */
77 EIO, /* EFI_DEVICE_ERROR */
78 EROFS, /* EFI_WRITE_PROTECTED */
79 EAGAIN, /* EFI_OUT_OF_RESOURCES */
80 EIO, /* EFI_VOLUME_CORRUPTED */
81 ENOSPC, /* EFI_VOLUME_FULL */
82 ENXIO, /* EFI_NO_MEDIA */
83 ESTALE, /* EFI_MEDIA_CHANGED */
84 ENOENT, /* EFI_NOT_FOUND */
85 EACCES, /* EFI_ACCESS_DENIED */
86 ETIMEDOUT, /* EFI_NO_RESPONSE */
87 EADDRNOTAVAIL, /* EFI_NO_MAPPING */
88 ETIMEDOUT, /* EFI_TIMEOUT */
89 EDOOFUS, /* EFI_NOT_STARTED */
90 EALREADY, /* EFI_ALREADY_STARTED */
91 ECANCELED, /* EFI_ABORTED */
92 EPROTO, /* EFI_ICMP_ERROR */
93 EPROTO, /* EFI_TFTP_ERROR */
94 EPROTO /* EFI_PROTOCOL_ERROR */
97 static MALLOC_DEFINE(M_EFI, "efi", "EFI BIOS");
99 static int
100 efi_status_to_errno(efi_status status)
102 u_long code;
104 code = status & 0x3ffffffffffffffful;
105 return (code < nitems(efi_status2err) ? efi_status2err[code] : EDOOFUS);
108 static struct lock efi_lock;
109 static struct lock resettodr_lock;
110 static mcontext_t efi_ctx;
111 static struct vmspace *efi_savevm;
112 static struct vmspace *efi_vmspace;
113 static vm_object_t efi_obj;
114 static struct efi_md *efi_map;
115 static int efi_ndesc;
116 static int efi_descsz;
118 static void
119 efi_destroy_1t1_map(void)
121 vm_object_t obj;
122 vm_page_t m;
124 if ((obj = efi_obj) != NULL) {
125 efi_obj = NULL;
126 vm_object_hold(obj);
127 vm_object_reference_locked(obj); /* match deallocate */
129 if (efi_vmspace) {
130 pmap_remove_pages(vmspace_pmap(efi_vmspace),
131 VM_MIN_USER_ADDRESS, VM_MAX_USER_ADDRESS);
132 vm_map_remove(&efi_vmspace->vm_map,
133 VM_MIN_USER_ADDRESS,
134 VM_MAX_USER_ADDRESS);
135 vmspace_rel(efi_vmspace);
136 efi_vmspace = NULL;
138 if (obj) {
139 while ((m = RB_ROOT(&obj->rb_memq)) != NULL) {
140 vm_page_busy_wait(m, FALSE, "efipg");
141 vm_page_unwire(m, 1);
142 vm_page_flag_clear(m, PG_MAPPED | PG_WRITEABLE);
143 cdev_pager_free_page(obj, m);
144 kfree(m, M_EFI);
146 vm_object_drop(obj);
147 vm_object_deallocate(obj);
151 static int
152 efi_pg_ctor(void *handle, vm_ooffset_t size, vm_prot_t prot,
153 vm_ooffset_t foff, struct ucred *cred, u_short *color)
155 *color = 0;
156 return 0;
159 static void
160 efi_pg_dtor(void *handle)
164 static int
165 efi_pg_fault(vm_object_t obj, vm_ooffset_t offset, int prot, vm_page_t *mres)
167 vm_page_t m;
169 m = *mres;
170 if ((m->flags & PG_FICTITIOUS) == 0) {
171 *mres = NULL;
172 vm_page_remove(m);
173 vm_page_free(m);
174 m = NULL;
176 if (m == NULL) {
177 kprintf("efi_pg_fault: unmapped pg @%016jx\n", offset);
178 return VM_PAGER_ERROR;
182 * Shouldn't get hit, we pre-loaded all the pages.
184 kprintf("efi_pg_fault: ok %p/%p @%016jx m=%016jx,%016jx\n",
185 obj, efi_obj, offset, m->pindex, m->phys_addr);
187 return VM_PAGER_OK;
190 static struct cdev_pager_ops efi_pager_ops = {
191 .cdev_pg_fault = efi_pg_fault,
192 .cdev_pg_ctor = efi_pg_ctor,
193 .cdev_pg_dtor = efi_pg_dtor
196 static bool
197 efi_create_1t1_map(struct efi_md *map, int ndesc, int descsz)
199 vm_page_t m;
200 struct efi_md *p;
201 int i;
202 int count;
203 int result;
205 efi_map = map;
206 efi_ndesc = ndesc;
207 efi_descsz = descsz;
210 * efi_obj is ref'd by cdev_pager_allocate
212 efi_vmspace = vmspace_alloc(VM_MIN_USER_ADDRESS, VM_MAX_USER_ADDRESS);
213 pmap_pinit2(vmspace_pmap(efi_vmspace));
214 efi_obj = cdev_pager_allocate(NULL, OBJT_MGTDEVICE, &efi_pager_ops,
215 VM_MAX_USER_ADDRESS,
216 VM_PROT_READ | VM_PROT_WRITE,
217 0, proc0.p_ucred);
218 vm_object_hold(efi_obj);
220 count = vm_map_entry_reserve(MAP_RESERVE_COUNT);
221 vm_map_lock(&efi_vmspace->vm_map);
222 result = vm_map_insert(&efi_vmspace->vm_map, &count, efi_obj, NULL,
223 0, NULL,
224 0, VM_MAX_USER_ADDRESS,
225 VM_MAPTYPE_NORMAL,
226 VM_SUBSYS_EFI,
227 VM_PROT_READ | VM_PROT_WRITE | VM_PROT_EXECUTE,
228 VM_PROT_READ | VM_PROT_WRITE | VM_PROT_EXECUTE,
230 vm_map_unlock(&efi_vmspace->vm_map);
231 if (result != KERN_SUCCESS)
232 goto fail;
234 for (i = 0, p = map;
235 i < ndesc; i++, p = efi_next_descriptor(p, descsz)) {
236 vm_offset_t va;
237 uint64_t idx;
238 int mode;
240 if ((p->md_attr & EFI_MD_ATTR_RT) == 0)
241 continue;
242 if (p->md_virt != NULL) {
243 if (bootverbose)
244 kprintf("EFI Runtime entry %d is mapped\n", i);
245 goto fail;
247 if ((p->md_phys & EFI_PAGE_MASK) != 0) {
248 if (bootverbose)
249 kprintf("EFI Runtime entry %d is not aligned\n",
251 goto fail;
253 if (p->md_phys + p->md_pages * EFI_PAGE_SIZE < p->md_phys ||
254 p->md_phys + p->md_pages * EFI_PAGE_SIZE >=
255 VM_MAX_USER_ADDRESS) {
256 kprintf("EFI Runtime entry %d is not in mappable for RT:"
257 "base %#016jx %#jx pages\n",
258 i, (uintmax_t)p->md_phys,
259 (uintmax_t)p->md_pages);
260 goto fail;
263 if ((p->md_attr & EFI_MD_ATTR_WB) != 0)
264 mode = VM_MEMATTR_WRITE_BACK;
265 else if ((p->md_attr & EFI_MD_ATTR_WT) != 0)
266 mode = VM_MEMATTR_WRITE_THROUGH;
267 else if ((p->md_attr & EFI_MD_ATTR_WC) != 0)
268 mode = VM_MEMATTR_WRITE_COMBINING;
269 else if ((p->md_attr & EFI_MD_ATTR_WP) != 0)
270 mode = VM_MEMATTR_WRITE_PROTECTED;
271 else if ((p->md_attr & EFI_MD_ATTR_UC) != 0)
272 mode = VM_MEMATTR_UNCACHEABLE;
273 else {
274 if (bootverbose)
275 kprintf("EFI Runtime entry %d mapping "
276 "attributes unsupported\n", i);
277 mode = VM_MEMATTR_UNCACHEABLE;
280 if (bootverbose) {
281 kprintf("efirt: map %016jx-%016jx\n",
282 p->md_phys,
283 p->md_phys + IDX_TO_OFF(p->md_pages));
286 for (va = p->md_phys, idx = 0; idx < p->md_pages; idx++,
287 va += PAGE_SIZE) {
288 m = kmalloc(sizeof(*m), M_EFI, M_WAITOK | M_ZERO);
289 /*m->flags |= PG_WRITEABLE;*/
290 vm_page_initfake(m, va, mode); /* va is phys addr */
291 m->valid = VM_PAGE_BITS_ALL;
292 m->dirty = m->valid;
293 vm_page_insert(m, efi_obj, OFF_TO_IDX(va));
294 vm_page_wakeup(m);
297 vm_object_drop(efi_obj);
298 vm_map_entry_release(count);
300 return true;
302 fail:
303 vm_object_drop(efi_obj);
304 vm_map_entry_release(count);
305 efi_destroy_1t1_map();
307 return false;
311 * Create an environment for the EFI runtime code call. The most
312 * important part is creating the required 1:1 physical->virtual
313 * mappings for the runtime segments. To do that, we manually create
314 * page table which unmap userspace but gives correct kernel mapping.
315 * The 1:1 mappings for runtime segments usually occupy low 4G of the
316 * physical address map.
318 * The 1:1 mappings were chosen over the SetVirtualAddressMap() EFI RT
319 * service, because there are some BIOSes which fail to correctly
320 * relocate itself on the call, requiring both 1:1 and virtual
321 * mapping. As result, we must provide 1:1 mapping anyway, so no
322 * reason to bother with the virtual map, and no need to add a
323 * complexity into loader.
325 * The fpu_kern_enter() call allows firmware to use FPU, as mandated
326 * by the specification. In particular, CR0.TS bit is cleared. Also
327 * it enters critical section, giving us neccessary protection against
328 * context switch.
330 * There is no need to disable interrupts around the change of %cr3,
331 * the kernel mappings are correct, while we only grabbed the
332 * userspace portion of VA. Interrupts handlers must not access
333 * userspace. Having interrupts enabled fixes the issue with
334 * firmware/SMM long operation, which would negatively affect IPIs,
335 * esp. TLB shootdown requests.
337 * We must disable SMAP (aka smap_open()) operation to access the
338 * direct map as it will likely be using userspace addresses.
340 static int
341 efi_enter(void)
343 thread_t td = curthread;
345 if (efi_runtime == NULL)
346 return (ENXIO);
347 lockmgr(&efi_lock, LK_EXCLUSIVE);
348 efi_savevm = td->td_lwp->lwp_vmspace;
349 pmap_setlwpvm(td->td_lwp, efi_vmspace);
350 npxpush(&efi_ctx);
351 cpu_invltlb();
352 smap_smep_disable();
354 return (0);
357 static void
358 efi_leave(void)
360 thread_t td = curthread;
362 smap_smep_enable();
363 pmap_setlwpvm(td->td_lwp, efi_savevm);
364 npxpop(&efi_ctx);
365 cpu_invltlb();
366 efi_savevm = NULL;
367 lockmgr(&efi_lock, LK_RELEASE);
370 static int
371 efi_init(void)
373 struct efi_map_header *efihdr;
374 struct efi_md *map;
375 caddr_t kmdp;
376 size_t efisz;
378 lockinit(&efi_lock, "efi", 0, LK_CANRECURSE);
379 lockinit(&resettodr_lock, "efitodr", 0, LK_CANRECURSE);
381 if (efi_systbl_phys == 0) {
382 if (bootverbose)
383 kprintf("EFI systbl not available\n");
384 return (ENXIO);
386 efi_systbl = (struct efi_systbl *)PHYS_TO_DMAP(efi_systbl_phys);
387 if (efi_systbl->st_hdr.th_sig != EFI_SYSTBL_SIG) {
388 efi_systbl = NULL;
389 if (bootverbose)
390 kprintf("EFI systbl signature invalid\n");
391 return (ENXIO);
393 efi_cfgtbl = (efi_systbl->st_cfgtbl == 0) ? NULL :
394 (struct efi_cfgtbl *)efi_systbl->st_cfgtbl;
395 if (efi_cfgtbl == NULL) {
396 if (bootverbose)
397 kprintf("EFI config table is not present\n");
400 kmdp = preload_search_by_type("elf kernel");
401 if (kmdp == NULL)
402 kmdp = preload_search_by_type("elf64 kernel");
403 efihdr = (struct efi_map_header *)preload_search_info(kmdp,
404 MODINFO_METADATA | MODINFOMD_EFI_MAP);
405 if (efihdr == NULL) {
406 if (bootverbose)
407 kprintf("EFI map is not present\n");
408 return (ENXIO);
410 efisz = (sizeof(struct efi_map_header) + 0xf) & ~0xf;
411 map = (struct efi_md *)((uint8_t *)efihdr + efisz);
412 if (efihdr->descriptor_size == 0)
413 return (ENOMEM);
415 if (!efi_create_1t1_map(map, efihdr->memory_size /
416 efihdr->descriptor_size, efihdr->descriptor_size)) {
417 if (bootverbose)
418 kprintf("EFI cannot create runtime map\n");
419 return (ENOMEM);
422 efi_runtime = (efi_systbl->st_rt == 0) ? NULL :
423 (struct efi_rt *)efi_systbl->st_rt;
424 if (efi_runtime == NULL) {
425 if (bootverbose)
426 kprintf("EFI runtime services table is not present\n");
427 efi_destroy_1t1_map();
428 return (ENXIO);
431 return (0);
434 static void
435 efi_uninit(void)
437 efi_destroy_1t1_map();
439 efi_systbl = NULL;
440 efi_cfgtbl = NULL;
441 efi_runtime = NULL;
443 lockuninit(&efi_lock);
444 lockuninit(&resettodr_lock);
448 efi_get_table(struct uuid *uuid, void **ptr)
450 struct efi_cfgtbl *ct;
451 u_long count;
453 if (efi_cfgtbl == NULL)
454 return (ENXIO);
455 count = efi_systbl->st_entries;
456 ct = efi_cfgtbl;
457 while (count--) {
458 if (!bcmp(&ct->ct_uuid, uuid, sizeof(*uuid))) {
459 *ptr = (void *)PHYS_TO_DMAP(ct->ct_data);
460 return (0);
462 ct++;
464 return (ENOENT);
468 efi_get_time_locked(struct efi_tm *tm)
470 efi_status status;
471 int error;
473 KKASSERT(lockowned(&resettodr_lock) != 0);
474 error = efi_enter();
475 if (error != 0)
476 return (error);
477 status = efi_runtime->rt_gettime(tm, NULL);
478 efi_leave();
479 error = efi_status_to_errno(status);
481 return (error);
485 efi_get_time(struct efi_tm *tm)
487 int error;
489 if (efi_runtime == NULL)
490 return (ENXIO);
491 lockmgr(&resettodr_lock, LK_EXCLUSIVE);
492 error = efi_get_time_locked(tm);
493 lockmgr(&resettodr_lock, LK_RELEASE);
495 return (error);
499 efi_reset_system(void)
501 int error;
503 error = efi_enter();
504 if (error != 0)
505 return (error);
506 efi_runtime->rt_reset(EFI_RESET_WARM, 0, 0, NULL);
507 efi_leave();
508 return (EIO);
512 efi_set_time_locked(struct efi_tm *tm)
514 efi_status status;
515 int error;
517 KKASSERT(lockowned(&resettodr_lock) != 0);
518 error = efi_enter();
519 if (error != 0)
520 return (error);
521 status = efi_runtime->rt_settime(tm);
522 efi_leave();
523 error = efi_status_to_errno(status);
524 return (error);
528 efi_set_time(struct efi_tm *tm)
530 int error;
532 if (efi_runtime == NULL)
533 return (ENXIO);
534 lockmgr(&resettodr_lock, LK_EXCLUSIVE);
535 error = efi_set_time_locked(tm);
536 lockmgr(&resettodr_lock, LK_RELEASE);
537 return (error);
541 efi_var_get(efi_char *name, struct uuid *vendor, uint32_t *attrib,
542 size_t *datasize, void *data)
544 efi_status status;
545 int error;
547 error = efi_enter();
548 if (error != 0)
549 return (error);
550 status = efi_runtime->rt_getvar(name, vendor, attrib, datasize, data);
551 efi_leave();
552 error = efi_status_to_errno(status);
553 return (error);
557 efi_var_nextname(size_t *namesize, efi_char *name, struct uuid *vendor)
559 efi_status status;
560 int error;
562 error = efi_enter();
563 if (error != 0)
564 return (error);
565 status = efi_runtime->rt_scanvar(namesize, name, vendor);
566 efi_leave();
567 error = efi_status_to_errno(status);
568 return (error);
572 efi_var_set(efi_char *name, struct uuid *vendor, uint32_t attrib,
573 size_t datasize, void *data)
575 efi_status status;
576 int error;
578 error = efi_enter();
579 if (error != 0)
580 return (error);
581 status = efi_runtime->rt_setvar(name, vendor, attrib, datasize, data);
582 efi_leave();
583 error = efi_status_to_errno(status);
584 return (error);
587 static int
588 efirt_modevents(module_t m, int event, void *arg __unused)
591 switch (event) {
592 case MOD_LOAD:
593 return (efi_init());
595 case MOD_UNLOAD:
596 efi_uninit();
597 return (0);
599 case MOD_SHUTDOWN:
600 return (0);
602 default:
603 return (EOPNOTSUPP);
607 static moduledata_t efirt_moddata = {
608 .name = "efirt",
609 .evhand = efirt_modevents,
610 .priv = NULL,
613 DECLARE_MODULE(efirt, efirt_moddata, SI_SUB_DRIVERS, SI_ORDER_ANY);
614 MODULE_VERSION(efirt, 1);
617 /* XXX debug stuff */
618 static int
619 efi_time_sysctl_handler(SYSCTL_HANDLER_ARGS)
621 struct efi_tm tm;
622 int error, val;
624 val = 0;
625 error = sysctl_handle_int(oidp, &val, 0, req);
626 if (error != 0 || req->newptr == NULL)
627 return (error);
628 error = efi_get_time(&tm);
629 if (error == 0) {
630 uprintf("EFI reports: Year %d Month %d Day %d Hour %d Min %d "
631 "Sec %d\n", tm.tm_year, tm.tm_mon, tm.tm_mday, tm.tm_hour,
632 tm.tm_min, tm.tm_sec);
634 return (error);
637 SYSCTL_PROC(_debug, OID_AUTO, efi_time, CTLTYPE_INT | CTLFLAG_RW, NULL, 0,
638 efi_time_sysctl_handler, "I", "");