SUPDrv-linux.c revision 105f22555863c3877b21add507647917e2615a13
/** @file
* The VirtualBox Support Driver - Linux hosts.
*/
/*
* Copyright (C) 2006-2007 innotek GmbH
*
* This file is part of VirtualBox Open Source Edition (OSE), as
* available from http://www.virtualbox.org. This file is free software;
* you can redistribute it and/or modify it under the terms of the GNU
* General Public License (GPL) as published by the Free Software
* Foundation, in version 2 as it comes in the "COPYING" file of the
* VirtualBox OSE distribution. VirtualBox OSE is distributed in the
* hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
*
* The contents of this file may alternatively be used under the terms
* of the Common Development and Distribution License Version 1.0
* (CDDL) only, as it comes in the "COPYING.CDDL" file of the
* VirtualBox OSE distribution, in which case the provisions of the
* CDDL are applicable instead of those of the GPL.
*
* You may elect to license modified versions of this file under the
* terms and conditions of either the GPL or the CDDL or both.
* Some lines of code to disable the local APIC on x86_64 machines taken
* from a Mandriva patch by Gwenole Beauchesne <gbeauchesne@mandriva.com>.
*/
/*******************************************************************************
* Header Files *
*******************************************************************************/
#include "SUPDRV.h"
#include "the-linux-kernel.h"
#include "version-generated.h"
#include <iprt/assert.h>
#include <iprt/spinlock.h>
#include <iprt/semaphore.h>
#include <iprt/initterm.h>
#include <iprt/process.h>
#include <iprt/err.h>
#include <iprt/mem.h>
#include <iprt/log.h>
#include <linux/sched.h>
#ifdef CONFIG_DEVFS_FS
# include <linux/devfs_fs_kernel.h>
#endif
#ifdef CONFIG_VBOXDRV_AS_MISC
# include <linux/miscdevice.h>
#endif
#ifdef CONFIG_X86_LOCAL_APIC
# include <asm/apic.h>
# if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 0)
# include <asm/nmi.h>
# endif
#endif
#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 0)
# include <asm/pgtable.h>
# define global_flush_tlb __flush_tlb_global
#endif
#include <iprt/mem.h>
/* devfs defines */
#if defined(CONFIG_DEVFS_FS) && !defined(CONFIG_VBOXDRV_AS_MISC)
# if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 0)
# define VBOX_REGISTER_DEVFS() \
({ \
void *rc = NULL; \
if (devfs_mk_cdev(MKDEV(DEVICE_MAJOR, 0), \
S_IFCHR | S_IRUGO | S_IWUGO, \
DEVICE_NAME) == 0) \
rc = (void *)' '; /* return not NULL */ \
rc; \
})
# define VBOX_UNREGISTER_DEVFS(handle) \
devfs_remove(DEVICE_NAME);
# else /* < 2.6.0 */
# define VBOX_REGISTER_DEVFS() \
devfs_register(NULL, DEVICE_NAME, DEVFS_FL_DEFAULT, \
DEVICE_MAJOR, 0, \
S_IFCHR | S_IRUGO | S_IWUGO, \
&gFileOpsVBoxDrv, NULL)
# define VBOX_UNREGISTER_DEVFS(handle) \
if (handle != NULL) \
devfs_unregister(handle)
# endif /* < 2.6.0 */
#endif /* CONFIG_DEV_FS && !CONFIG_VBOXDEV_AS_MISC */
#ifndef CONFIG_VBOXDRV_AS_MISC
# if defined(CONFIG_DEVFS_FS) && LINUX_VERSION_CODE <= KERNEL_VERSION(2, 6, 0)
# define VBOX_REGISTER_DEVICE(a,b,c) devfs_register_chrdev(a,b,c)
# define VBOX_UNREGISTER_DEVICE(a,b) devfs_unregister_chrdev(a,b)
# else
# define VBOX_REGISTER_DEVICE(a,b,c) register_chrdev(a,b,c)
# define VBOX_UNREGISTER_DEVICE(a,b) unregister_chrdev(a,b)
# endif
#endif /* !CONFIG_VBOXDRV_AS_MISC */
#ifdef CONFIG_X86_HIGH_ENTRY
# error "CONFIG_X86_HIGH_ENTRY is not supported by VBoxDrv at this time."
#endif
/*
* This sucks soooo badly on x86! Why don't they export __PAGE_KERNEL_EXEC so PAGE_KERNEL_EXEC would be usable?
*/
#if defined(RT_ARCH_AMD64)
# define MY_PAGE_KERNEL_EXEC PAGE_KERNEL_EXEC
#elif defined(PAGE_KERNEL_EXEC) && defined(CONFIG_X86_PAE)
# define MY_PAGE_KERNEL_EXEC __pgprot(cpu_has_pge ? _PAGE_KERNEL_EXEC | _PAGE_GLOBAL : _PAGE_KERNEL_EXEC)
#else
# define MY_PAGE_KERNEL_EXEC PAGE_KERNEL
#endif
/*
* The redhat hack section.
* - The current hacks are for 2.4.21-15.EL only.
*/
#ifndef NO_REDHAT_HACKS
/* accounting. */
# if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 0)
# ifdef VM_ACCOUNT
# define MY_DO_MUNMAP(a,b,c) do_munmap(a, b, c, 0) /* should it be 1 or 0? */
# endif
# endif
/* backported remap_page_range. */
# if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 0)
# include <asm/tlb.h>
# ifdef tlb_vma /* probably not good enough... */
# define HAVE_26_STYLE_REMAP_PAGE_RANGE 1
# endif
# endif
# ifndef RT_ARCH_AMD64
/* In 2.6.9-22.ELsmp we have to call change_page_attr() twice when changing
* the page attributes from PAGE_KERNEL to something else, because there appears
* to be a bug in one of the many patches that redhat applied.
* It should be safe to do this on less buggy linux kernels too. ;-)
*/
# define MY_CHANGE_PAGE_ATTR(pPages, cPages, prot) \
do { \
if (pgprot_val(prot) != pgprot_val(PAGE_KERNEL)) \
change_page_attr(pPages, cPages, prot); \
change_page_attr(pPages, cPages, prot); \
} while (0)
# endif
#endif /* !NO_REDHAT_HACKS */
#ifndef MY_DO_MUNMAP
# define MY_DO_MUNMAP(a,b,c) do_munmap(a, b, c)
#endif
#ifndef MY_CHANGE_PAGE_ATTR
# ifdef RT_ARCH_AMD64 /** @todo This is a cheap hack, but it'll get around that 'else BUG();' in __change_page_attr(). */
# define MY_CHANGE_PAGE_ATTR(pPages, cPages, prot) \
do { \
change_page_attr(pPages, cPages, PAGE_KERNEL_NOCACHE); \
change_page_attr(pPages, cPages, prot); \
} while (0)
# else
# define MY_CHANGE_PAGE_ATTR(pPages, cPages, prot) change_page_attr(pPages, cPages, prot)
# endif
#endif
/** @def ONE_MSEC_IN_JIFFIES
* The number of jiffies that make up 1 millisecond. Must be at least 1! */
#if HZ <= 1000
# define ONE_MSEC_IN_JIFFIES 1
#elif !(HZ % 1000)
# define ONE_MSEC_IN_JIFFIES (HZ / 1000)
#else
# define ONE_MSEC_IN_JIFFIES ((HZ + 999) / 1000)
# error "HZ is not a multiple of 1000, the GIP stuff won't work right!"
#endif
/** @def TICK_NSEC
* The time between ticks in nsec */
#ifndef TICK_NSEC
# define TICK_NSEC (1000000UL / HZ)
#endif
#ifdef CONFIG_X86_LOCAL_APIC
/* If an NMI occurs while we are inside the world switcher the machine will
* crash. The Linux NMI watchdog generates periodic NMIs increasing a counter
* which is compared with another counter increased in the timer interrupt
* handler. We disable the NMI watchdog.
*
* - Linux >= 2.6.21: The watchdog is disabled by default on i386 and x86_64.
* - Linux < 2.6.21: The watchdog is normally enabled by default on x86_64
* and disabled on i386.
*/
# if defined(RT_ARCH_AMD64)
# if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 21) && !defined(VBOX_REDHAT_KABI)
# define DO_DISABLE_NMI 1
# endif
# endif
# if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 19)
extern int nmi_active;
# define nmi_atomic_read(P) *(P)
# define nmi_atomic_set(P, V) *(P) = (V)
# define nmi_atomic_dec(P) nmi_atomic_set(P, 0)
# else
# define nmi_atomic_read(P) atomic_read(P)
# define nmi_atomic_set(P, V) atomic_set(P, V)
# define nmi_atomic_dec(P) atomic_dec(P)
# endif
# ifndef X86_FEATURE_ARCH_PERFMON
# define X86_FEATURE_ARCH_PERFMON (3*32+9) /* Intel Architectural PerfMon */
# endif
# ifndef MSR_ARCH_PERFMON_EVENTSEL0
# define MSR_ARCH_PERFMON_EVENTSEL0 0x186
# endif
# ifndef ARCH_PERFMON_UNHALTED_CORE_CYCLES_PRESENT
# define ARCH_PERFMON_UNHALTED_CORE_CYCLES_PRESENT (1 << 0)
# endif
#endif /* CONFIG_X86_LOCAL_APIC */
#define xstr(s) str(s)
#define str(s) #s
/*******************************************************************************
* Defined Constants And Macros *
*******************************************************************************/
/**
* Device extention & session data association structure.
*/
static SUPDRVDEVEXT g_DevExt;
/** Timer structure for the GIP update. */
static VBOXKTIMER g_GipTimer;
/** Pointer to the page structure for the GIP. */
struct page *g_pGipPage;
/** Registered devfs device handle. */
#if defined(CONFIG_DEVFS_FS) && !defined(CONFIG_VBOXDRV_AS_MISC)
# if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 0)
static void *g_hDevFsVBoxDrv = NULL;
# else
static devfs_handle_t g_hDevFsVBoxDrv = NULL;
# endif
#endif
#ifndef CONFIG_VBOXDRV_AS_MISC
/** Module major number */
#define DEVICE_MAJOR 234
/** Saved major device number */
static int g_iModuleMajor;
#endif /* !CONFIG_VBOXDRV_AS_MISC */
/** Module parameter.
* Not prefixed because the name is used by macros and the end of this file. */
static int force_async_tsc = 0;
/** The module name. */
#define DEVICE_NAME "vboxdrv"
#ifdef RT_ARCH_AMD64
/**
* Memory for the executable memory heap (in IPRT).
*/
extern uint8_t g_abExecMemory[1572864]; /* 1.5 MB */
__asm__(".section execmemory, \"awx\", @progbits\n\t"
".align 32\n\t"
".globl g_abExecMemory\n"
"g_abExecMemory:\n\t"
".zero 1572864\n\t"
".type g_abExecMemory, @object\n\t"
".size g_abExecMemory, 1572864\n\t"
".text\n\t");
#endif
/*******************************************************************************
* Internal Functions *
*******************************************************************************/
#ifdef VBOX_HRTIMER
typedef enum hrtimer_restart (*PFNVBOXKTIMER)(struct hrtimer *);
#else
typedef void (*PFNVBOXKTIMER)(unsigned long);
#endif
static int VBoxDrvLinuxInit(void);
static void VBoxDrvLinuxUnload(void);
static int VBoxDrvLinuxCreate(struct inode *pInode, struct file *pFilp);
static int VBoxDrvLinuxClose(struct inode *pInode, struct file *pFilp);
#ifdef HAVE_UNLOCKED_IOCTL
static long VBoxDrvLinuxIOCtl(struct file *pFilp, unsigned int uCmd, unsigned long ulArg);
#else
static int VBoxDrvLinuxIOCtl(struct inode *pInode, struct file *pFilp, unsigned int uCmd, unsigned long ulArg);
#endif
static int VBoxDrvLinuxIOCtlSlow(struct file *pFilp, unsigned int uCmd, unsigned long ulArg);
static int VBoxDrvLinuxInitGip(PSUPDRVDEVEXT pDevExt);
static int VBoxDrvLinuxTermGip(PSUPDRVDEVEXT pDevExt);
#ifdef VBOX_HRTIMER
static enum hrtimer_restart VBoxDrvLinuxGipTimer(struct hrtimer *pTimer);
#else
static void VBoxDrvLinuxGipTimer(unsigned long ulUser);
#endif
#ifdef CONFIG_SMP
# ifdef VBOX_HRTIMER
static enum hrtimer_restart VBoxDrvLinuxGipTimerPerCpu(struct hrtimer *pTimer);
# else
static void VBoxDrvLinuxGipTimerPerCpu(unsigned long ulUser);
# endif
static void VBoxDrvLinuxGipResumePerCpu(void *pvUser);
#endif
static int VBoxDrvLinuxErr2LinuxErr(int);
/** The file_operations structure. */
static struct file_operations gFileOpsVBoxDrv =
{
owner: THIS_MODULE,
open: VBoxDrvLinuxCreate,
release: VBoxDrvLinuxClose,
#ifdef HAVE_UNLOCKED_IOCTL
unlocked_ioctl: VBoxDrvLinuxIOCtl,
#else
ioctl: VBoxDrvLinuxIOCtl,
#endif
};
#ifdef CONFIG_VBOXDRV_AS_MISC
/** The miscdevice structure. */
static struct miscdevice gMiscDevice =
{
minor: MISC_DYNAMIC_MINOR,
name: DEVICE_NAME,
fops: &gFileOpsVBoxDrv,
# if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 0) && \
LINUX_VERSION_CODE <= KERNEL_VERSION(2, 6, 17)
devfs_name: DEVICE_NAME,
# endif
};
#endif
static inline void vbox_ktimer_init(PVBOXKTIMER pTimer, PFNVBOXKTIMER pfnFunction, unsigned long ulData)
{
#ifdef VBOX_HRTIMER
hrtimer_init(pTimer, CLOCK_MONOTONIC, HRTIMER_MODE_ABS);
pTimer->function = pfnFunction;
#else
init_timer(pTimer);
pTimer->data = ulData;
pTimer->function = pfnFunction;
pTimer->expires = jiffies;
#endif
}
static inline void vbox_ktimer_start(PVBOXKTIMER pTimer)
{
#ifdef VBOX_HRTIMER
hrtimer_start(pTimer, ktime_add_ns(ktime_get(), 1000000), HRTIMER_MODE_ABS);
#else
mod_timer(pTimer, jiffies);
#endif
}
static inline void vbox_ktimer_stop(PVBOXKTIMER pTimer)
{
#ifdef VBOX_HRTIMER
hrtimer_cancel(pTimer);
#else
if (timer_pending(pTimer))
del_timer_sync(pTimer);
#endif
}
#ifdef CONFIG_X86_LOCAL_APIC
# ifdef DO_DISABLE_NMI
/** Stop AMD NMI watchdog (x86_64 only). */
static int stop_k7_watchdog(void)
{
wrmsr(MSR_K7_EVNTSEL0, 0, 0);
return 1;
}
/** Stop Intel P4 NMI watchdog (x86_64 only). */
static int stop_p4_watchdog(void)
{
wrmsr(MSR_P4_IQ_CCCR0, 0, 0);
wrmsr(MSR_P4_IQ_CCCR1, 0, 0);
wrmsr(MSR_P4_CRU_ESCR0, 0, 0);
return 1;
}
/** The new method of detecting the event counter */
static int stop_intel_arch_watchdog(void)
{
unsigned ebx;
ebx = cpuid_ebx(10);
if (!(ebx & ARCH_PERFMON_UNHALTED_CORE_CYCLES_PRESENT))
wrmsr(MSR_ARCH_PERFMON_EVENTSEL0, 0, 0);
return 1;
}
/** Stop NMI watchdog. */
static void vbox_stop_apic_nmi_watchdog(void *unused)
{
int stopped = 0;
/* only support LOCAL and IO APICs for now */
if ((nmi_watchdog != NMI_LOCAL_APIC) &&
(nmi_watchdog != NMI_IO_APIC))
return;
if (nmi_watchdog == NMI_LOCAL_APIC)
{
switch (boot_cpu_data.x86_vendor)
{
case X86_VENDOR_AMD:
if (strstr(boot_cpu_data.x86_model_id, "Screwdriver"))
return;
stopped = stop_k7_watchdog();
break;
case X86_VENDOR_INTEL:
if (cpu_has(&boot_cpu_data, X86_FEATURE_ARCH_PERFMON))
{
stopped = stop_intel_arch_watchdog();
break;
}
stopped = stop_p4_watchdog();
break;
default:
return;
}
}
if (stopped)
nmi_atomic_dec(&nmi_active);
}
/** Disable LAPIC NMI watchdog. */
static void disable_lapic_nmi_watchdog(void)
{
BUG_ON(nmi_watchdog != NMI_LOCAL_APIC);
if (nmi_atomic_read(&nmi_active) <= 0)
return;
on_each_cpu(vbox_stop_apic_nmi_watchdog, NULL, 1, 1);
BUG_ON(nmi_atomic_read(&nmi_active) != 0);
/* tell do_nmi() and others that we're not active any more */
nmi_watchdog = NMI_NONE;
}
/** Shutdown NMI. */
static void nmi_cpu_shutdown(void * dummy)
{
unsigned int vERR, vPC;
vPC = apic_read(APIC_LVTPC);
if ((GET_APIC_DELIVERY_MODE(vPC) == APIC_MODE_NMI) && !(vPC & APIC_LVT_MASKED))
{
vERR = apic_read(APIC_LVTERR);
apic_write(APIC_LVTERR, vERR | APIC_LVT_MASKED);
apic_write(APIC_LVTPC, vPC | APIC_LVT_MASKED);
apic_write(APIC_LVTERR, vERR);
}
}
static void nmi_shutdown(void)
{
on_each_cpu(nmi_cpu_shutdown, NULL, 0, 1);
}
# endif /* DO_DISABLE_NMI */
#endif /* CONFIG_X86_LOCAL_APIC */
/**
* Initialize module.
*
* @returns appropriate status code.
*/
static int __init VBoxDrvLinuxInit(void)
{
int rc;
dprintf(("VBoxDrv::ModuleInit\n"));
#ifdef CONFIG_X86_LOCAL_APIC
/*
* If an NMI occurs while we are inside the world switcher the macine will crash.
* The Linux NMI watchdog generates periodic NMIs increasing a counter which is
* compared with another counter increased in the timer interrupt handler. Therefore
* we don't allow to setup an NMI watchdog.
*/
# if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 0) && !defined(VBOX_REDHAT_KABI)
/*
* First test: NMI actiated? Works only works with Linux 2.6 -- 2.4 does not export
* the nmi_watchdog variable.
*/
# if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 19) || \
(defined CONFIG_X86_64 && LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 0))
# ifdef DO_DISABLE_NMI
if (nmi_atomic_read(&nmi_active) > 0)
{
printk(KERN_DEBUG DEVICE_NAME ": Trying to deactivate the NMI watchdog...\n");
switch (nmi_watchdog)
{
case NMI_LOCAL_APIC:
disable_lapic_nmi_watchdog();
break;
case NMI_NONE:
nmi_atomic_dec(&nmi_active);
break;
}
if (nmi_atomic_read(&nmi_active) == 0)
{
nmi_shutdown();
printk(KERN_DEBUG DEVICE_NAME ": Successfully done.\n");
}
else
printk(KERN_DEBUG DEVICE_NAME ": Failed!\n");
}
# endif /* DO_DISABLE_NMI */
/*
* Permanent IO_APIC mode active? No way to handle this!
*/
if (nmi_watchdog == NMI_IO_APIC)
{
printk(KERN_ERR DEVICE_NAME
": NMI watchdog in IO_APIC mode active -- refused to load the kernel module!\n"
DEVICE_NAME
": Please disable the NMI watchdog by specifying 'nmi_watchdog=0' at kernel\n"
DEVICE_NAME
": command line.\n");
return -EINVAL;
}
/*
* See arch/i386/kernel/nmi.c on >= 2.6.19: -1 means it can never enabled again
*/
nmi_atomic_set(&nmi_active, -1);
printk(KERN_DEBUG DEVICE_NAME ": Trying to deactivate the NMI watchdog permanently...\n");
/*
* Now fall through and see if it actually was enabled before. If so, fail
* as we cannot deactivate it cleanly from here.
*/
# else /* < 2.6.19 */
/*
* Older 2.6 kernels: nmi_watchdog is not initalized by default
*/
if (nmi_watchdog != NMI_NONE)
goto nmi_activated;
# endif
# endif /* >= 2.6.0 && !defined(VBOX_REDHAT_KABI) */
/*
* Second test: Interrupt generated by performance counter not masked and can
* generate an NMI. Works also with Linux 2.4.
*/
{
unsigned int v, ver, maxlvt;
v = apic_read(APIC_LVR);
ver = GET_APIC_VERSION(v);
/* 82489DXs do not report # of LVT entries. */
maxlvt = APIC_INTEGRATED(ver) ? GET_APIC_MAXLVT(v) : 2;
if (maxlvt >= 4)
{
/* Read status of performance counter IRQ vector */
v = apic_read(APIC_LVTPC);
/* performance counter generates NMI and is not masked? */
if ((GET_APIC_DELIVERY_MODE(v) == APIC_MODE_NMI) && !(v & APIC_LVT_MASKED))
{
# if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 19) || \
(defined CONFIG_X86_64 && LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 0))
printk(KERN_ERR DEVICE_NAME
": NMI watchdog either active or at least initialized. Please disable the NMI\n"
DEVICE_NAME
": watchdog by specifying 'nmi_watchdog=0' at kernel command line.\n");
return -EINVAL;
# else /* < 2.6.19 */
# if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 0) && !defined(VBOX_REDHAT_KABI)
nmi_activated:
# endif
printk(KERN_ERR DEVICE_NAME
": NMI watchdog active -- refused to load the kernel module! Please disable\n"
DEVICE_NAME
": the NMI watchdog by specifying 'nmi_watchdog=0' at kernel command line.\n");
return -EINVAL;
# endif /* >= 2.6.19 */
}
}
}
# if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 19)
printk(KERN_DEBUG DEVICE_NAME ": Successfully done.\n");
# endif /* >= 2.6.19 */
#endif /* CONFIG_X86_LOCAL_APIC */
#ifdef CONFIG_VBOXDRV_AS_MISC
rc = misc_register(&gMiscDevice);
if (rc)
{
printk(KERN_ERR DEVICE_NAME ": Can't register misc device! rc=%d\n", rc);
return rc;
}
#else /* !CONFIG_VBOXDRV_AS_MISC */
/*
* Register character device.
*/
g_iModuleMajor = DEVICE_MAJOR;
rc = VBOX_REGISTER_DEVICE((dev_t)g_iModuleMajor, DEVICE_NAME, &gFileOpsVBoxDrv);
if (rc < 0)
{
dprintf(("VBOX_REGISTER_DEVICE failed with rc=%#x!\n", rc));
return rc;
}
/*
* Save returned module major number
*/
if (DEVICE_MAJOR != 0)
g_iModuleMajor = DEVICE_MAJOR;
else
g_iModuleMajor = rc;
rc = 0;
#ifdef CONFIG_DEVFS_FS
/*
* Register a device entry
*/
g_hDevFsVBoxDrv = VBOX_REGISTER_DEVFS();
if (g_hDevFsVBoxDrv == NULL)
{
dprintf(("devfs_register failed!\n"));
rc = -EINVAL;
}
#endif
#endif /* !CONFIG_VBOXDRV_AS_MISC */
if (!rc)
{
/*
* Initialize the runtime.
* On AMD64 we'll have to donate the high rwx memory block to the exec allocator.
*/
rc = RTR0Init(0);
if (RT_SUCCESS(rc))
{
#ifdef RT_ARCH_AMD64
rc = RTR0MemExecDonate(&g_abExecMemory[0], sizeof(g_abExecMemory));
#endif
/*
* Initialize the device extension.
*/
if (RT_SUCCESS(rc))
rc = supdrvInitDevExt(&g_DevExt);
if (!rc)
{
/*
* Create the GIP page.
*/
rc = VBoxDrvLinuxInitGip(&g_DevExt);
if (!rc)
{
printk(KERN_INFO DEVICE_NAME ": TSC mode is %s, kernel timer mode is "
#ifdef VBOX_HRTIMER
"'high-res'"
#else
"'normal'"
#endif
".\n",
g_DevExt.pGip->u32Mode == SUPGIPMODE_SYNC_TSC ? "'synchronous'" : "'asynchronous'");
LogFlow(("VBoxDrv::ModuleInit returning %#x\n", rc));
printk(KERN_DEBUG DEVICE_NAME ": Successfully loaded version "
VBOX_VERSION_STRING " (interface " xstr(SUPDRVIOC_VERSION) ").\n");
return rc;
}
supdrvDeleteDevExt(&g_DevExt);
}
else
rc = -EINVAL;
RTR0Term();
}
else
rc = -EINVAL;
/*
* Failed, cleanup and return the error code.
*/
#if defined(CONFIG_DEVFS_FS) && !defined(CONFIG_VBOXDRV_AS_MISC)
VBOX_UNREGISTER_DEVFS(g_hDevFsVBoxDrv);
#endif
}
#ifdef CONFIG_VBOXDRV_AS_MISC
misc_deregister(&gMiscDevice);
dprintf(("VBoxDrv::ModuleInit returning %#x (minor:%d)\n", rc, gMiscDevice.minor));
#else
VBOX_UNREGISTER_DEVICE(g_iModuleMajor, DEVICE_NAME);
dprintf(("VBoxDrv::ModuleInit returning %#x (major:%d)\n", rc, g_iModuleMajor));
#endif
return rc;
}
/**
* Unload the module.
*/
static void __exit VBoxDrvLinuxUnload(void)
{
int rc;
dprintf(("VBoxDrvLinuxUnload\n"));
/*
* I Don't think it's possible to unload a driver which processes have
* opened, at least we'll blindly assume that here.
*/
#ifdef CONFIG_VBOXDRV_AS_MISC
rc = misc_deregister(&gMiscDevice);
if (rc < 0)
{
dprintf(("misc_deregister failed with rc=%#x\n", rc));
}
#else /* !CONFIG_VBOXDRV_AS_MISC */
# ifdef CONFIG_DEVFS_FS
/*
* Unregister a device entry
*/
VBOX_UNREGISTER_DEVFS(g_hDevFsVBoxDrv);
# endif /* devfs */
rc = VBOX_UNREGISTER_DEVICE(g_iModuleMajor, DEVICE_NAME);
if (rc < 0)
{
dprintf(("VBOX_UNREGISTER_DEVICE failed with rc=%#x (major:%d)\n", rc, g_iModuleMajor));
}
#endif /* !CONFIG_VBOXDRV_AS_MISC */
/*
* Destroy GIP, delete the device extension and terminate IPRT.
*/
VBoxDrvLinuxTermGip(&g_DevExt);
supdrvDeleteDevExt(&g_DevExt);
RTR0Term();
}
/**
* Device open. Called on open /dev/vboxdrv
*
* @param pInode Pointer to inode info structure.
* @param pFilp Associated file pointer.
*/
static int VBoxDrvLinuxCreate(struct inode *pInode, struct file *pFilp)
{
int rc;
PSUPDRVSESSION pSession;
Log(("VBoxDrvLinuxCreate: pFilp=%p pid=%d/%d %s\n", pFilp, RTProcSelf(), current->pid, current->comm));
/*
* Call common code for the rest.
*/
rc = supdrvCreateSession(&g_DevExt, (PSUPDRVSESSION *)&pSession);
if (!rc)
{
pSession->Uid = current->euid;
pSession->Gid = current->egid;
pSession->Process = RTProcSelf();
pSession->R0Process = RTR0ProcHandleSelf();
}
pFilp->private_data = pSession;
Log(("VBoxDrvLinuxCreate: g_DevExt=%p pSession=%p rc=%d/%d (pid=%d/%d %s)\n",
&g_DevExt, pSession, rc, VBoxDrvLinuxErr2LinuxErr(rc),
RTProcSelf(), current->pid, current->comm));
return VBoxDrvLinuxErr2LinuxErr(rc);
}
/**
* Close device.
*
* @param pInode Pointer to inode info structure.
* @param pFilp Associated file pointer.
*/
static int VBoxDrvLinuxClose(struct inode *pInode, struct file *pFilp)
{
Log(("VBoxDrvLinuxClose: pFilp=%p pSession=%p pid=%d/%d %s\n",
pFilp, pFilp->private_data, RTProcSelf(), current->pid, current->comm));
supdrvCloseSession(&g_DevExt, (PSUPDRVSESSION)pFilp->private_data);
pFilp->private_data = NULL;
return 0;
}
/**
* Device I/O Control entry point.
*
* @param pFilp Associated file pointer.
* @param uCmd The function specified to ioctl().
* @param ulArg The argument specified to ioctl().
*/
#ifdef HAVE_UNLOCKED_IOCTL
static long VBoxDrvLinuxIOCtl(struct file *pFilp, unsigned int uCmd, unsigned long ulArg)
#else
static int VBoxDrvLinuxIOCtl(struct inode *pInode, struct file *pFilp, unsigned int uCmd, unsigned long ulArg)
#endif
{
/*
* Deal with the two high-speed IOCtl that takes it's arguments from
* the session and iCmd, and only returns a VBox status code.
*/
#ifdef HAVE_UNLOCKED_IOCTL
if (RT_LIKELY( uCmd == SUP_IOCTL_FAST_DO_RAW_RUN
|| uCmd == SUP_IOCTL_FAST_DO_HWACC_RUN
|| uCmd == SUP_IOCTL_FAST_DO_NOP))
return supdrvIOCtlFast(uCmd, &g_DevExt, (PSUPDRVSESSION)pFilp->private_data);
return VBoxDrvLinuxIOCtlSlow(pFilp, uCmd, ulArg);
#else /* !HAVE_UNLOCKED_IOCTL */
int rc;
unlock_kernel();
if (RT_LIKELY( uCmd == SUP_IOCTL_FAST_DO_RAW_RUN
|| uCmd == SUP_IOCTL_FAST_DO_HWACC_RUN
|| uCmd == SUP_IOCTL_FAST_DO_NOP))
rc = supdrvIOCtlFast(uCmd, &g_DevExt, (PSUPDRVSESSION)pFilp->private_data);
else
rc = VBoxDrvLinuxIOCtlSlow(pFilp, uCmd, ulArg);
lock_kernel();
return rc;
#endif /* !HAVE_UNLOCKED_IOCTL */
}
/**
* Device I/O Control entry point.
*
* @param pFilp Associated file pointer.
* @param uCmd The function specified to ioctl().
* @param ulArg The argument specified to ioctl().
*/
static int VBoxDrvLinuxIOCtlSlow(struct file *pFilp, unsigned int uCmd, unsigned long ulArg)
{
int rc;
SUPREQHDR Hdr;
PSUPREQHDR pHdr;
uint32_t cbBuf;
Log6(("VBoxDrvLinuxIOCtl: pFilp=%p uCmd=%#x ulArg=%p pid=%d/%d\n", pFilp, uCmd, (void *)ulArg, RTProcSelf(), current->pid));
/*
* Read the header.
*/
if (RT_UNLIKELY(copy_from_user(&Hdr, (void *)ulArg, sizeof(Hdr))))
{
Log(("VBoxDrvLinuxIOCtl: copy_from_user(,%#lx,) failed; uCmd=%#x.\n", ulArg, uCmd));
return -EFAULT;
}
if (RT_UNLIKELY((Hdr.fFlags & SUPREQHDR_FLAGS_MAGIC_MASK) != SUPREQHDR_FLAGS_MAGIC))
{
Log(("VBoxDrvLinuxIOCtl: bad header magic %#x; uCmd=%#x\n", Hdr.fFlags & SUPREQHDR_FLAGS_MAGIC_MASK, uCmd));
return -EINVAL;
}
/*
* Buffer the request.
*/
cbBuf = RT_MAX(Hdr.cbIn, Hdr.cbOut);
if (RT_UNLIKELY(cbBuf > _1M*16))
{
Log(("VBoxDrvLinuxIOCtl: too big cbBuf=%#x; uCmd=%#x\n", cbBuf, uCmd));
return -E2BIG;
}
if (RT_UNLIKELY(cbBuf != _IOC_SIZE(uCmd) && _IOC_SIZE(uCmd)))
{
Log(("VBoxDrvLinuxIOCtl: bad ioctl cbBuf=%#x _IOC_SIZE=%#x; uCmd=%#x.\n", cbBuf, _IOC_SIZE(uCmd), uCmd));
return -EINVAL;
}
pHdr = RTMemAlloc(cbBuf);
if (RT_UNLIKELY(!pHdr))
{
OSDBGPRINT(("VBoxDrvLinuxIOCtl: failed to allocate buffer of %d bytes for uCmd=%#x.\n", cbBuf, uCmd));
return -ENOMEM;
}
if (RT_UNLIKELY(copy_from_user(pHdr, (void *)ulArg, Hdr.cbIn)))
{
Log(("VBoxDrvLinuxIOCtl: copy_from_user(,%#lx, %#x) failed; uCmd=%#x.\n", ulArg, Hdr.cbIn, uCmd));
RTMemFree(pHdr);
return -EFAULT;
}
/*
* Process the IOCtl.
*/
rc = supdrvIOCtl(uCmd, &g_DevExt, (PSUPDRVSESSION)pFilp->private_data, pHdr);
/*
* Copy ioctl data and output buffer back to user space.
*/
if (RT_LIKELY(!rc))
{
uint32_t cbOut = pHdr->cbOut;
if (RT_UNLIKELY(cbOut > cbBuf))
{
OSDBGPRINT(("VBoxDrvLinuxIOCtl: too much output! %#x > %#x; uCmd=%#x!\n", cbOut, cbBuf, uCmd));
cbOut = cbBuf;
}
if (RT_UNLIKELY(copy_to_user((void *)ulArg, pHdr, cbOut)))
{
/* this is really bad! */
OSDBGPRINT(("VBoxDrvLinuxIOCtl: copy_to_user(%#lx,,%#x); uCmd=%#x!\n", ulArg, cbOut, uCmd));
rc = -EFAULT;
}
}
else
{
Log(("VBoxDrvLinuxIOCtl: pFilp=%p uCmd=%#x ulArg=%p failed, rc=%d\n", pFilp, uCmd, (void *)ulArg, rc));
rc = -EINVAL;
}
RTMemFree(pHdr);
Log6(("VBoxDrvLinuxIOCtl: returns %d (pid=%d/%d)\n", rc, RTProcSelf(), current->pid));
return rc;
}
/**
* Initializes any OS specific object creator fields.
*/
void VBOXCALL supdrvOSObjInitCreator(PSUPDRVOBJ pObj, PSUPDRVSESSION pSession)
{
NOREF(pObj);
NOREF(pSession);
}
/**
* Checks if the session can access the object.
*
* @returns true if a decision has been made.
* @returns false if the default access policy should be applied.
*
* @param pObj The object in question.
* @param pSession The session wanting to access the object.
* @param pszObjName The object name, can be NULL.
* @param prc Where to store the result when returning true.
*/
bool VBOXCALL supdrvOSObjCanAccess(PSUPDRVOBJ pObj, PSUPDRVSESSION pSession, const char *pszObjName, int *prc)
{
NOREF(pObj);
NOREF(pSession);
NOREF(pszObjName);
NOREF(prc);
return false;
}
/**
* Initializes the GIP.
*
* @returns negative errno.
* @param pDevExt Instance data. GIP stuff may be updated.
*/
static int VBoxDrvLinuxInitGip(PSUPDRVDEVEXT pDevExt)
{
struct page *pPage;
dma_addr_t HCPhys;
PSUPGLOBALINFOPAGE pGip;
#ifdef CONFIG_SMP
unsigned i;
#endif
LogFlow(("VBoxDrvLinuxInitGip:\n"));
/*
* Allocate the page.
*/
pPage = alloc_pages(GFP_USER, 0);
if (!pPage)
{
Log(("VBoxDrvLinuxInitGip: failed to allocate the GIP page\n"));
return -ENOMEM;
}
/*
* Lock the page.
*/
SetPageReserved(pPage);
g_pGipPage = pPage;
/*
* Call common initialization routine.
*/
HCPhys = page_to_phys(pPage);
pGip = (PSUPGLOBALINFOPAGE)page_address(pPage);
pDevExt->ulLastJiffies = jiffies;
pDevExt->u64LastMonotime = (uint64_t)pDevExt->ulLastJiffies * TICK_NSEC;
Log(("VBoxDrvInitGIP: TICK_NSEC=%ld HZ=%d jiffies=%ld now=%lld\n",
TICK_NSEC, HZ, pDevExt->ulLastJiffies, pDevExt->u64LastMonotime));
supdrvGipInit(pDevExt, pGip, HCPhys, pDevExt->u64LastMonotime,
HZ <= 1000 ? HZ : 1000);
/*
* Initialize the timer.
*/
vbox_ktimer_init(&g_GipTimer, VBoxDrvLinuxGipTimer, (unsigned long)pDevExt);
#ifdef CONFIG_SMP
for (i = 0; i < RT_ELEMENTS(pDevExt->aCPUs); i++)
{
pDevExt->aCPUs[i].u64LastMonotime = pDevExt->u64LastMonotime;
pDevExt->aCPUs[i].ulLastJiffies = pDevExt->ulLastJiffies;
pDevExt->aCPUs[i].iSmpProcessorId = -512;
vbox_ktimer_init(&pDevExt->aCPUs[i].Timer, VBoxDrvLinuxGipTimerPerCpu, i);
}
#endif
return 0;
}
/**
* Terminates the GIP.
*
* @returns negative errno.
* @param pDevExt Instance data. GIP stuff may be updated.
*/
static int VBoxDrvLinuxTermGip(PSUPDRVDEVEXT pDevExt)
{
struct page *pPage;
PSUPGLOBALINFOPAGE pGip;
#ifdef CONFIG_SMP
unsigned i;
#endif
LogFlow(("VBoxDrvLinuxTermGip:\n"));
/*
* Delete the timer if it's pending.
*/
vbox_ktimer_stop(&g_GipTimer);
#ifdef CONFIG_SMP
for (i = 0; i < RT_ELEMENTS(pDevExt->aCPUs); i++)
vbox_ktimer_stop(&pDevExt->aCPUs[i].Timer);
#endif
/*
* Uninitialize the content.
*/
pGip = pDevExt->pGip;
pDevExt->pGip = NULL;
if (pGip)
supdrvGipTerm(pGip);
/*
* Free the page.
*/
pPage = g_pGipPage;
g_pGipPage = NULL;
if (pPage)
{
ClearPageReserved(pPage);
__free_pages(pPage, 0);
}
return 0;
}
/**
* Timer callback function.
*
* In ASYNC TSC mode this is called on the primary CPU, and we're
* assuming that the CPU remains online.
*
* @param ulUser The device extension pointer.
*/
#ifdef VBOX_HRTIMER
static enum hrtimer_restart VBoxDrvLinuxGipTimer(struct hrtimer *pTimer)
#else
static void VBoxDrvLinuxGipTimer(unsigned long ulUser)
#endif
{
PSUPDRVDEVEXT pDevExt;
PSUPGLOBALINFOPAGE pGip;
unsigned long ulNow;
unsigned long ulDiff;
uint64_t u64Monotime;
unsigned long SavedFlags;
#ifdef VBOX_HRTIMER
ktime_t KtNow;
#endif
local_irq_save(SavedFlags);
ulNow = jiffies;
#ifdef VBOX_HRTIMER
KtNow = ktime_get();
pDevExt = &g_DevExt;
#else
pDevExt = (PSUPDRVDEVEXT)ulUser;
#endif
pGip = pDevExt->pGip;
#ifdef CONFIG_SMP
if (pGip && pGip->u32Mode == SUPGIPMODE_ASYNC_TSC)
{
uint8_t iCPU = ASMGetApicId();
ulDiff = ulNow - pDevExt->aCPUs[iCPU].ulLastJiffies;
pDevExt->aCPUs[iCPU].ulLastJiffies = ulNow;
u64Monotime = pDevExt->aCPUs[iCPU].u64LastMonotime + ulDiff * TICK_NSEC;
pDevExt->aCPUs[iCPU].u64LastMonotime = u64Monotime;
}
else
#endif /* CONFIG_SMP */
{
ulDiff = ulNow - pDevExt->ulLastJiffies;
pDevExt->ulLastJiffies = ulNow;
u64Monotime = pDevExt->u64LastMonotime + ulDiff * TICK_NSEC;
pDevExt->u64LastMonotime = u64Monotime;
}
if (RT_LIKELY(pGip))
supdrvGipUpdate(pDevExt->pGip, u64Monotime);
if (RT_LIKELY(!pDevExt->fGIPSuspended))
{
#ifdef VBOX_HRTIMER
hrtimer_forward(&g_GipTimer, KtNow, ktime_set(0, 1000000));
#else
mod_timer(&g_GipTimer, ulNow + ONE_MSEC_IN_JIFFIES);
#endif
}
local_irq_restore(SavedFlags);
#ifdef VBOX_HRTIMER
return pDevExt->fGIPSuspended ? HRTIMER_NORESTART : HRTIMER_RESTART;
#endif
}
#ifdef CONFIG_SMP
/**
* Timer callback function for the other CPUs.
*
* @param iTimerCPU The APIC ID of this timer.
*/
#ifdef VBOX_HRTIMER
static enum hrtimer_restart VBoxDrvLinuxGipTimerPerCpu(struct hrtimer *pTimer)
#else
static void VBoxDrvLinuxGipTimerPerCpu(unsigned long iTimerCPU)
#endif
{
PSUPDRVDEVEXT pDevExt;
PSUPGLOBALINFOPAGE pGip;
uint8_t iCPU;
uint64_t u64Monotime;
unsigned long SavedFlags;
unsigned long ulNow;
# ifdef VBOX_HRTIMER
unsigned long iTimerCPU;
ktime_t KtNow;
# endif
local_irq_save(SavedFlags);
ulNow = jiffies;
pDevExt = &g_DevExt;
pGip = pDevExt->pGip;
iCPU = ASMGetApicId();
# ifdef VBOX_HRTIMER
iTimerCPU = iCPU; /* XXX hrtimer does not support a 'data' field */
KtNow = ktime_get();
# endif
if (RT_LIKELY(iCPU < RT_ELEMENTS(pGip->aCPUs)))
{
if (RT_LIKELY(iTimerCPU == iCPU))
{
unsigned long ulDiff = ulNow - pDevExt->aCPUs[iCPU].ulLastJiffies;
pDevExt->aCPUs[iCPU].ulLastJiffies = ulNow;
u64Monotime = pDevExt->aCPUs[iCPU].u64LastMonotime + ulDiff * TICK_NSEC;
pDevExt->aCPUs[iCPU].u64LastMonotime = u64Monotime;
if (RT_LIKELY(pGip))
supdrvGipUpdatePerCpu(pGip, u64Monotime, iCPU);
if (RT_LIKELY(!pDevExt->fGIPSuspended))
{
# ifdef VBOX_HRTIMER
hrtimer_forward(&pDevExt->aCPUs[iCPU].Timer, KtNow, ktime_set(0, 1000000));
# else
mod_timer(&pDevExt->aCPUs[iCPU].Timer, ulNow + ONE_MSEC_IN_JIFFIES);
# endif
}
}
else
printk("vboxdrv: error: GIP CPU update timer executing on the wrong CPU: apicid=%d != timer-apicid=%ld (cpuid=%d !=? timer-cpuid=%d)\n",
iCPU, iTimerCPU, smp_processor_id(), pDevExt->aCPUs[iTimerCPU].iSmpProcessorId);
}
else
printk("vboxdrv: error: APIC ID is bogus (GIP CPU update): apicid=%d max=%lu cpuid=%d\n",
iCPU, (unsigned long)RT_ELEMENTS(pGip->aCPUs), smp_processor_id());
local_irq_restore(SavedFlags);
# ifdef VBOX_HRTIMER
return pDevExt->fGIPSuspended ? HRTIMER_NORESTART : HRTIMER_RESTART;
# endif
}
#endif /* CONFIG_SMP */
/**
* Maps the GIP into user space.
*
* @returns negative errno.
* @param pDevExt Instance data.
*/
int VBOXCALL supdrvOSGipMap(PSUPDRVDEVEXT pDevExt, PSUPGLOBALINFOPAGE *ppGip)
{
int rc = 0;
unsigned long ulAddr;
unsigned long HCPhys = pDevExt->HCPhysGip;
pgprot_t pgFlags;
pgprot_val(pgFlags) = _PAGE_PRESENT | _PAGE_USER;
LogFlow(("supdrvOSGipMap: ppGip=%p\n", ppGip));
/*
* Allocate user space mapping and put the physical pages into it.
*/
down_write(&current->mm->mmap_sem);
ulAddr = do_mmap(NULL, 0, PAGE_SIZE, PROT_READ, MAP_SHARED | MAP_ANONYMOUS, 0);
if (!(ulAddr & ~PAGE_MASK))
{
#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 0) && !defined(HAVE_26_STYLE_REMAP_PAGE_RANGE)
int rc2 = remap_page_range(ulAddr, HCPhys, PAGE_SIZE, pgFlags);
#else
int rc2 = 0;
struct vm_area_struct *vma = find_vma(current->mm, ulAddr);
if (vma)
#if LINUX_VERSION_CODE < KERNEL_VERSION(2, 6, 11)
rc2 = remap_page_range(vma, ulAddr, HCPhys, PAGE_SIZE, pgFlags);
#else
rc2 = remap_pfn_range(vma, ulAddr, HCPhys >> PAGE_SHIFT, PAGE_SIZE, pgFlags);
#endif
else
{
rc = SUPDRV_ERR_NO_MEMORY;
Log(("supdrvOSGipMap: no vma found for ulAddr=%#lx!\n", ulAddr));
}
#endif
if (rc2)
{
rc = SUPDRV_ERR_NO_MEMORY;
Log(("supdrvOSGipMap: remap_page_range failed rc2=%d\n", rc2));
}
}
else
{
Log(("supdrvOSGipMap: do_mmap failed ulAddr=%#lx\n", ulAddr));
rc = SUPDRV_ERR_NO_MEMORY;
}
up_write(&current->mm->mmap_sem); /* not quite sure when to give this up. */
/*
* Success?
*/
if (!rc)
{
*ppGip = (PSUPGLOBALINFOPAGE)ulAddr;
LogFlow(("supdrvOSGipMap: ppGip=%p\n", *ppGip));
return 0;
}
/*
* Failure, cleanup and be gone.
*/
if (ulAddr & ~PAGE_MASK)
{
down_write(&current->mm->mmap_sem);
MY_DO_MUNMAP(current->mm, ulAddr, PAGE_SIZE);
up_write(&current->mm->mmap_sem);
}
LogFlow(("supdrvOSGipMap: returns %d\n", rc));
return rc;
}
/**
* Maps the GIP into user space.
*
* @returns negative errno.
* @param pDevExt Instance data.
*/
int VBOXCALL supdrvOSGipUnmap(PSUPDRVDEVEXT pDevExt, PSUPGLOBALINFOPAGE pGip)
{
LogFlow(("supdrvOSGipUnmap: pGip=%p\n", pGip));
if (current->mm)
{
down_write(&current->mm->mmap_sem);
MY_DO_MUNMAP(current->mm, (unsigned long)pGip, PAGE_SIZE);
up_write(&current->mm->mmap_sem);
}
LogFlow(("supdrvOSGipUnmap: returns 0\n"));
return 0;
}
/**
* Resumes the GIP updating.
*
* @param pDevExt Instance data.
*/
void VBOXCALL supdrvOSGipResume(PSUPDRVDEVEXT pDevExt)
{
LogFlow(("supdrvOSGipResume:\n"));
ASMAtomicXchgU8(&pDevExt->fGIPSuspended, false);
#ifdef CONFIG_SMP
if (pDevExt->pGip->u32Mode != SUPGIPMODE_ASYNC_TSC)
{
#endif
vbox_ktimer_start(&g_GipTimer);
#ifdef CONFIG_SMP
}
else
{
vbox_ktimer_start(&g_GipTimer);
smp_call_function(VBoxDrvLinuxGipResumePerCpu, pDevExt, 0 /* retry */, 1 /* wait */);
}
#endif
}
#ifdef CONFIG_SMP
/**
* Callback for resuming GIP updating on the other CPUs.
*
* This is only used when the GIP is in async tsc mode.
*
* @param pvUser Pointer to the device instance.
*/
static void VBoxDrvLinuxGipResumePerCpu(void *pvUser)
{
PSUPDRVDEVEXT pDevExt = (PSUPDRVDEVEXT)pvUser;
uint8_t iCPU = ASMGetApicId();
if (RT_UNLIKELY(iCPU >= RT_ELEMENTS(pDevExt->pGip->aCPUs)))
{
printk("vboxdrv: error: apicid=%d max=%lu cpuid=%d\n",
iCPU, (unsigned long)RT_ELEMENTS(pDevExt->pGip->aCPUs), smp_processor_id());
return;
}
pDevExt->aCPUs[iCPU].iSmpProcessorId = smp_processor_id();
vbox_ktimer_start(&pDevExt->aCPUs[iCPU].Timer);
}
#endif /* CONFIG_SMP */
/**
* Suspends the GIP updating.
*
* @param pDevExt Instance data.
*/
void VBOXCALL supdrvOSGipSuspend(PSUPDRVDEVEXT pDevExt)
{
#ifdef CONFIG_SMP
unsigned i;
#endif
LogFlow(("supdrvOSGipSuspend:\n"));
ASMAtomicXchgU8(&pDevExt->fGIPSuspended, true);
vbox_ktimer_stop(&g_GipTimer);
#ifdef CONFIG_SMP
for (i = 0; i < RT_ELEMENTS(pDevExt->aCPUs); i++)
vbox_ktimer_stop(&pDevExt->aCPUs[i].Timer);
#endif
}
/**
* Get the current CPU count.
* @returns Number of cpus.
*/
unsigned VBOXCALL supdrvOSGetCPUCount(void)
{
#ifdef CONFIG_SMP
# if defined(num_present_cpus) && !defined(VBOX_REDHAT_KABI)
return num_present_cpus();
# elif defined(num_possible_cpus)
return num_possible_cpus();
# else
return smp_num_cpus;
# endif
#else
return 1;
#endif
}
/**
* Force async tsc mode.
* @todo add a module argument for this.
*/
bool VBOXCALL supdrvOSGetForcedAsyncTscMode(void)
{
return force_async_tsc != 0;
}
/**
* Converts a supdrv error code to an linux error code.
*
* @returns corresponding linux error code.
* @param rc supdrv error code (SUPDRV_ERR_* defines).
*/
static int VBoxDrvLinuxErr2LinuxErr(int rc)
{
switch (rc)
{
case 0: return 0;
case SUPDRV_ERR_GENERAL_FAILURE: return -EACCES;
case SUPDRV_ERR_INVALID_PARAM: return -EINVAL;
case SUPDRV_ERR_INVALID_MAGIC: return -EILSEQ;
case SUPDRV_ERR_INVALID_HANDLE: return -ENXIO;
case SUPDRV_ERR_INVALID_POINTER: return -EFAULT;
case SUPDRV_ERR_LOCK_FAILED: return -ENOLCK;
case SUPDRV_ERR_ALREADY_LOADED: return -EEXIST;
case SUPDRV_ERR_PERMISSION_DENIED: return -EPERM;
case SUPDRV_ERR_VERSION_MISMATCH: return -ENOSYS;
case SUPDRV_ERR_IDT_FAILED: return -1000;
}
return -EPERM;
}
RTDECL(int) SUPR0Printf(const char *pszFormat, ...)
{
#if 1
va_list args;
char szMsg[512];
va_start(args, pszFormat);
vsnprintf(szMsg, sizeof(szMsg) - 1, pszFormat, args);
szMsg[sizeof(szMsg) - 1] = '\0';
printk("%s", szMsg);
va_end(args);
#else
/* forward to printf - needs some more GCC hacking to fix ebp... */
__asm__ __volatile__ ("mov %0, %esp\n\t"
"jmp %1\n\t",
:: "r" ((uintptr_t)&pszFormat - 4),
"m" (printk));
#endif
return 0;
}
/** Runtime assert implementation for Linux Ring-0. */
RTDECL(bool) RTAssertDoBreakpoint(void)
{
return true;
}
/** Runtime assert implementation for Linux Ring-0. */
RTDECL(void) AssertMsg1(const char *pszExpr, unsigned uLine, const char *pszFile, const char *pszFunction)
{
printk("!!Assertion Failed!!\n"
"Expression: %s\n"
"Location : %s(%d) %s\n",
pszExpr, pszFile, uLine, pszFunction);
}
/** Runtime assert implementation for Linux Ring-0. */
RTDECL(void) AssertMsg2(const char *pszFormat, ...)
{ /* forwarder. */
va_list ap;
char msg[256];
va_start(ap, pszFormat);
vsnprintf(msg, sizeof(msg) - 1, pszFormat, ap);
msg[sizeof(msg) - 1] = '\0';
printk("%s", msg);
va_end(ap);
}
/* GCC C++ hack. */
unsigned __gxx_personality_v0 = 0xcccccccc;
module_init(VBoxDrvLinuxInit);
module_exit(VBoxDrvLinuxUnload);
MODULE_AUTHOR("innotek GmbH");
MODULE_DESCRIPTION("VirtualBox Support Driver");
MODULE_LICENSE("GPL");
#ifdef MODULE_VERSION
MODULE_VERSION(VBOX_VERSION_STRING " (" xstr(SUPDRVIOC_VERSION) ")");
#endif
#if LINUX_VERSION_CODE >= KERNEL_VERSION(2, 6, 0)
module_param(force_async_tsc, int, 0444);
#else
MODULE_PARM(force_async_tsc, "i");
#endif
MODULE_PARM_DESC(force_async_tsc, "force the asynchronous TSC mode");