blob: 5b821b5eb1251a2e65ebb1e7e170bc8683fd4ba7 [file] [log] [blame] [raw]
#include "libcflat.h"
#include "smp.h"
#include "processor.h"
#include "atomic.h"
#include "pci.h"
#include "x86/vm.h"
#include "x86/desc.h"
#include "x86/acpi.h"
#include "x86/apic.h"
#include "x86/isr.h"
#define IPI_TEST_VECTOR 0xb0
struct test {
void (*func)(void);
const char *name;
int (*valid)(void);
int parallel;
bool (*next)(struct test *);
};
#define GOAL (1ull << 30)
static int nr_cpus;
static void cpuid_test(void)
{
asm volatile ("push %%"R "bx; cpuid; pop %%"R "bx"
: : : "eax", "ecx", "edx");
}
static void vmcall(void)
{
unsigned long a = 0, b, c, d;
asm volatile ("vmcall" : "+a"(a), "=b"(b), "=c"(c), "=d"(d));
}
#define MSR_TSC_ADJUST 0x3b
#define MSR_EFER 0xc0000080
#define EFER_NX_MASK (1ull << 11)
#ifdef __x86_64__
static void mov_from_cr8(void)
{
unsigned long cr8;
asm volatile ("mov %%cr8, %0" : "=r"(cr8));
}
static void mov_to_cr8(void)
{
unsigned long cr8 = 0;
asm volatile ("mov %0, %%cr8" : : "r"(cr8));
}
#endif
static int is_smp(void)
{
return cpu_count() > 1;
}
static void nop(void *junk)
{
}
volatile int x = 0;
static void self_ipi_isr(isr_regs_t *regs)
{
x++;
eoi();
}
static void x2apic_self_ipi(int vec)
{
wrmsr(0x83f, vec);
}
static void apic_self_ipi(int vec)
{
apic_icr_write(APIC_INT_ASSERT | APIC_DEST_SELF | APIC_DEST_PHYSICAL |
APIC_DM_FIXED | IPI_TEST_VECTOR, vec);
}
static void self_ipi_sti_nop(void)
{
x = 0;
irq_disable();
apic_self_ipi(IPI_TEST_VECTOR);
asm volatile("sti; nop");
if (x != 1) printf("%d", x);
}
static void self_ipi_sti_hlt(void)
{
x = 0;
irq_disable();
apic_self_ipi(IPI_TEST_VECTOR);
asm volatile("sti; hlt");
if (x != 1) printf("%d", x);
}
static void self_ipi_tpr(void)
{
x = 0;
apic_set_tpr(0x0f);
apic_self_ipi(IPI_TEST_VECTOR);
apic_set_tpr(0x00);
asm volatile("nop");
if (x != 1) printf("%d", x);
}
static void self_ipi_tpr_sti_nop(void)
{
x = 0;
irq_disable();
apic_set_tpr(0x0f);
apic_self_ipi(IPI_TEST_VECTOR);
apic_set_tpr(0x00);
asm volatile("sti; nop");
if (x != 1) printf("%d", x);
}
static void self_ipi_tpr_sti_hlt(void)
{
x = 0;
irq_disable();
apic_set_tpr(0x0f);
apic_self_ipi(IPI_TEST_VECTOR);
apic_set_tpr(0x00);
asm volatile("sti; hlt");
if (x != 1) printf("%d", x);
}
static int is_x2apic(void)
{
return rdmsr(MSR_IA32_APICBASE) & APIC_EXTD;
}
static void x2apic_self_ipi_sti_nop(void)
{
irq_disable();
x2apic_self_ipi(IPI_TEST_VECTOR);
asm volatile("sti; nop");
}
static void x2apic_self_ipi_sti_hlt(void)
{
irq_disable();
x2apic_self_ipi(IPI_TEST_VECTOR);
asm volatile("sti; hlt");
}
static void x2apic_self_ipi_tpr(void)
{
apic_set_tpr(0x0f);
x2apic_self_ipi(IPI_TEST_VECTOR);
apic_set_tpr(0x00);
asm volatile("nop");
}
static void x2apic_self_ipi_tpr_sti_nop(void)
{
irq_disable();
apic_set_tpr(0x0f);
x2apic_self_ipi(IPI_TEST_VECTOR);
apic_set_tpr(0x00);
asm volatile("sti; nop");
}
static void x2apic_self_ipi_tpr_sti_hlt(void)
{
irq_disable();
apic_set_tpr(0x0f);
x2apic_self_ipi(IPI_TEST_VECTOR);
apic_set_tpr(0x00);
asm volatile("sti; hlt");
}
static void ipi(void)
{
on_cpu(1, nop, 0);
}
static void ipi_halt(void)
{
unsigned long long t;
on_cpu(1, nop, 0);
t = rdtsc() + 2000;
while (rdtsc() < t)
;
}
int pm_tmr_blk;
static void inl_pmtimer(void)
{
inl(pm_tmr_blk);
}
static void inl_nop_qemu(void)
{
inl(0x1234);
}
static void inl_nop_kernel(void)
{
inb(0x4d0);
}
static void outl_elcr_kernel(void)
{
outb(0, 0x4d0);
}
static void mov_dr(void)
{
asm volatile("mov %0, %%dr7" : : "r" (0x400L));
}
static void ple_round_robin(void)
{
struct counter {
volatile int n1;
int n2;
} __attribute__((aligned(64)));
static struct counter counters[64] = { { -1, 0 } };
int me = smp_id();
int you;
volatile struct counter *p = &counters[me];
while (p->n1 == p->n2)
asm volatile ("pause");
p->n2 = p->n1;
you = me + 1;
if (you == nr_cpus)
you = 0;
++counters[you].n1;
}
static void rd_tsc_adjust_msr(void)
{
rdmsr(MSR_TSC_ADJUST);
}
static void wr_tsc_adjust_msr(void)
{
wrmsr(MSR_TSC_ADJUST, 0x0);
}
static struct pci_test {
unsigned iobar;
unsigned ioport;
volatile void *memaddr;
volatile void *mem;
int test_idx;
uint32_t data;
uint32_t offset;
} pci_test = {
.test_idx = -1
};
static void pci_mem_testb(void)
{
*(volatile uint8_t *)pci_test.mem = pci_test.data;
}
static void pci_mem_testw(void)
{
*(volatile uint16_t *)pci_test.mem = pci_test.data;
}
static void pci_mem_testl(void)
{
*(volatile uint32_t *)pci_test.mem = pci_test.data;
}
static void pci_io_testb(void)
{
outb(pci_test.data, pci_test.ioport);
}
static void pci_io_testw(void)
{
outw(pci_test.data, pci_test.ioport);
}
static void pci_io_testl(void)
{
outl(pci_test.data, pci_test.ioport);
}
static uint8_t ioreadb(unsigned long addr, bool io)
{
if (io) {
return inb(addr);
} else {
return *(volatile uint8_t *)addr;
}
}
static uint32_t ioreadl(unsigned long addr, bool io)
{
/* Note: assumes little endian */
if (io) {
return inl(addr);
} else {
return *(volatile uint32_t *)addr;
}
}
static void iowriteb(unsigned long addr, uint8_t data, bool io)
{
if (io) {
outb(data, addr);
} else {
*(volatile uint8_t *)addr = data;
}
}
static bool pci_next(struct test *test, unsigned long addr, bool io)
{
int i;
uint8_t width;
if (!pci_test.memaddr) {
test->func = NULL;
return true;
}
pci_test.test_idx++;
iowriteb(addr + offsetof(struct pci_test_dev_hdr, test),
pci_test.test_idx, io);
width = ioreadb(addr + offsetof(struct pci_test_dev_hdr, width),
io);
switch (width) {
case 1:
test->func = io ? pci_io_testb : pci_mem_testb;
break;
case 2:
test->func = io ? pci_io_testw : pci_mem_testw;
break;
case 4:
test->func = io ? pci_io_testl : pci_mem_testl;
break;
default:
/* Reset index for purposes of the next test */
pci_test.test_idx = -1;
test->func = NULL;
return false;
}
pci_test.data = ioreadl(addr + offsetof(struct pci_test_dev_hdr, data),
io);
pci_test.offset = ioreadl(addr + offsetof(struct pci_test_dev_hdr,
offset), io);
for (i = 0; i < pci_test.offset; ++i) {
char c = ioreadb(addr + offsetof(struct pci_test_dev_hdr,
name) + i, io);
if (!c) {
break;
}
printf("%c",c);
}
printf(":");
return true;
}
static bool pci_mem_next(struct test *test)
{
bool ret;
ret = pci_next(test, ((unsigned long)pci_test.memaddr), false);
if (ret) {
pci_test.mem = pci_test.memaddr + pci_test.offset;
}
return ret;
}
static bool pci_io_next(struct test *test)
{
bool ret;
ret = pci_next(test, ((unsigned long)pci_test.iobar), true);
if (ret) {
pci_test.ioport = pci_test.iobar + pci_test.offset;
}
return ret;
}
static struct test tests[] = {
{ cpuid_test, "cpuid", .parallel = 1, },
{ vmcall, "vmcall", .parallel = 1, },
#ifdef __x86_64__
{ mov_from_cr8, "mov_from_cr8", .parallel = 1, },
{ mov_to_cr8, "mov_to_cr8" , .parallel = 1, },
#endif
{ inl_pmtimer, "inl_from_pmtimer", .parallel = 1, },
{ inl_nop_qemu, "inl_from_qemu", .parallel = 1 },
{ inl_nop_kernel, "inl_from_kernel", .parallel = 1 },
{ outl_elcr_kernel, "outl_to_kernel", .parallel = 1 },
{ mov_dr, "mov_dr", .parallel = 1 },
{ self_ipi_sti_nop, "self_ipi_sti_nop", .parallel = 0, },
{ self_ipi_sti_hlt, "self_ipi_sti_hlt", .parallel = 0, },
{ self_ipi_tpr, "self_ipi_tpr", .parallel = 0, },
{ self_ipi_tpr_sti_nop, "self_ipi_tpr_sti_nop", .parallel = 0, },
{ self_ipi_tpr_sti_hlt, "self_ipi_tpr_sti_hlt", .parallel = 0, },
{ x2apic_self_ipi_sti_nop, "x2apic_self_ipi_sti_nop", is_x2apic, .parallel = 0, },
{ x2apic_self_ipi_sti_hlt, "x2apic_self_ipi_sti_hlt", is_x2apic, .parallel = 0, },
{ x2apic_self_ipi_tpr, "x2apic_self_ipi_tpr", is_x2apic, .parallel = 0, },
{ x2apic_self_ipi_tpr_sti_nop, "x2apic_self_ipi_tpr_sti_nop", is_x2apic, .parallel = 0, },
{ x2apic_self_ipi_tpr_sti_hlt, "x2apic_self_ipi_tpr_sti_hlt", is_x2apic, .parallel = 0, },
{ ipi, "ipi", is_smp, .parallel = 0, },
{ ipi_halt, "ipi+halt", is_smp, .parallel = 0, },
{ ple_round_robin, "ple-round-robin", .parallel = 1 },
{ wr_tsc_adjust_msr, "wr_tsc_adjust_msr", .parallel = 1 },
{ rd_tsc_adjust_msr, "rd_tsc_adjust_msr", .parallel = 1 },
{ NULL, "pci-mem", .parallel = 0, .next = pci_mem_next },
{ NULL, "pci-io", .parallel = 0, .next = pci_io_next },
};
unsigned iterations;
static atomic_t nr_cpus_done;
static void run_test(void *_func)
{
int i;
void (*func)(void) = _func;
for (i = 0; i < iterations; ++i)
func();
atomic_inc(&nr_cpus_done);
}
static bool do_test(struct test *test)
{
int i;
unsigned long long t1, t2;
void (*func)(void);
iterations = 32;
if (test->valid && !test->valid()) {
printf("%s (skipped)\n", test->name);
return false;
}
if (test->next && !test->next(test)) {
return false;
}
func = test->func;
if (!func) {
printf("%s (skipped)\n", test->name);
return false;
}
do {
iterations *= 2;
t1 = rdtsc();
if (!test->parallel) {
for (i = 0; i < iterations; ++i)
func();
} else {
atomic_set(&nr_cpus_done, 0);
for (i = cpu_count(); i > 0; i--)
on_cpu_async(i-1, run_test, func);
while (atomic_read(&nr_cpus_done) < cpu_count())
;
}
t2 = rdtsc();
} while ((t2 - t1) < GOAL);
printf("%s %d\n", test->name, (int)((t2 - t1) / iterations));
return test->next;
}
static void enable_nx(void *junk)
{
if (cpuid(0x80000001).d & (1 << 20))
wrmsr(MSR_EFER, rdmsr(MSR_EFER) | EFER_NX_MASK);
}
bool test_wanted(struct test *test, char *wanted[], int nwanted)
{
int i;
if (!nwanted)
return true;
for (i = 0; i < nwanted; ++i)
if (strcmp(wanted[i], test->name) == 0)
return true;
return false;
}
int main(int ac, char **av)
{
struct fadt_descriptor_rev1 *fadt;
int i;
unsigned long membar = 0;
struct pci_dev pcidev;
int ret;
smp_init();
setup_vm();
handle_irq(IPI_TEST_VECTOR, self_ipi_isr);
nr_cpus = cpu_count();
irq_enable();
for (i = cpu_count(); i > 0; i--)
on_cpu(i-1, enable_nx, 0);
fadt = find_acpi_table_addr(FACP_SIGNATURE);
pm_tmr_blk = fadt->pm_tmr_blk;
printf("PM timer port is %x\n", pm_tmr_blk);
ret = pci_find_dev(PCI_VENDOR_ID_REDHAT, PCI_DEVICE_ID_REDHAT_TEST);
if (ret != PCIDEVADDR_INVALID) {
pci_dev_init(&pcidev, ret);
assert(pci_bar_is_memory(&pcidev, PCI_TESTDEV_BAR_MEM));
assert(!pci_bar_is_memory(&pcidev, PCI_TESTDEV_BAR_IO));
membar = pcidev.resource[PCI_TESTDEV_BAR_MEM];
pci_test.memaddr = ioremap(membar, PAGE_SIZE);
pci_test.iobar = pcidev.resource[PCI_TESTDEV_BAR_IO];
printf("pci-testdev at 0x%x membar %lx iobar %x\n",
pcidev.bdf, membar, pci_test.iobar);
}
for (i = 0; i < ARRAY_SIZE(tests); ++i)
if (test_wanted(&tests[i], av + 1, ac - 1))
while (do_test(&tests[i])) {}
return 0;
}