Create spapr_nested.c for most of the nested HV implementation. Signed-off-by: Nicholas Piggin <npiggin@gmail.com> Reviewed-by: Harsh Prateek Bora <harshpb@linux.ibm.com> Signed-off-by: Cédric Le Goater <clg@kaod.org>
		
			
				
	
	
		
			396 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			396 lines
		
	
	
		
			12 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
#include "qemu/osdep.h"
 | 
						|
#include "qemu/cutils.h"
 | 
						|
#include "exec/exec-all.h"
 | 
						|
#include "helper_regs.h"
 | 
						|
#include "hw/ppc/ppc.h"
 | 
						|
#include "hw/ppc/spapr.h"
 | 
						|
#include "hw/ppc/spapr_cpu_core.h"
 | 
						|
#include "hw/ppc/spapr_nested.h"
 | 
						|
 | 
						|
#ifdef CONFIG_TCG
 | 
						|
#define PRTS_MASK      0x1f
 | 
						|
 | 
						|
static target_ulong h_set_ptbl(PowerPCCPU *cpu,
 | 
						|
                               SpaprMachineState *spapr,
 | 
						|
                               target_ulong opcode,
 | 
						|
                               target_ulong *args)
 | 
						|
{
 | 
						|
    target_ulong ptcr = args[0];
 | 
						|
 | 
						|
    if (!spapr_get_cap(spapr, SPAPR_CAP_NESTED_KVM_HV)) {
 | 
						|
        return H_FUNCTION;
 | 
						|
    }
 | 
						|
 | 
						|
    if ((ptcr & PRTS_MASK) + 12 - 4 > 12) {
 | 
						|
        return H_PARAMETER;
 | 
						|
    }
 | 
						|
 | 
						|
    spapr->nested_ptcr = ptcr; /* Save new partition table */
 | 
						|
 | 
						|
    return H_SUCCESS;
 | 
						|
}
 | 
						|
 | 
						|
static target_ulong h_tlb_invalidate(PowerPCCPU *cpu,
 | 
						|
                                     SpaprMachineState *spapr,
 | 
						|
                                     target_ulong opcode,
 | 
						|
                                     target_ulong *args)
 | 
						|
{
 | 
						|
    /*
 | 
						|
     * The spapr virtual hypervisor nested HV implementation retains no L2
 | 
						|
     * translation state except for TLB. And the TLB is always invalidated
 | 
						|
     * across L1<->L2 transitions, so nothing is required here.
 | 
						|
     */
 | 
						|
 | 
						|
    return H_SUCCESS;
 | 
						|
}
 | 
						|
 | 
						|
static target_ulong h_copy_tofrom_guest(PowerPCCPU *cpu,
 | 
						|
                                        SpaprMachineState *spapr,
 | 
						|
                                        target_ulong opcode,
 | 
						|
                                        target_ulong *args)
 | 
						|
{
 | 
						|
    /*
 | 
						|
     * This HCALL is not required, L1 KVM will take a slow path and walk the
 | 
						|
     * page tables manually to do the data copy.
 | 
						|
     */
 | 
						|
    return H_FUNCTION;
 | 
						|
}
 | 
						|
 | 
						|
static void nested_save_state(struct nested_ppc_state *save, PowerPCCPU *cpu)
 | 
						|
{
 | 
						|
    CPUPPCState *env = &cpu->env;
 | 
						|
 | 
						|
    memcpy(save->gpr, env->gpr, sizeof(save->gpr));
 | 
						|
 | 
						|
    save->lr = env->lr;
 | 
						|
    save->ctr = env->ctr;
 | 
						|
    save->cfar = env->cfar;
 | 
						|
    save->msr = env->msr;
 | 
						|
    save->nip = env->nip;
 | 
						|
 | 
						|
    save->cr = ppc_get_cr(env);
 | 
						|
    save->xer = cpu_read_xer(env);
 | 
						|
 | 
						|
    save->lpcr = env->spr[SPR_LPCR];
 | 
						|
    save->lpidr = env->spr[SPR_LPIDR];
 | 
						|
    save->pcr = env->spr[SPR_PCR];
 | 
						|
    save->dpdes = env->spr[SPR_DPDES];
 | 
						|
    save->hfscr = env->spr[SPR_HFSCR];
 | 
						|
    save->srr0 = env->spr[SPR_SRR0];
 | 
						|
    save->srr1 = env->spr[SPR_SRR1];
 | 
						|
    save->sprg0 = env->spr[SPR_SPRG0];
 | 
						|
    save->sprg1 = env->spr[SPR_SPRG1];
 | 
						|
    save->sprg2 = env->spr[SPR_SPRG2];
 | 
						|
    save->sprg3 = env->spr[SPR_SPRG3];
 | 
						|
    save->pidr = env->spr[SPR_BOOKS_PID];
 | 
						|
    save->ppr = env->spr[SPR_PPR];
 | 
						|
 | 
						|
    save->tb_offset = env->tb_env->tb_offset;
 | 
						|
}
 | 
						|
 | 
						|
static void nested_load_state(PowerPCCPU *cpu, struct nested_ppc_state *load)
 | 
						|
{
 | 
						|
    CPUState *cs = CPU(cpu);
 | 
						|
    CPUPPCState *env = &cpu->env;
 | 
						|
 | 
						|
    memcpy(env->gpr, load->gpr, sizeof(env->gpr));
 | 
						|
 | 
						|
    env->lr = load->lr;
 | 
						|
    env->ctr = load->ctr;
 | 
						|
    env->cfar = load->cfar;
 | 
						|
    env->msr = load->msr;
 | 
						|
    env->nip = load->nip;
 | 
						|
 | 
						|
    ppc_set_cr(env, load->cr);
 | 
						|
    cpu_write_xer(env, load->xer);
 | 
						|
 | 
						|
    env->spr[SPR_LPCR] = load->lpcr;
 | 
						|
    env->spr[SPR_LPIDR] = load->lpidr;
 | 
						|
    env->spr[SPR_PCR] = load->pcr;
 | 
						|
    env->spr[SPR_DPDES] = load->dpdes;
 | 
						|
    env->spr[SPR_HFSCR] = load->hfscr;
 | 
						|
    env->spr[SPR_SRR0] = load->srr0;
 | 
						|
    env->spr[SPR_SRR1] = load->srr1;
 | 
						|
    env->spr[SPR_SPRG0] = load->sprg0;
 | 
						|
    env->spr[SPR_SPRG1] = load->sprg1;
 | 
						|
    env->spr[SPR_SPRG2] = load->sprg2;
 | 
						|
    env->spr[SPR_SPRG3] = load->sprg3;
 | 
						|
    env->spr[SPR_BOOKS_PID] = load->pidr;
 | 
						|
    env->spr[SPR_PPR] = load->ppr;
 | 
						|
 | 
						|
    env->tb_env->tb_offset = load->tb_offset;
 | 
						|
 | 
						|
    /*
 | 
						|
     * MSR updated, compute hflags and possible interrupts.
 | 
						|
     */
 | 
						|
    hreg_compute_hflags(env);
 | 
						|
    ppc_maybe_interrupt(env);
 | 
						|
 | 
						|
    /*
 | 
						|
     * Nested HV does not tag TLB entries between L1 and L2, so must
 | 
						|
     * flush on transition.
 | 
						|
     */
 | 
						|
    tlb_flush(cs);
 | 
						|
    env->reserve_addr = -1; /* Reset the reservation */
 | 
						|
}
 | 
						|
 | 
						|
/*
 | 
						|
 * When this handler returns, the environment is switched to the L2 guest
 | 
						|
 * and TCG begins running that. spapr_exit_nested() performs the switch from
 | 
						|
 * L2 back to L1 and returns from the H_ENTER_NESTED hcall.
 | 
						|
 */
 | 
						|
static target_ulong h_enter_nested(PowerPCCPU *cpu,
 | 
						|
                                   SpaprMachineState *spapr,
 | 
						|
                                   target_ulong opcode,
 | 
						|
                                   target_ulong *args)
 | 
						|
{
 | 
						|
    PowerPCCPUClass *pcc = POWERPC_CPU_GET_CLASS(cpu);
 | 
						|
    CPUPPCState *env = &cpu->env;
 | 
						|
    SpaprCpuState *spapr_cpu = spapr_cpu_state(cpu);
 | 
						|
    struct nested_ppc_state l2_state;
 | 
						|
    target_ulong hv_ptr = args[0];
 | 
						|
    target_ulong regs_ptr = args[1];
 | 
						|
    target_ulong hdec, now = cpu_ppc_load_tbl(env);
 | 
						|
    target_ulong lpcr, lpcr_mask;
 | 
						|
    struct kvmppc_hv_guest_state *hvstate;
 | 
						|
    struct kvmppc_hv_guest_state hv_state;
 | 
						|
    struct kvmppc_pt_regs *regs;
 | 
						|
    hwaddr len;
 | 
						|
 | 
						|
    if (spapr->nested_ptcr == 0) {
 | 
						|
        return H_NOT_AVAILABLE;
 | 
						|
    }
 | 
						|
 | 
						|
    len = sizeof(*hvstate);
 | 
						|
    hvstate = address_space_map(CPU(cpu)->as, hv_ptr, &len, false,
 | 
						|
                                MEMTXATTRS_UNSPECIFIED);
 | 
						|
    if (len != sizeof(*hvstate)) {
 | 
						|
        address_space_unmap(CPU(cpu)->as, hvstate, len, 0, false);
 | 
						|
        return H_PARAMETER;
 | 
						|
    }
 | 
						|
 | 
						|
    memcpy(&hv_state, hvstate, len);
 | 
						|
 | 
						|
    address_space_unmap(CPU(cpu)->as, hvstate, len, len, false);
 | 
						|
 | 
						|
    /*
 | 
						|
     * We accept versions 1 and 2. Version 2 fields are unused because TCG
 | 
						|
     * does not implement DAWR*.
 | 
						|
     */
 | 
						|
    if (hv_state.version > HV_GUEST_STATE_VERSION) {
 | 
						|
        return H_PARAMETER;
 | 
						|
    }
 | 
						|
 | 
						|
    if (hv_state.lpid == 0) {
 | 
						|
        return H_PARAMETER;
 | 
						|
    }
 | 
						|
 | 
						|
    spapr_cpu->nested_host_state = g_try_new(struct nested_ppc_state, 1);
 | 
						|
    if (!spapr_cpu->nested_host_state) {
 | 
						|
        return H_NO_MEM;
 | 
						|
    }
 | 
						|
 | 
						|
    assert(env->spr[SPR_LPIDR] == 0);
 | 
						|
    assert(env->spr[SPR_DPDES] == 0);
 | 
						|
    nested_save_state(spapr_cpu->nested_host_state, cpu);
 | 
						|
 | 
						|
    len = sizeof(*regs);
 | 
						|
    regs = address_space_map(CPU(cpu)->as, regs_ptr, &len, false,
 | 
						|
                                MEMTXATTRS_UNSPECIFIED);
 | 
						|
    if (!regs || len != sizeof(*regs)) {
 | 
						|
        address_space_unmap(CPU(cpu)->as, regs, len, 0, false);
 | 
						|
        g_free(spapr_cpu->nested_host_state);
 | 
						|
        return H_P2;
 | 
						|
    }
 | 
						|
 | 
						|
    len = sizeof(l2_state.gpr);
 | 
						|
    assert(len == sizeof(regs->gpr));
 | 
						|
    memcpy(l2_state.gpr, regs->gpr, len);
 | 
						|
 | 
						|
    l2_state.lr = regs->link;
 | 
						|
    l2_state.ctr = regs->ctr;
 | 
						|
    l2_state.xer = regs->xer;
 | 
						|
    l2_state.cr = regs->ccr;
 | 
						|
    l2_state.msr = regs->msr;
 | 
						|
    l2_state.nip = regs->nip;
 | 
						|
 | 
						|
    address_space_unmap(CPU(cpu)->as, regs, len, len, false);
 | 
						|
 | 
						|
    l2_state.cfar = hv_state.cfar;
 | 
						|
    l2_state.lpidr = hv_state.lpid;
 | 
						|
 | 
						|
    lpcr_mask = LPCR_DPFD | LPCR_ILE | LPCR_AIL | LPCR_LD | LPCR_MER;
 | 
						|
    lpcr = (env->spr[SPR_LPCR] & ~lpcr_mask) | (hv_state.lpcr & lpcr_mask);
 | 
						|
    lpcr |= LPCR_HR | LPCR_UPRT | LPCR_GTSE | LPCR_HVICE | LPCR_HDICE;
 | 
						|
    lpcr &= ~LPCR_LPES0;
 | 
						|
    l2_state.lpcr = lpcr & pcc->lpcr_mask;
 | 
						|
 | 
						|
    l2_state.pcr = hv_state.pcr;
 | 
						|
    /* hv_state.amor is not used */
 | 
						|
    l2_state.dpdes = hv_state.dpdes;
 | 
						|
    l2_state.hfscr = hv_state.hfscr;
 | 
						|
    /* TCG does not implement DAWR*, CIABR, PURR, SPURR, IC, VTB, HEIR SPRs*/
 | 
						|
    l2_state.srr0 = hv_state.srr0;
 | 
						|
    l2_state.srr1 = hv_state.srr1;
 | 
						|
    l2_state.sprg0 = hv_state.sprg[0];
 | 
						|
    l2_state.sprg1 = hv_state.sprg[1];
 | 
						|
    l2_state.sprg2 = hv_state.sprg[2];
 | 
						|
    l2_state.sprg3 = hv_state.sprg[3];
 | 
						|
    l2_state.pidr = hv_state.pidr;
 | 
						|
    l2_state.ppr = hv_state.ppr;
 | 
						|
    l2_state.tb_offset = env->tb_env->tb_offset + hv_state.tb_offset;
 | 
						|
 | 
						|
    /*
 | 
						|
     * Switch to the nested guest environment and start the "hdec" timer.
 | 
						|
     */
 | 
						|
    nested_load_state(cpu, &l2_state);
 | 
						|
 | 
						|
    hdec = hv_state.hdec_expiry - now;
 | 
						|
    cpu_ppc_hdecr_init(env);
 | 
						|
    cpu_ppc_store_hdecr(env, hdec);
 | 
						|
 | 
						|
    /*
 | 
						|
     * The hv_state.vcpu_token is not needed. It is used by the KVM
 | 
						|
     * implementation to remember which L2 vCPU last ran on which physical
 | 
						|
     * CPU so as to invalidate process scope translations if it is moved
 | 
						|
     * between physical CPUs. For now TLBs are always flushed on L1<->L2
 | 
						|
     * transitions so this is not a problem.
 | 
						|
     *
 | 
						|
     * Could validate that the same vcpu_token does not attempt to run on
 | 
						|
     * different L1 vCPUs at the same time, but that would be a L1 KVM bug
 | 
						|
     * and it's not obviously worth a new data structure to do it.
 | 
						|
     */
 | 
						|
 | 
						|
    spapr_cpu->in_nested = true;
 | 
						|
 | 
						|
    /*
 | 
						|
     * The spapr hcall helper sets env->gpr[3] to the return value, but at
 | 
						|
     * this point the L1 is not returning from the hcall but rather we
 | 
						|
     * start running the L2, so r3 must not be clobbered, so return env->gpr[3]
 | 
						|
     * to leave it unchanged.
 | 
						|
     */
 | 
						|
    return env->gpr[3];
 | 
						|
}
 | 
						|
 | 
						|
void spapr_exit_nested(PowerPCCPU *cpu, int excp)
 | 
						|
{
 | 
						|
    CPUPPCState *env = &cpu->env;
 | 
						|
    SpaprCpuState *spapr_cpu = spapr_cpu_state(cpu);
 | 
						|
    struct nested_ppc_state l2_state;
 | 
						|
    target_ulong hv_ptr = spapr_cpu->nested_host_state->gpr[4];
 | 
						|
    target_ulong regs_ptr = spapr_cpu->nested_host_state->gpr[5];
 | 
						|
    target_ulong hsrr0, hsrr1, hdar, asdr, hdsisr;
 | 
						|
    struct kvmppc_hv_guest_state *hvstate;
 | 
						|
    struct kvmppc_pt_regs *regs;
 | 
						|
    hwaddr len;
 | 
						|
 | 
						|
    assert(spapr_cpu->in_nested);
 | 
						|
 | 
						|
    nested_save_state(&l2_state, cpu);
 | 
						|
    hsrr0 = env->spr[SPR_HSRR0];
 | 
						|
    hsrr1 = env->spr[SPR_HSRR1];
 | 
						|
    hdar = env->spr[SPR_HDAR];
 | 
						|
    hdsisr = env->spr[SPR_HDSISR];
 | 
						|
    asdr = env->spr[SPR_ASDR];
 | 
						|
 | 
						|
    /*
 | 
						|
     * Switch back to the host environment (including for any error).
 | 
						|
     */
 | 
						|
    assert(env->spr[SPR_LPIDR] != 0);
 | 
						|
    nested_load_state(cpu, spapr_cpu->nested_host_state);
 | 
						|
    env->gpr[3] = env->excp_vectors[excp]; /* hcall return value */
 | 
						|
 | 
						|
    cpu_ppc_hdecr_exit(env);
 | 
						|
 | 
						|
    spapr_cpu->in_nested = false;
 | 
						|
 | 
						|
    g_free(spapr_cpu->nested_host_state);
 | 
						|
    spapr_cpu->nested_host_state = NULL;
 | 
						|
 | 
						|
    len = sizeof(*hvstate);
 | 
						|
    hvstate = address_space_map(CPU(cpu)->as, hv_ptr, &len, true,
 | 
						|
                                MEMTXATTRS_UNSPECIFIED);
 | 
						|
    if (len != sizeof(*hvstate)) {
 | 
						|
        address_space_unmap(CPU(cpu)->as, hvstate, len, 0, true);
 | 
						|
        env->gpr[3] = H_PARAMETER;
 | 
						|
        return;
 | 
						|
    }
 | 
						|
 | 
						|
    hvstate->cfar = l2_state.cfar;
 | 
						|
    hvstate->lpcr = l2_state.lpcr;
 | 
						|
    hvstate->pcr = l2_state.pcr;
 | 
						|
    hvstate->dpdes = l2_state.dpdes;
 | 
						|
    hvstate->hfscr = l2_state.hfscr;
 | 
						|
 | 
						|
    if (excp == POWERPC_EXCP_HDSI) {
 | 
						|
        hvstate->hdar = hdar;
 | 
						|
        hvstate->hdsisr = hdsisr;
 | 
						|
        hvstate->asdr = asdr;
 | 
						|
    } else if (excp == POWERPC_EXCP_HISI) {
 | 
						|
        hvstate->asdr = asdr;
 | 
						|
    }
 | 
						|
 | 
						|
    /* HEIR should be implemented for HV mode and saved here. */
 | 
						|
    hvstate->srr0 = l2_state.srr0;
 | 
						|
    hvstate->srr1 = l2_state.srr1;
 | 
						|
    hvstate->sprg[0] = l2_state.sprg0;
 | 
						|
    hvstate->sprg[1] = l2_state.sprg1;
 | 
						|
    hvstate->sprg[2] = l2_state.sprg2;
 | 
						|
    hvstate->sprg[3] = l2_state.sprg3;
 | 
						|
    hvstate->pidr = l2_state.pidr;
 | 
						|
    hvstate->ppr = l2_state.ppr;
 | 
						|
 | 
						|
    /* Is it okay to specify write length larger than actual data written? */
 | 
						|
    address_space_unmap(CPU(cpu)->as, hvstate, len, len, true);
 | 
						|
 | 
						|
    len = sizeof(*regs);
 | 
						|
    regs = address_space_map(CPU(cpu)->as, regs_ptr, &len, true,
 | 
						|
                                MEMTXATTRS_UNSPECIFIED);
 | 
						|
    if (!regs || len != sizeof(*regs)) {
 | 
						|
        address_space_unmap(CPU(cpu)->as, regs, len, 0, true);
 | 
						|
        env->gpr[3] = H_P2;
 | 
						|
        return;
 | 
						|
    }
 | 
						|
 | 
						|
    len = sizeof(env->gpr);
 | 
						|
    assert(len == sizeof(regs->gpr));
 | 
						|
    memcpy(regs->gpr, l2_state.gpr, len);
 | 
						|
 | 
						|
    regs->link = l2_state.lr;
 | 
						|
    regs->ctr = l2_state.ctr;
 | 
						|
    regs->xer = l2_state.xer;
 | 
						|
    regs->ccr = l2_state.cr;
 | 
						|
 | 
						|
    if (excp == POWERPC_EXCP_MCHECK ||
 | 
						|
        excp == POWERPC_EXCP_RESET ||
 | 
						|
        excp == POWERPC_EXCP_SYSCALL) {
 | 
						|
        regs->nip = l2_state.srr0;
 | 
						|
        regs->msr = l2_state.srr1 & env->msr_mask;
 | 
						|
    } else {
 | 
						|
        regs->nip = hsrr0;
 | 
						|
        regs->msr = hsrr1 & env->msr_mask;
 | 
						|
    }
 | 
						|
 | 
						|
    /* Is it okay to specify write length larger than actual data written? */
 | 
						|
    address_space_unmap(CPU(cpu)->as, regs, len, len, true);
 | 
						|
}
 | 
						|
 | 
						|
void spapr_register_nested(void)
 | 
						|
{
 | 
						|
    spapr_register_hypercall(KVMPPC_H_SET_PARTITION_TABLE, h_set_ptbl);
 | 
						|
    spapr_register_hypercall(KVMPPC_H_ENTER_NESTED, h_enter_nested);
 | 
						|
    spapr_register_hypercall(KVMPPC_H_TLB_INVALIDATE, h_tlb_invalidate);
 | 
						|
    spapr_register_hypercall(KVMPPC_H_COPY_TOFROM_GUEST, h_copy_tofrom_guest);
 | 
						|
}
 | 
						|
#else
 | 
						|
void spapr_exit_nested(PowerPCCPU *cpu, int excp)
 | 
						|
{
 | 
						|
    g_assert_not_reached();
 | 
						|
}
 | 
						|
 | 
						|
void spapr_register_nested(void)
 | 
						|
{
 | 
						|
    /* DO NOTHING */
 | 
						|
}
 | 
						|
#endif
 |